Home Reference Source

src/utils/imsc1-ttml-parser.ts

  1. import { findBox } from './mp4-tools';
  2. import { parseTimeStamp } from './vttparser';
  3. import VTTCue from './vttcue';
  4. import { utf8ArrayToStr } from '../demux/id3';
  5. import { toTimescaleFromScale } from './timescale-conversion';
  6. import { generateCueId } from './webvtt-parser';
  7.  
  8. export const IMSC1_CODEC = 'stpp.ttml.im1t';
  9.  
  10. // Time format: h:m:s:frames(.subframes)
  11. const HMSF_REGEX = /^(\d{2,}):(\d{2}):(\d{2}):(\d{2})\.?(\d+)?$/;
  12.  
  13. // Time format: hours, minutes, seconds, milliseconds, frames, ticks
  14. const TIME_UNIT_REGEX = /^(\d*(?:\.\d*)?)(h|m|s|ms|f|t)$/;
  15.  
  16. export function parseIMSC1(
  17. payload: ArrayBuffer,
  18. initPTS: number,
  19. timescale: number,
  20. callBack: (cues: Array<VTTCue>) => any,
  21. errorCallBack: (error: Error) => any
  22. ) {
  23. const results = findBox(new Uint8Array(payload), ['mdat']);
  24. if (results.length === 0) {
  25. errorCallBack(new Error('Could not parse IMSC1 mdat'));
  26. return;
  27. }
  28. const mdat = results[0];
  29. const ttml = utf8ArrayToStr(
  30. new Uint8Array(payload, mdat.start, mdat.end - mdat.start)
  31. );
  32. const syncTime = toTimescaleFromScale(initPTS, 1, timescale);
  33.  
  34. try {
  35. callBack(parseTTML(ttml, syncTime));
  36. } catch (error) {
  37. errorCallBack(error);
  38. }
  39. }
  40.  
  41. function parseTTML(ttml: string, syncTime: number): Array<VTTCue> {
  42. const parser = new DOMParser();
  43. const xmlDoc = parser.parseFromString(ttml, 'text/xml');
  44. const tt = xmlDoc.getElementsByTagName('tt')[0];
  45. if (!tt) {
  46. throw new Error('Invalid ttml');
  47. }
  48. const defaultRateInfo = {
  49. frameRate: 30,
  50. subFrameRate: 1,
  51. frameRateMultiplier: 0,
  52. tickRate: 0,
  53. };
  54. const rateInfo: Object = Object.keys(defaultRateInfo).reduce(
  55. (result, key) => {
  56. result[key] = tt.getAttribute(`ttp:${key}`) || defaultRateInfo[key];
  57. return result;
  58. },
  59. {}
  60. );
  61.  
  62. const trim = tt.getAttribute('xml:space') !== 'preserve';
  63.  
  64. const styleElements = collectionToDictionary(
  65. getElementCollection(tt, 'styling', 'style')
  66. );
  67. const regionElements = collectionToDictionary(
  68. getElementCollection(tt, 'layout', 'region')
  69. );
  70. const cueElements = getElementCollection(tt, 'body', '[begin]');
  71.  
  72. return [].map
  73. .call(cueElements, (cueElement) => {
  74. const cueText = getTextContent(cueElement, trim);
  75.  
  76. if (!cueText || !cueElement.hasAttribute('begin')) {
  77. return null;
  78. }
  79. const startTime = parseTtmlTime(
  80. cueElement.getAttribute('begin'),
  81. rateInfo
  82. );
  83. const duration = parseTtmlTime(cueElement.getAttribute('dur'), rateInfo);
  84. let endTime = parseTtmlTime(cueElement.getAttribute('end'), rateInfo);
  85. if (startTime === null) {
  86. throw timestampParsingError(cueElement);
  87. }
  88. if (endTime === null) {
  89. if (duration === null) {
  90. throw timestampParsingError(cueElement);
  91. }
  92. endTime = startTime + duration;
  93. }
  94. const cue = new VTTCue(startTime - syncTime, endTime - syncTime, cueText);
  95. cue.id = generateCueId(cue.startTime, cue.endTime, cue.text);
  96.  
  97. const region = regionElements[cueElement.getAttribute('region')];
  98. const style = styleElements[cueElement.getAttribute('style')];
  99.  
  100. // TODO: Add regions to track and cue (origin and extend)
  101. // These values are hard-coded (for now) to simulate region settings in the demo
  102. cue.position = 10;
  103. cue.size = 80;
  104.  
  105. // Apply styles to cue
  106. const styles = getTtmlStyles(region, style);
  107. const { textAlign } = styles;
  108. if (textAlign) {
  109. // cue.positionAlign not settable in FF~2016
  110. cue.lineAlign = {
  111. left: 'start',
  112. center: 'center',
  113. right: 'end',
  114. start: 'start',
  115. end: 'end',
  116. }[textAlign];
  117. cue.align = textAlign as AlignSetting;
  118. }
  119. Object.assign(cue, styles);
  120.  
  121. return cue;
  122. })
  123. .filter((cue) => cue !== null);
  124. }
  125.  
  126. function getElementCollection(
  127. fromElement,
  128. parentName,
  129. childName
  130. ): Array<HTMLElement> {
  131. const parent = fromElement.getElementsByTagName(parentName)[0];
  132. if (parent) {
  133. return [].slice.call(parent.querySelectorAll(childName));
  134. }
  135. return [];
  136. }
  137.  
  138. function collectionToDictionary(
  139. elementsWithId: Array<HTMLElement>
  140. ): { [id: string]: HTMLElement } {
  141. return elementsWithId.reduce((dict, element: HTMLElement) => {
  142. const id = element.getAttribute('xml:id');
  143. if (id) {
  144. dict[id] = element;
  145. }
  146. return dict;
  147. }, {});
  148. }
  149.  
  150. function getTextContent(element, trim): string {
  151. return [].slice.call(element.childNodes).reduce((str, node, i) => {
  152. if (node.nodeName === 'br' && i) {
  153. return str + '\n';
  154. }
  155. if (node.childNodes?.length) {
  156. return getTextContent(node, trim);
  157. } else if (trim) {
  158. return str + node.textContent.trim().replace(/\s+/g, ' ');
  159. }
  160. return str + node.textContent;
  161. }, '');
  162. }
  163.  
  164. function getTtmlStyles(region, style): { [style: string]: string } {
  165. const ttsNs = 'http://www.w3.org/ns/ttml#styling';
  166. const styleAttributes = [
  167. 'displayAlign',
  168. 'textAlign',
  169. 'color',
  170. 'backgroundColor',
  171. 'fontSize',
  172. 'fontFamily',
  173. // 'fontWeight',
  174. // 'lineHeight',
  175. // 'wrapOption',
  176. // 'fontStyle',
  177. // 'direction',
  178. // 'writingMode'
  179. ];
  180. return styleAttributes.reduce((styles, name) => {
  181. const value =
  182. getAttributeNS(style, ttsNs, name) || getAttributeNS(region, ttsNs, name);
  183. if (value) {
  184. styles[name] = value;
  185. }
  186. return styles;
  187. }, {});
  188. }
  189.  
  190. function getAttributeNS(element, ns, name): string | null {
  191. return element.hasAttributeNS(ns, name)
  192. ? element.getAttributeNS(ns, name)
  193. : null;
  194. }
  195.  
  196. function timestampParsingError(node) {
  197. return new Error(`Could not parse ttml timestamp ${node}`);
  198. }
  199.  
  200. function parseTtmlTime(timeAttributeValue, rateInfo): number | null {
  201. if (!timeAttributeValue) {
  202. return null;
  203. }
  204. let seconds: number | null = parseTimeStamp(timeAttributeValue);
  205. if (seconds === null) {
  206. if (HMSF_REGEX.test(timeAttributeValue)) {
  207. seconds = parseHoursMinutesSecondsFrames(timeAttributeValue, rateInfo);
  208. } else if (TIME_UNIT_REGEX.test(timeAttributeValue)) {
  209. seconds = parseTimeUnits(timeAttributeValue, rateInfo);
  210. }
  211. }
  212. return seconds;
  213. }
  214.  
  215. function parseHoursMinutesSecondsFrames(timeAttributeValue, rateInfo): number {
  216. const m = HMSF_REGEX.exec(timeAttributeValue) as Array<any>;
  217. const frames = (m[4] | 0) + (m[5] | 0) / rateInfo.subFrameRate;
  218. return (
  219. (m[1] | 0) * 3600 +
  220. (m[2] | 0) * 60 +
  221. (m[3] | 0) +
  222. frames / rateInfo.frameRate
  223. );
  224. }
  225.  
  226. function parseTimeUnits(timeAttributeValue, rateInfo): number {
  227. const m = TIME_UNIT_REGEX.exec(timeAttributeValue) as Array<any>;
  228. const value = Number(m[1]);
  229. const unit = m[2];
  230. switch (unit) {
  231. case 'h':
  232. return value * 3600;
  233. case 'm':
  234. return value * 60;
  235. case 'ms':
  236. return value * 1000;
  237. case 'f':
  238. return value / rateInfo.frameRate;
  239. case 't':
  240. return value / rateInfo.tickRate;
  241. }
  242. return value;
  243. }