Home Reference Source

src/utils/vttparser.js

  1. /*
  2. * Source: https://github.com/mozilla/vtt.js/blob/master/dist/vtt.js#L1716
  3. */
  4.  
  5. import VTTCue from './vttcue';
  6.  
  7. const StringDecoder = function StringDecoder () {
  8. return {
  9. decode: function (data) {
  10. if (!data) {
  11. return '';
  12. }
  13.  
  14. if (typeof data !== 'string') {
  15. throw new Error('Error - expected string data.');
  16. }
  17.  
  18. return decodeURIComponent(encodeURIComponent(data));
  19. }
  20. };
  21. };
  22.  
  23. function VTTParser () {
  24. this.window = window;
  25. this.state = 'INITIAL';
  26. this.buffer = '';
  27. this.decoder = new StringDecoder();
  28. this.regionList = [];
  29. }
  30.  
  31. // Try to parse input as a time stamp.
  32. function parseTimeStamp (input) {
  33. function computeSeconds (h, m, s, f) {
  34. return (h | 0) * 3600 + (m | 0) * 60 + (s | 0) + (f | 0) / 1000;
  35. }
  36.  
  37. let m = input.match(/^(\d+):(\d{2})(:\d{2})?\.(\d{3})/);
  38. if (!m) {
  39. return null;
  40. }
  41.  
  42. if (m[3]) {
  43. // Timestamp takes the form of [hours]:[minutes]:[seconds].[milliseconds]
  44. return computeSeconds(m[1], m[2], m[3].replace(':', ''), m[4]);
  45. } else if (m[1] > 59) {
  46. // Timestamp takes the form of [hours]:[minutes].[milliseconds]
  47. // First position is hours as it's over 59.
  48. return computeSeconds(m[1], m[2], 0, m[4]);
  49. } else {
  50. // Timestamp takes the form of [minutes]:[seconds].[milliseconds]
  51. return computeSeconds(0, m[1], m[2], m[4]);
  52. }
  53. }
  54.  
  55. // A settings object holds key/value pairs and will ignore anything but the first
  56. // assignment to a specific key.
  57. function Settings () {
  58. this.values = Object.create(null);
  59. }
  60.  
  61. Settings.prototype = {
  62. // Only accept the first assignment to any key.
  63. set: function (k, v) {
  64. if (!this.get(k) && v !== '') {
  65. this.values[k] = v;
  66. }
  67. },
  68. // Return the value for a key, or a default value.
  69. // If 'defaultKey' is passed then 'dflt' is assumed to be an object with
  70. // a number of possible default values as properties where 'defaultKey' is
  71. // the key of the property that will be chosen; otherwise it's assumed to be
  72. // a single value.
  73. get: function (k, dflt, defaultKey) {
  74. if (defaultKey) {
  75. return this.has(k) ? this.values[k] : dflt[defaultKey];
  76. }
  77.  
  78. return this.has(k) ? this.values[k] : dflt;
  79. },
  80. // Check whether we have a value for a key.
  81. has: function (k) {
  82. return k in this.values;
  83. },
  84. // Accept a setting if its one of the given alternatives.
  85. alt: function (k, v, a) {
  86. for (let n = 0; n < a.length; ++n) {
  87. if (v === a[n]) {
  88. this.set(k, v);
  89. break;
  90. }
  91. }
  92. },
  93. // Accept a setting if its a valid (signed) integer.
  94. integer: function (k, v) {
  95. if (/^-?\d+$/.test(v)) { // integer
  96. this.set(k, parseInt(v, 10));
  97. }
  98. },
  99. // Accept a setting if its a valid percentage.
  100. percent: function (k, v) {
  101. let m;
  102. if ((m = v.match(/^([\d]{1,3})(\.[\d]*)?%$/))) {
  103. v = parseFloat(v);
  104. if (v >= 0 && v <= 100) {
  105. this.set(k, v);
  106. return true;
  107. }
  108. }
  109. return false;
  110. }
  111. };
  112.  
  113. // Helper function to parse input into groups separated by 'groupDelim', and
  114. // interprete each group as a key/value pair separated by 'keyValueDelim'.
  115. function parseOptions (input, callback, keyValueDelim, groupDelim) {
  116. let groups = groupDelim ? input.split(groupDelim) : [input];
  117. for (let i in groups) {
  118. if (typeof groups[i] !== 'string') {
  119. continue;
  120. }
  121.  
  122. let kv = groups[i].split(keyValueDelim);
  123. if (kv.length !== 2) {
  124. continue;
  125. }
  126.  
  127. let k = kv[0];
  128. let v = kv[1];
  129. callback(k, v);
  130. }
  131. }
  132.  
  133. let defaults = new VTTCue(0, 0, 0);
  134. // 'middle' was changed to 'center' in the spec: https://github.com/w3c/webvtt/pull/244
  135. // Safari doesn't yet support this change, but FF and Chrome do.
  136. let center = defaults.align === 'middle' ? 'middle' : 'center';
  137.  
  138. function parseCue (input, cue, regionList) {
  139. // Remember the original input if we need to throw an error.
  140. let oInput = input;
  141. // 4.1 WebVTT timestamp
  142. function consumeTimeStamp () {
  143. let ts = parseTimeStamp(input);
  144. if (ts === null) {
  145. throw new Error('Malformed timestamp: ' + oInput);
  146. }
  147.  
  148. // Remove time stamp from input.
  149. input = input.replace(/^[^\sa-zA-Z-]+/, '');
  150. return ts;
  151. }
  152.  
  153. // 4.4.2 WebVTT cue settings
  154. function consumeCueSettings (input, cue) {
  155. let settings = new Settings();
  156.  
  157. parseOptions(input, function (k, v) {
  158. switch (k) {
  159. case 'region':
  160. // Find the last region we parsed with the same region id.
  161. for (let i = regionList.length - 1; i >= 0; i--) {
  162. if (regionList[i].id === v) {
  163. settings.set(k, regionList[i].region);
  164. break;
  165. }
  166. }
  167. break;
  168. case 'vertical':
  169. settings.alt(k, v, ['rl', 'lr']);
  170. break;
  171. case 'line':
  172. var vals = v.split(','),
  173. vals0 = vals[0];
  174. settings.integer(k, vals0);
  175. if (settings.percent(k, vals0)) {
  176. settings.set('snapToLines', false);
  177. }
  178.  
  179. settings.alt(k, vals0, ['auto']);
  180. if (vals.length === 2) {
  181. settings.alt('lineAlign', vals[1], ['start', center, 'end']);
  182. }
  183.  
  184. break;
  185. case 'position':
  186. vals = v.split(',');
  187. settings.percent(k, vals[0]);
  188. if (vals.length === 2) {
  189. settings.alt('positionAlign', vals[1], ['start', center, 'end', 'line-left', 'line-right', 'auto']);
  190. }
  191.  
  192. break;
  193. case 'size':
  194. settings.percent(k, v);
  195. break;
  196. case 'align':
  197. settings.alt(k, v, ['start', center, 'end', 'left', 'right']);
  198. break;
  199. }
  200. }, /:/, /\s/);
  201.  
  202. // Apply default values for any missing fields.
  203. cue.region = settings.get('region', null);
  204. cue.vertical = settings.get('vertical', '');
  205. let line = settings.get('line', 'auto');
  206. if (line === 'auto' && defaults.line === -1) {
  207. // set numeric line number for Safari
  208. line = -1;
  209. }
  210. cue.line = line;
  211. cue.lineAlign = settings.get('lineAlign', 'start');
  212. cue.snapToLines = settings.get('snapToLines', true);
  213. cue.size = settings.get('size', 100);
  214. cue.align = settings.get('align', center);
  215. let position = settings.get('position', 'auto');
  216. if (position === 'auto' && defaults.position === 50) {
  217. // set numeric position for Safari
  218. position = cue.align === 'start' || cue.align === 'left' ? 0 : cue.align === 'end' || cue.align === 'right' ? 100 : 50;
  219. }
  220. cue.position = position;
  221. }
  222.  
  223. function skipWhitespace () {
  224. input = input.replace(/^\s+/, '');
  225. }
  226.  
  227. // 4.1 WebVTT cue timings.
  228. skipWhitespace();
  229. cue.startTime = consumeTimeStamp(); // (1) collect cue start time
  230. skipWhitespace();
  231. if (input.substr(0, 3) !== '-->') { // (3) next characters must match '-->'
  232. throw new Error('Malformed time stamp (time stamps must be separated by \'-->\'): ' +
  233. oInput);
  234. }
  235. input = input.substr(3);
  236. skipWhitespace();
  237. cue.endTime = consumeTimeStamp(); // (5) collect cue end time
  238.  
  239. // 4.1 WebVTT cue settings list.
  240. skipWhitespace();
  241. consumeCueSettings(input, cue);
  242. }
  243.  
  244. function fixLineBreaks (input) {
  245. return input.replace(/<br(?: \/)?>/gi, '\n');
  246. }
  247.  
  248. VTTParser.prototype = {
  249. parse: function (data) {
  250. let self = this;
  251.  
  252. // If there is no data then we won't decode it, but will just try to parse
  253. // whatever is in buffer already. This may occur in circumstances, for
  254. // example when flush() is called.
  255. if (data) {
  256. // Try to decode the data that we received.
  257. self.buffer += self.decoder.decode(data, { stream: true });
  258. }
  259.  
  260. function collectNextLine () {
  261. let buffer = self.buffer;
  262. let pos = 0;
  263.  
  264. buffer = fixLineBreaks(buffer);
  265.  
  266. while (pos < buffer.length && buffer[pos] !== '\r' && buffer[pos] !== '\n') {
  267. ++pos;
  268. }
  269.  
  270. let line = buffer.substr(0, pos);
  271. // Advance the buffer early in case we fail below.
  272. if (buffer[pos] === '\r') {
  273. ++pos;
  274. }
  275.  
  276. if (buffer[pos] === '\n') {
  277. ++pos;
  278. }
  279.  
  280. self.buffer = buffer.substr(pos);
  281. return line;
  282. }
  283.  
  284. // 3.2 WebVTT metadata header syntax
  285. function parseHeader (input) {
  286. parseOptions(input, function (k, v) {
  287. switch (k) {
  288. case 'Region':
  289. // 3.3 WebVTT region metadata header syntax
  290. // console.log('parse region', v);
  291. // parseRegion(v);
  292. break;
  293. }
  294. }, /:/);
  295. }
  296.  
  297. // 5.1 WebVTT file parsing.
  298. try {
  299. let line;
  300. if (self.state === 'INITIAL') {
  301. // We can't start parsing until we have the first line.
  302. if (!/\r\n|\n/.test(self.buffer)) {
  303. return this;
  304. }
  305.  
  306. line = collectNextLine();
  307. // strip of UTF-8 BOM if any
  308. // https://en.wikipedia.org/wiki/Byte_order_mark#UTF-8
  309. let m = line.match(/^()?WEBVTT([ \t].*)?$/);
  310. if (!m || !m[0]) {
  311. throw new Error('Malformed WebVTT signature.');
  312. }
  313.  
  314. self.state = 'HEADER';
  315. }
  316.  
  317. let alreadyCollectedLine = false;
  318. while (self.buffer) {
  319. // We can't parse a line until we have the full line.
  320. if (!/\r\n|\n/.test(self.buffer)) {
  321. return this;
  322. }
  323.  
  324. if (!alreadyCollectedLine) {
  325. line = collectNextLine();
  326. } else {
  327. alreadyCollectedLine = false;
  328. }
  329.  
  330. switch (self.state) {
  331. case 'HEADER':
  332. // 13-18 - Allow a header (metadata) under the WEBVTT line.
  333. if (/:/.test(line)) {
  334. parseHeader(line);
  335. } else if (!line) {
  336. // An empty line terminates the header and starts the body (cues).
  337. self.state = 'ID';
  338. }
  339. continue;
  340. case 'NOTE':
  341. // Ignore NOTE blocks.
  342. if (!line) {
  343. self.state = 'ID';
  344. }
  345.  
  346. continue;
  347. case 'ID':
  348. // Check for the start of NOTE blocks.
  349. if (/^NOTE($|[ \t])/.test(line)) {
  350. self.state = 'NOTE';
  351. break;
  352. }
  353. // 19-29 - Allow any number of line terminators, then initialize new cue values.
  354. if (!line) {
  355. continue;
  356. }
  357.  
  358. self.cue = new VTTCue(0, 0, '');
  359. self.state = 'CUE';
  360. // 30-39 - Check if self line contains an optional identifier or timing data.
  361. if (line.indexOf('-->') === -1) {
  362. self.cue.id = line;
  363. continue;
  364. }
  365. // Process line as start of a cue.
  366. /* falls through */
  367. case 'CUE':
  368. // 40 - Collect cue timings and settings.
  369. try {
  370. parseCue(line, self.cue, self.regionList);
  371. } catch (e) {
  372. // In case of an error ignore rest of the cue.
  373. self.cue = null;
  374. self.state = 'BADCUE';
  375. continue;
  376. }
  377. self.state = 'CUETEXT';
  378. continue;
  379. case 'CUETEXT':
  380. var hasSubstring = line.indexOf('-->') !== -1;
  381. // 34 - If we have an empty line then report the cue.
  382. // 35 - If we have the special substring '-->' then report the cue,
  383. // but do not collect the line as we need to process the current
  384. // one as a new cue.
  385. if (!line || hasSubstring && (alreadyCollectedLine = true)) {
  386. // We are done parsing self cue.
  387. if (self.oncue) {
  388. self.oncue(self.cue);
  389. }
  390.  
  391. self.cue = null;
  392. self.state = 'ID';
  393. continue;
  394. }
  395. if (self.cue.text) {
  396. self.cue.text += '\n';
  397. }
  398.  
  399. self.cue.text += line;
  400. continue;
  401. case 'BADCUE': // BADCUE
  402. // 54-62 - Collect and discard the remaining cue.
  403. if (!line) {
  404. self.state = 'ID';
  405. }
  406.  
  407. continue;
  408. }
  409. }
  410. } catch (e) {
  411. // If we are currently parsing a cue, report what we have.
  412. if (self.state === 'CUETEXT' && self.cue && self.oncue) {
  413. self.oncue(self.cue);
  414. }
  415.  
  416. self.cue = null;
  417. // Enter BADWEBVTT state if header was not parsed correctly otherwise
  418. // another exception occurred so enter BADCUE state.
  419. self.state = self.state === 'INITIAL' ? 'BADWEBVTT' : 'BADCUE';
  420. }
  421. return this;
  422. },
  423. flush: function () {
  424. let self = this;
  425. try {
  426. // Finish decoding the stream.
  427. self.buffer += self.decoder.decode();
  428. // Synthesize the end of the current cue or region.
  429. if (self.cue || self.state === 'HEADER') {
  430. self.buffer += '\n\n';
  431. self.parse();
  432. }
  433. // If we've flushed, parsed, and we're still on the INITIAL state then
  434. // that means we don't have enough of the stream to parse the first
  435. // line.
  436. if (self.state === 'INITIAL') {
  437. throw new Error('Malformed WebVTT signature.');
  438. }
  439. } catch (e) {
  440. throw e;
  441. }
  442. if (self.onflush) {
  443. self.onflush();
  444. }
  445.  
  446. return this;
  447. }
  448. };
  449.  
  450. export { fixLineBreaks };
  451.  
  452. export default VTTParser;