Skip welcome & menu and move to editor
Welcome to JS Bin
Load cached copy from
 
<html lang="en">
<head>
    <meta charset=utf-8>
    <title>HTML5 Video WebVTT Example</title>
</head>
<body>
    <section id="all">
 <h1>Using the track API to extract the content of webVTT files in <code>&lt;track&gt;</code> elements</h1>
 <p>Click on the buttons under the video to extract the english or german
    subtitles</p>
 <p>Look at the HTML and JS code.</p>
    <video preload="metadata" controls crossOrigin="anonymous" >
    <source src="https://mainline.i3s.unice.fr/mooc/elephants-dream-medium.mp4" type="video/mp4">
    <source src="https://mainline.i3s.unice.fr/mooc/elephants-dream-medium.webm" type="video/webm">
    <track label="English subtitles" kind="subtitles" srclang="en"
           src="https://mainline.i3s.unice.fr/mooc/elephants-dream-subtitles-en.vtt" default>
    <track label="Deutsch subtitles" kind="subtitles" srclang="de"
           src="https://mainline.i3s.unice.fr/mooc/elephants-dream-subtitles-de.vtt">
    <track label="English chapters" kind="chapters" srclang="en"
           src="https://mainline.i3s.unice.fr/mooc/elephants-dream-chapters-en.vtt">
    </video>
   <h3>Video Transcript</h3>
   <button onclick="loadTranscript('en');">English</button>
   <button onclick="loadTranscript('de');">Deutsch</button>
    </div>
    <div id="transcript"></div>
  </section>
</body>
</html>
 
#all {
  background-color: lightgrey;
  border-radius:10px;
  padding: 20px;
  border:1px solid;
}
 
// Transcript.js
function loadTranscript(lang) {
  var url = "https://mainline.i3s.unice.fr/mooc/" + 'elephants-dream-subtitles-' + lang + '.vtt';
      
    loadTranscriptFile(url);
}
function loadTranscriptFile(webvttFileUrl) {
    var reqTrans = new XMLHttpRequest();
  
    reqTrans.open('GET', webvttFileUrl);
  
    reqTrans.onload = function(e) {
        
            var pattern = /^([0-9]+)$/;
            var patternTimecode = /^([0-9]{2}:[0-9]{2}:[0-9]{2}[,.]{1}[0-9]{3}) --\> ([0-9]{2}:[0-9]{2}:[0-9]{2}[,.]{1}[0-9]{3})(.*)$/;
            
            var content = this.response; // content of the webVTT file
      
            var lines = content.split(/\r?\n/);
            var transcript = '';
            for (i = 0; i < lines.length; i++) {
                var identifier = pattern.exec(lines[i]);
                if (identifier) {
                    i++;
                    var timecode = patternTimecode.exec(lines[i]);
                    if (timecode && i < lines.length) {
                        i++;
                        var text = lines[i];
                        i++;
                        while (lines[i] !== '' && i < lines.length) {
                            text = text + '\n' + lines[i];
                            i++;
                        }
                        var transText = '';
                        var voices = getVoices(text);
                        if (voices.length > 0) {
                            for (var j = 0; j < voices.length; j++) {
                                transText += voices[j].voice + ': ' + removeHTML(voices[j].text) + '<br />';
                            }
                        }
                        else transText = removeHTML(text) + '<br />';
                        transcript += transText;
                    }
                }
            
            var oTrans = document.getElementById('transcript');
            oTrans.innerHTML = transcript;
        }
    };
    reqTrans.send();
}
function getVoices(speech) {
    var voices = [];
    var pos = speech.indexOf('<v');
  
    while (pos != -1) {
        endVoice = speech.indexOf('>');
        var voice = speech.substring(pos + 2, endVoice).trim();
        var endSpeech = speech.indexOf('</v>');
        var text = speech.substring(endVoice + 1, endSpeech);
        voices.push({
            'voice': voice,
            'text': text
        });
        speech = speech.substring(endSpeech + 4);
        pos = speech.indexOf('<v');
    }
    return voices;
}
function removeHTML(text) {
    var div = document.createElement('div');
    div.innerHTML = text;
    return div.textContent || div.innerText || '';
}
// 
Output

This bin was created anonymously and its free preview time has expired (learn why). — Get a free unrestricted account

Dismiss x
public
Bin info
anonymouspro
0viewers