// Heavily modified from
// https://github.com/nickdesaulniers/netfix/issues/4#issuecomment-578856471
// which was in turn modified from
// https://github.com/nickdesaulniers/netfix/blob/gh-pages/demo/bufferWhenNeeded.html

// Useful reading:
// https://stackoverflow.com/questions/35177797/what-exactly-is-fragmented-mp4fmp4-how-is-it-different-from-normal-mp4
// https://axel.isouard.fr/blog/2016/05/24/streaming-webm-video-over-html5-with-media-source

// We start by parsing the sidx (segment index) table in order to get the
// byte ranges of the segments. The byte range of the sidx table is provided
// by the indexRange variable by YouTube

// Useful info, as well as segments vs sequence mode (we use segments mode)
// https://joshuatz.com/posts/2020/appending-videos-in-javascript-with-mediasource-buffers/

// SourceBuffer data limits:
// https://developers.google.com/web/updates/2017/10/quotaexceedederror

// TODO: Call abort to cancel in-progress appends?

// Merges a separate video source and audio source into one <video> element
// through a MediaSource.
//
// video:     the media element whose `src` is pointed at the MediaSource.
// srcPair:   [videoSource, audioSource]. Each source is read here for
//            `mime_codec` and (optionally) `bitrate`.
// startTime: playback position (seconds) used to pick the first segment to
//            fetch once the segment index is known.
//
// Construction immediately calls setup().
function AVMerge(video, srcPair, startTime){
    this.videoSource = srcPair[0];
    this.audioSource = srcPair[1];

    // Ratio of audio to video bitrate; falls back to 1/10 when either
    // bitrate is missing (or zero).
    if (this.videoSource.bitrate && this.audioSource.bitrate)
        this.avRatio = this.audioSource.bitrate/this.videoSource.bitrate;
    else
        this.avRatio = 1/10;

    this.videoStream = null;
    this.audioStream = null;
    this.seeking = false;
    this.startTime = startTime;
    this.video = video;
    this.mediaSource = null;
    this.closed = false;
    this.opened = false;
    this.audioEndOfStreamCalled = false;
    this.videoEndOfStreamCalled = false;
    this.setup();
}

// Creates the MediaSource and attaches it to the video element, provided the
// browser supports MediaSource and both codecs. Otherwise reports an error
// and leaves this.mediaSource as null.
AVMerge.prototype.setup = function() {
    if ('MediaSource' in window
            && MediaSource.isTypeSupported(this.audioSource['mime_codec'])
            && MediaSource.isTypeSupported(this.videoSource['mime_codec'])) {
        this.mediaSource = new MediaSource();
        this.video.src = URL.createObjectURL(this.mediaSource);
        this.mediaSource.onsourceopen = this.sourceOpen.bind(this);
    } else {
        reportError('Unsupported MIME type or codec: ',
                    this.audioSource['mime_codec'],
                    this.videoSource['mime_codec']);
    }
};
// Handler for the MediaSource 'sourceopen' event: creates and starts both
// streams and hooks the video element's 'timeupdate' and 'seeking' events.
AVMerge.prototype.sourceOpen = function(_) {
    // If after calling mediaSource.endOfStream, the user seeks back
    // into the video, the sourceOpen event will be fired again. Do not
    // overwrite the streams.
    this.audioEndOfStreamCalled = false;
    this.videoEndOfStreamCalled = false;
    if (this.opened)
        return;
    this.opened = true;
    this.videoStream = new Stream(this, this.videoSource, this.startTime,
                                  this.avRatio);
    this.audioStream = new Stream(this, this.audioSource, this.startTime,
                                  this.avRatio);

    this.videoStream.setup();
    this.audioStream.setup();

    this.timeUpdateEvt = addEvent(this.video, 'timeupdate',
                                  this.checkBothBuffers.bind(this));
    // Seeking is debounced so dragging the seek bar does not trigger a
    // fetch for every intermediate position.
    this.seekingEvt = addEvent(this.video, 'seeking',
                               debounce(this.seek.bind(this), 500));
};

// Tears everything down. Safe to call more than once, and safe to call
// when setup() failed or 'sourceopen' never fired (in which case there are
// no streams or listeners to remove).
AVMerge.prototype.close = function() {
    if (this.closed)
        return;
    this.closed = true;
    if (this.opened) {
        this.videoStream.close();
        this.audioStream.close();
        this.timeUpdateEvt.remove();
        this.seekingEvt.remove();
    }
    if (this.mediaSource && this.mediaSource.readyState === 'open')
        this.mediaSource.endOfStream();
};

// 'timeupdate' handler: lets each stream top up its buffer.
AVMerge.prototype.checkBothBuffers = function() {
    this.audioStream.checkBuffer();
    this.videoStream.checkBuffer();
};

// (Debounced) 'seeking' handler. this.seeking is true only while the
// streams are handling the seek, so that segments requested by it are
// flagged as forSeek and checkBuffer stays out of the way.
AVMerge.prototype.seek = function(e) {
    if (this.mediaSource.readyState === 'open') {
        this.seeking = true;
        this.audioStream.handleSeek();
        this.videoStream.handleSeek();
        this.seeking = false;
    } else {
        reportWarning('seek but not open? readyState:',
                      this.mediaSource.readyState);
    }
};

// Called by the audio stream when it has every segment up to the end.
// mediaSource.endOfStream() is only called once both streams are done.
AVMerge.prototype.audioEndOfStream = function() {
    if (this.videoEndOfStreamCalled && !this.audioEndOfStreamCalled) {
        reportDebug('Calling mediaSource.endOfStream()');
        this.mediaSource.endOfStream();
    }
    this.audioEndOfStreamCalled = true;
};

// Video counterpart of audioEndOfStream.
AVMerge.prototype.videoEndOfStream = function() {
    if (this.audioEndOfStreamCalled && !this.videoEndOfStreamCalled) {
        reportDebug('Calling mediaSource.endOfStream()');
        this.mediaSource.endOfStream();
    }
    this.videoEndOfStreamCalled = true;
};

// Dumps the current state of the merger and both streams via reportDebug.
AVMerge.prototype.printDebuggingInfo = function() {
    reportDebug('videoSource:', this.videoSource);
    reportDebug('audioSource:', this.audioSource);
    reportDebug('video sidx:', this.videoStream.sidx);
    reportDebug('audio sidx:', this.audioStream.sidx);
    reportDebug('video updating', this.videoStream.sourceBuffer.updating);
    reportDebug('audio updating', this.audioStream.sourceBuffer.updating);
    reportDebug('video duration:', this.video.duration);
    reportDebug('video current time:', this.video.currentTime);
    reportDebug('mediaSource.readyState:', this.mediaSource.readyState);
    reportDebug('videoEndOfStreamCalled', this.videoEndOfStreamCalled);
    reportDebug('audioEndOfStreamCalled', this.audioEndOfStreamCalled);
    for (let obj of [this.videoStream, this.audioStream]) {
        reportDebug(obj.streamType, 'stream buffered times:');
        // NOTE(review): the body of this loop was lost from the reviewed
        // copy of the file (text between "<" and ">" was stripped). It is
        // reconstructed as "print each buffered time range" -- confirm
        // against the upstream file.
        const buffered = obj.sourceBuffer.buffered;
        for (let i = 0; i < buffered.length; i++) {
            reportDebug(String(buffered.start(i)) + '-'
                        + String(buffered.end(i)));
        }
    }
};

// One media stream (audio or video) fed into its own SourceBuffer.
//
// NOTE(review): everything in this constructor above the 'error' listener
// was lost from the reviewed copy of the file (text between "<" and ">" was
// stripped). The field names are taken from how the rest of the file uses
// them; the `source` key names other than 'mime_codec' and the buffer
// target size are ASSUMPTIONS -- confirm against the upstream file.
function Stream(avMerge, source, startTime, avRatio) {
    this.avMerge = avMerge;
    this.video = avMerge.video;
    this.mediaSource = avMerge.mediaSource;
    this.startTime = startTime;
    this.closed = false;
    this.sidx = null;           // parsed segment index, set by setupSegments
    this.appendRetries = 0;
    this.appendQueue = [];      // list of [segmentIdx, forSeek, chunk]

    this.streamType = (source === avMerge.audioSource) ? 'audio' : 'video';
    this.mimeCodec = source['mime_codec'];
    this.url = source['url'];                   // assumed key -- TODO confirm
    // Byte ranges ({start, end}, inclusive) of the initialization segment
    // and of the sidx table.
    this.initRange = source['init_range'];      // assumed key -- TODO confirm
    this.indexRange = source['index_range'];    // assumed key -- TODO confirm

    // Buffering target in bytes; the audio target is scaled by the
    // audio/video bitrate ratio. The 50 MB base is an assumption -- TODO
    // confirm.
    const baseBufferTarget = 50 * 1000 * 1000;
    if (this.streamType === 'audio')
        this.bufferTarget = avRatio * baseBufferTarget;
    else
        this.bufferTarget = baseBufferTarget;

    this.sourceBuffer = this.mediaSource.addSourceBuffer(this.mimeCodec);
    this.sourceBuffer.mode = 'segments';
    this.sourceBuffer.addEventListener('error', (e) => {
        this.reportError('sourceBuffer error', e);
    });
    // Appends that arrived while the SourceBuffer was busy are retried
    // here, most recently queued first.
    this.updateendEvt = addEvent(this.sourceBuffer, 'updateend', (e) => {
        if (this.appendQueue.length !== 0) {
            this.appendSegment(...this.appendQueue.pop());
        }
    });
}

// Fetches and appends the initialization segment, then fetches the sidx
// table and hands it to setupSegments. Failures are reported via
// reportError rather than left as unhandled rejections.
Stream.prototype.setup = async function(){
    try {
        if (this.initRange.end + 1 === this.indexRange.start) {
            // Group requests together: init segment and sidx table are
            // adjacent in the file, so fetch them with a single request.
            await fetchRange(
                this.url,
                this.initRange.start,
                this.indexRange.end,
                (buffer) => {
                    const initEnd = this.initRange.end
                                    - this.initRange.start + 1;
                    const indexStart = this.indexRange.start
                                       - this.initRange.start;
                    const indexEnd = this.indexRange.end
                                     - this.initRange.start + 1;
                    this.appendSegment(null, false,
                                       buffer.slice(0, initEnd));
                    return this.setupSegments(
                        buffer.slice(indexStart, indexEnd)
                    );
                }
            );
        } else {
            // initialization data
            // segmentIdx is null (not a media segment), forSeek is false.
            await fetchRange(
                this.url,
                this.initRange.start,
                this.initRange.end,
                this.appendSegment.bind(this, null, false)
            );
            // sidx (segment index) table
            await fetchRange(
                this.url,
                this.indexRange.start,
                this.indexRange.end,
                this.setupSegments.bind(this)
            );
        }
    } catch (err) {
        this.reportError('Failed to set up stream:', err);
    }
};

// Parses the sidx box and requests the segment containing startTime.
Stream.prototype.setupSegments = async function(sidxBox){
    const box = unbox(sidxBox);
    // Segment byte offsets in the sidx are relative to the first byte
    // after the sidx box.
    this.sidx = sidx_parse(box.data, this.indexRange.end + 1);
    this.fetchSegmentIfNeeded(this.getSegmentIdx(this.startTime));
};

Stream.prototype.close = function() {
    // Prevents appendSegment adding to buffer if request finishes
    // after closing
    this.closed = true;
    if (this.sourceBuffer.updating)
        this.sourceBuffer.abort();
    this.mediaSource.removeSourceBuffer(this.sourceBuffer);
    this.updateendEvt.remove();
};

// Appends a fetched chunk to the SourceBuffer.
//
// segmentIdx: index into this.sidx.entries, or null for the init segment.
// forSeek:    true if the segment was requested by a seek; such a segment
//             is retried once after a QuotaExceededError.
// chunk:      the data to append.
//
// If the SourceBuffer is busy the append is queued for 'updateend'. On
// QuotaExceededError the buffering target is lowered and up to 3 buffered
// segments other than the current one are removed. Any other exception
// from appendBuffer is rethrown.
Stream.prototype.appendSegment = function(segmentIdx, forSeek, chunk) {
    if (this.closed)
        return;

    this.reportDebug('Received segment', segmentIdx);

    // cannot append right now, schedule for updateend
    if (this.sourceBuffer.updating) {
        this.reportDebug('sourceBuffer updating, queueing for later');
        this.appendQueue.push([segmentIdx, forSeek, chunk]);
        if (this.appendQueue.length > 2){
            this.reportWarning('appendQueue length:',
                               this.appendQueue.length);
        }
        return;
    }

    try {
        this.sourceBuffer.appendBuffer(chunk);
        if (segmentIdx !== null)
            this.sidx.entries[segmentIdx].have = true;
        this.appendRetries = 0;
    } catch (e) {
        if (e.name !== 'QuotaExceededError') {
            throw e;
        }
        this.reportWarning('QuotaExceededError.');
        const entries = this.sidx.entries;

        // Count how many bytes are in buffer to update buffering target,
        // updating .have as well for when we need to delete segments
        let bytesInBuffer = 0;
        for (let i = 0; i < entries.length; i++) {
            if (this.segmentInBuffer(i)) {
                bytesInBuffer += entries[i].referencedSize;
            } else if (entries[i].have) {
                entries[i].have = false;
                entries[i].requested = false;
            }
        }
        bytesInBuffer = Math.floor(4/5*bytesInBuffer);
        if (bytesInBuffer < this.bufferTarget) {
            this.bufferTarget = bytesInBuffer;
            this.reportDebug('New buffer target:', this.bufferTarget);
        }

        // Delete 3 segments (arbitrary) from buffer, making sure
        // not to delete current one
        const currentSegment = this.getSegmentIdx(this.video.currentTime);
        const toDelete = []; // See below for why we have to schedule it
        this.reportDebug('Deleting segments from beginning of buffer.');
        for (let i = 0; toDelete.length < 3 && i < currentSegment; i++) {
            if (entries[i].have)
                toDelete.push(i);
        }
        if (toDelete.length < 3)
            this.reportDebug('Deleting segments from end of buffer.');
        for (let i = entries.length - 1;
             toDelete.length < 3 && i > currentSegment; i--) {
            if (entries[i].have)
                toDelete.push(i);
        }

        // When calling .remove, the sourceBuffer will go into updating=true
        // state, and remove cannot be called until it is done. So we have
        // to delete on the updateend event for subsequent ones.
        let removeFinishedEvent;
        const deleteSegment = () => {
            if (toDelete.length === 0) {
                removeFinishedEvent.remove();
                if (forSeek) {
                    // If QuotaExceeded happened during seeking, retry the
                    // append. Pass false as forSeek to avoid infinite
                    // looping if it doesn't work. Rescheduling will take
                    // care of updating=true problem.
                    this.appendSegment(segmentIdx, false, chunk);
                } else if (segmentIdx !== null) {
                    // The chunk is dropped. Clear the request flag so
                    // checkBuffer can fetch the segment again; otherwise
                    // it would stay "requested" but never arrive.
                    entries[segmentIdx].requested = false;
                }
                return;
            }
            const idx = toDelete.shift();
            const entry = entries[idx];
            const start = entry.tickStart/this.sidx.timeScale;
            const end = (entry.tickEnd+1)/this.sidx.timeScale;
            this.reportDebug('Deleting segment', idx);
            this.sourceBuffer.remove(start, end);
            entry.have = false;
            entry.requested = false;
        };
        removeFinishedEvent = addEvent(this.sourceBuffer, 'updateend',
                                       deleteSegment);
        if (!this.sourceBuffer.updating)
            deleteSegment();
    }
};

// Returns the index of the segment containing videoTime (seconds).
// Reports an error and returns 0 if no segment contains that time.
Stream.prototype.getSegmentIdx = function(videoTime) {
    const entries = this.sidx.entries;

    // get an estimate
    const currentTick = videoTime * this.sidx.timeScale;
    const firstSegmentDuration = entries[0].subSegmentDuration;
    let index = 1 + Math.floor(currentTick / firstSegmentDuration);
    index = clamp(index, 0, entries.length - 1);

    let increment = 1;
    if (currentTick < entries[index].tickStart){
        increment = -1;
    }

    // go up or down to find correct index
    while (index >= 0 && index < entries.length) {
        const entry = entries[index];
        if (entry.tickStart <= currentTick
                && (entry.tickEnd+1) > currentTick){
            return index;
        }
        index = index + increment;
    }
    this.reportError('Could not find segment index for time', videoTime);
    return 0;
};

// Requests the first segment at or after the playback position that is
// not buffered, unless at least bufferTarget bytes are already buffered
// ahead. Signals end of stream when everything up to the end is buffered.
Stream.prototype.checkBuffer = async function() {
    if (this.avMerge.seeking) {
        return;
    }
    // 'timeupdate' can fire before the sidx table has been fetched
    if (!this.sidx) {
        return;
    }
    const entries = this.sidx.entries;

    // Find the first unbuffered segment, i
    const currentSegmentIdx = this.getSegmentIdx(this.video.currentTime);
    let bufferedBytesAhead = 0;
    let i;
    for (i = currentSegmentIdx; i < entries.length; i++) {
        const entry = entries[i];
        // check if we had it before, but it was deleted by the browser
        if (entry.have && !this.segmentInBuffer(i)) {
            this.reportDebug('segment', i, 'deleted by browser');
            entry.have = false;
            entry.requested = false;
        }
        if (!entry.have) {
            break;
        }
        bufferedBytesAhead += entry.referencedSize;
        if (bufferedBytesAhead > this.bufferTarget) {
            return;
        }
    }

    if (i < entries.length && !entries[i].requested) {
        this.fetchSegment(i);
    // We have all the segments until the end
    // Signal the end of stream
    } else if (i === entries.length) {
        if (this.streamType === 'audio')
            this.avMerge.audioEndOfStream();
        else
            this.avMerge.videoEndOfStream();
    }
};

// Returns true if sourceBuffer.buffered has a single time range covering
// the segment (within the tolerances explained below).
Stream.prototype.segmentInBuffer = function(segmentIdx) {
    const entry = this.sidx.entries[segmentIdx];
    // allow for 0.01 second error
    const timeStart = entry.tickStart/this.sidx.timeScale + 0.01;

    /* Some of YouTube's mp4 fragments are malformed, with half-frame
    playback gaps. In this video at 240p (timeScale = 90000 ticks/second)
        https://www.youtube.com/watch?v=ZhOQCwJvwlo
    segment 4 (starting at 0) is claimed in the sidx table to have
    a duration of 388500 ticks, but closer examination of the file using
    Bento4 mp4dump shows that the segment has 129 frames at 3000 ticks
    per frame, which gives an actual duration of 387000 (1500 less than
    claimed). The file is 30 fps, so this error is exactly half a frame.

    Note that the base_media_decode_time exactly matches the tickStart,
    so the media decoder is being given a time gap of half a frame.

    The practical result of this is that sourceBuffer.buffered reports
    a timeRange.end that is less than expected for that segment, resulting
    in a false determination that the browser has deleted a segment.

    Segment 5 has the opposite issue, where it has a 1500 tick surplus of
    video data compared to the sidx length. Segments 6 and 7 also have this
    deficit-surplus pattern.

    This might have something to do with the fact that the video also
    has 60 fps formats. In order to allow for adaptive streaming and
    seamless quality switching, YouTube likely encodes their formats to
    line up nicely. Either there is a bug in their encoder, or this is
    intentional. Allow for up to 1 frame-time of error to work around this
    issue. */
    let endError;
    if (this.streamType === 'video')
        endError = 1/(this.avMerge.videoSource.fps || 30);
    else
        endError = 0.01;
    const timeEnd = (entry.tickEnd+1)/this.sidx.timeScale - endError;

    const timeRanges = this.sourceBuffer.buffered;
    for (let i = 0; i < timeRanges.length; i++) {
        if (timeRanges.start(i) <= timeStart
                && timeEnd <= timeRanges.end(i)) {
            return true;
        }
    }
    return false;
};

// Marks the segment as requested and fetches its byte range; the response
// is passed to appendSegment. Fetch failures are reported.
Stream.prototype.fetchSegment = function(segmentIdx) {
    const entry = this.sidx.entries[segmentIdx];
    entry.requested = true;
    this.reportDebug(
        'Fetching segment', segmentIdx, ', bytes',
        entry.start, entry.end, ', seconds',
        entry.tickStart/this.sidx.timeScale,
        (entry.tickEnd+1)/this.sidx.timeScale
    );
    fetchRange(
        this.url,
        entry.start,
        entry.end,
        this.appendSegment.bind(this, segmentIdx, this.avMerge.seeking)
    ).catch((err) => {
        this.reportError('Failed to fetch segment', segmentIdx, err);
    });
};

// Fetches the segment unless the index is out of range or the segment has
// already been requested (and was not since evicted by the browser).
Stream.prototype.fetchSegmentIfNeeded = function(segmentIdx) {
    if (segmentIdx < 0 || segmentIdx >= this.sidx.entries.length){
        return;
    }
    const entry = this.sidx.entries[segmentIdx];
    // check if we had it before, but it was deleted by the browser
    if (entry.have && !this.segmentInBuffer(segmentIdx)) {
        this.reportDebug('segment', segmentIdx, 'deleted by browser');
        entry.have = false;
        entry.requested = false;
    }
    if (entry.requested) {
        return;
    }

    this.fetchSegment(segmentIdx);
};

// Makes sure the segment at the new playback position is being fetched.
Stream.prototype.handleSeek = function() {
    // A seek can happen before the sidx table has been fetched
    if (!this.sidx) {
        return;
    }
    const segmentIdx = this.getSegmentIdx(this.video.currentTime);
    this.fetchSegmentIfNeeded(segmentIdx);
};

// Logging helpers that prefix the message with the stream type.
Stream.prototype.reportDebug = function(...args) {
    reportDebug(String(this.streamType) + ':', ...args);
};
Stream.prototype.reportWarning = function(...args) {
    reportWarning(String(this.streamType) + ':', ...args);
};
Stream.prototype.reportError = function(...args) {
    reportError(String(this.streamType) + ':', ...args);
};


// Utility functions

// Requests bytes start..end (inclusive) of url and calls cb with the
// response ArrayBuffer. The returned promise resolves with whatever cb
// returns, and rejects on a network error or a non-2xx HTTP status (so an
// error page is never handed to cb as if it were media data).
function fetchRange(url, start, end, cb) {
    return new Promise((resolve, reject) => {
        const xhr = new XMLHttpRequest();
        xhr.open('get', url);
        xhr.responseType = 'arraybuffer';
        xhr.setRequestHeader('Range', 'bytes=' + start + '-' + end);
        xhr.onload = function() {
            if (xhr.status < 200 || xhr.status >= 300) {
                reject(new Error('Range request failed with HTTP status '
                                 + xhr.status));
                return;
            }
            resolve(cb(xhr.response));
        };
        xhr.onerror = function() {
            reject(new Error('Network error during range request'));
        };
        xhr.send();
    });
}

// Returns a wrapper that delays calling func until `wait` ms have passed
// without another call. With `immediate` truthy, func is instead called on
// the first call of a burst and not at the end.
function debounce(func, wait, immediate) {
    let timeout;
    return function(...args) {
        const context = this;
        const later = function() {
            timeout = null;
            if (!immediate) func.apply(context, args);
        };
        const callNow = immediate && !timeout;
        clearTimeout(timeout);
        timeout = setTimeout(later, wait);
        if (callNow) func.apply(context, args);
    };
}

// Restricts number to the range [min, max].
function clamp(number, min, max) {
    return Math.max(min, Math.min(number, max));
}

// allow to remove an event listener without having a function reference
function RegisteredEvent(obj, eventName, func) {
    this.obj = obj;
    this.eventName = eventName;
    this.func = func;
    obj.addEventListener(eventName, func);
}
RegisteredEvent.prototype.remove = function() {
    this.obj.removeEventListener(this.eventName, this.func);
};
function addEvent(obj, eventName, func) {
    return new RegisteredEvent(obj, eventName, func);
}

function reportWarning(...args){
    console.warn(...args);
}
function reportError(...args){
    console.error(...args);
}
function reportDebug(...args){
    console.debug(...args);
}

// Combines bytes into an unsigned integer, treating the FIRST byte as the
// most significant one (which is the byte order ISO BMFF boxes use).
// NOTE: despite the function's name this is big-endian order; the name is
// kept so existing callers keep working.
function byteArrayToIntegerLittleEndian(unsignedByteArray){
    let result = 0;
    for (const byte of unsignedByteArray){
        result = result*256;
        result += byte;
    }
    return result;
}

// Sequential reader over a byte buffer.
function ByteParser(data){
    this.curIndex = 0;
    this.data = new Uint8Array(data);
}
// Reads the next nBytes as an unsigned integer and advances.
ByteParser.prototype.readInteger = function(nBytes){
    const result = byteArrayToIntegerLittleEndian(
        this.data.slice(this.curIndex, this.curIndex + nBytes)
    );
    this.curIndex += nBytes;
    return result;
};
// Returns a copy of the next nBytes and advances.
ByteParser.prototype.readBufferBytes = function(nBytes){
    const result = this.data.slice(this.curIndex, this.curIndex + nBytes);
    this.curIndex += nBytes;
    return result;
};


// BEGIN iso-bmff-parser-stream/lib/box/sidx.js (modified)
// https://github.com/necccc/iso-bmff-parser-stream/blob/master/lib/box/sidx.js
/* The MIT License (MIT)

Copyright (c) 2014 Szabolcs Szabolcsi-Toth

Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the "Software"), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.*/
// Parses the payload of a sidx (segment index) box.
//
// data:   the box contents after the 8-byte size/type header.
// offset: absolute file offset of the first byte after the sidx box;
//         segment byte positions are computed relative to it.
//
// Each returned entry has the byte range (start..end, inclusive) and tick
// range (tickStart..tickEnd, inclusive) of one segment, plus the
// `requested` and `have` bookkeeping flags (initially false).
function sidx_parse (data, offset) {
    const bp = new ByteParser(data);
    const version = bp.readInteger(1);
    const flags = bp.readInteger(3);
    const referenceId = bp.readInteger(4);
    const timeScale = bp.readInteger(4);
    // In version 0 boxes earliest_presentation_time and first_offset are
    // 32-bit fields; in later versions BOTH are 64-bit.
    const wideFieldSize = version === 0 ? 4 : 8;
    const earliestPresentationTime = bp.readInteger(wideFieldSize);
    const firstOffset = bp.readInteger(wideFieldSize);
    bp.readInteger(2); // reserved
    const entryCount = bp.readInteger(2);
    const entries = [];

    let totalBytesOffset = firstOffset + offset;
    let totalTicks = 0;

    for (let i = entryCount; i > 0; i = i - 1) {
        // The top bit of this 32-bit field is reference_type; only the
        // low 31 bits are the referenced size.
        const referencedSize = bp.readInteger(4) & 0x7fffffff;
        const subSegmentDuration = bp.readInteger(4);
        const unused = bp.readBufferBytes(4);
        entries.push({
            referencedSize: referencedSize,
            subSegmentDuration: subSegmentDuration,
            unused: unused,
            start: totalBytesOffset,
            end: totalBytesOffset + referencedSize - 1, // inclusive
            tickStart: totalTicks,
            tickEnd: totalTicks + subSegmentDuration - 1,
            requested: false,
            have: false,
        });
        totalBytesOffset = totalBytesOffset + referencedSize;
        totalTicks = totalTicks + subSegmentDuration;
    }

    return {
        version: version,
        flags: flags,
        referenceId: referenceId,
        timeScale: timeScale,
        earliestPresentationTime: earliestPresentationTime,
        firstOffset: firstOffset,
        entries: entries
    };
}
// END sidx.js

// BEGIN iso-bmff-parser-stream/lib/unbox.js (same license), modified
// Splits a box into its header fields and payload.
//
// buf: the raw bytes of the box (an ArrayBuffer or typed array).
//
// Returns {length, type, data}. If buf is shorter than the length the box
// declares, a warning is reported and the result additionally carries
// currentLength (the number of bytes actually available).
function unbox(buf) {
    const bp = new ByteParser(buf);
    // Measure the parser's Uint8Array view: an ArrayBuffer has
    // `byteLength`, not `length`.
    const bufferLength = bp.data.length;

    const length = bp.readInteger(4); // length of entire box,
    const typeData = bp.readInteger(4);

    if (bufferLength - length < 0) {
        reportWarning('Warning: sidx table is cut off');
        return {
            currentLength: bufferLength,
            length: length,
            type: typeData,
            data: bp.readBufferBytes(bufferLength)
        };
    }

    const boxData = bp.readBufferBytes(length - 8);

    return {
        length: length,
        type: typeData,
        data: boxData
    };
}
// END unbox.js