mirror of https://bitbucket.org/ausocean/av.git
383 lines
13 KiB
JavaScript
383 lines
13 KiB
JavaScript
|
/*
|
||
|
NAME
|
||
|
mts-demuxer.js
|
||
|
|
||
|
AUTHOR
|
||
|
Trek Hopton <trek@ausocean.org>
|
||
|
|
||
|
LICENSE
|
||
|
This file is Copyright (C) 2019 the Australian Ocean Lab (AusOcean)
|
||
|
|
||
|
It is free software: you can redistribute it and/or modify them
|
||
|
under the terms of the GNU General Public License as published by the
|
||
|
Free Software Foundation, either version 3 of the License, or (at your
|
||
|
option) any later version.
|
||
|
|
||
|
It is distributed in the hope that it will be useful, but WITHOUT
|
||
|
ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
|
||
|
FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
|
||
|
for more details.
|
||
|
|
||
|
You should have received a copy of the GNU General Public License in gpl.txt.
|
||
|
If not, see http://www.gnu.org/licenses.
|
||
|
|
||
|
For hls.js Copyright notice and license, see LICENSE file.
|
||
|
*/
|
||
|
|
||
|
// MTSDemuxer demultiplexes an MPEG-TS stream into its individual streams.
|
||
|
// While it is possible that the MPEG-TS stream may contain many streams,
|
||
|
// this demuxer will result in at most one stream of each type ie. video, audio, id3 metadata.
|
||
|
class MTSDemuxer {
|
||
|
constructor() {
|
||
|
this.init();
|
||
|
}
|
||
|
|
||
|
// init initialises MTSDemuxer's state. It can be used to reset an MTSDemuxer instance.
|
||
|
init() {
|
||
|
this.pmtParsed = false;
|
||
|
this._pmtId = -1;
|
||
|
|
||
|
this._videoTrack = MTSDemuxer.createTrack('video');
|
||
|
this._audioTrack = MTSDemuxer.createTrack('audio');
|
||
|
this._id3Track = MTSDemuxer.createTrack('id3');
|
||
|
}
|
||
|
|
||
|
// createTrack creates and returns a track model.
|
||
|
/**
|
||
|
* @param {string} type 'audio' | 'video' | 'id3' | 'text'
|
||
|
* @return {object} MTSDemuxer's internal track model.
|
||
|
*/
|
||
|
static createTrack(type) {
|
||
|
return {
|
||
|
type,
|
||
|
pid: -1,
|
||
|
data: [] // This will contain Uint8Arrays representing each PES packet's payload for this track.
|
||
|
};
|
||
|
}
|
||
|
|
||
|
// _getTracks returns this MTSDemuxer's tracks.
|
||
|
_getTracks() {
|
||
|
return {
|
||
|
video: this._videoTrack,
|
||
|
audio: this._audioTrack,
|
||
|
id3: this._id3Track
|
||
|
};
|
||
|
}
|
||
|
|
||
|
// _syncOffset scans the first 'maxScanWindow' bytes and returns an offset to the beginning of the first three MTS packets,
|
||
|
// or -1 if three are not found.
|
||
|
// A TS fragment should contain at least 3 TS packets, a PAT, a PMT, and one PID, each starting with 0x47.
|
||
|
static _syncOffset(data) {
|
||
|
const maxScanWindow = 1000; // 1000 is a reasonable number of bytes to search for the first MTS packets.
|
||
|
const scanWindow = Math.min(maxScanWindow, data.length - 3 * 188);
|
||
|
let i = 0;
|
||
|
while (i < scanWindow) {
|
||
|
if (data[i] === 0x47 && data[i + 188] === 0x47 && data[i + 2 * 188] === 0x47) {
|
||
|
return i;
|
||
|
} else {
|
||
|
i++;
|
||
|
}
|
||
|
}
|
||
|
return -1;
|
||
|
}
|
||
|
|
||
|
append(data) {
|
||
|
let start, len = data.length, pusi, pid, afc, offset, pes,
|
||
|
unknownPIDs = false;
|
||
|
let pmtParsed = this.pmtParsed,
|
||
|
videoTrack = this._videoTrack,
|
||
|
audioTrack = this._audioTrack,
|
||
|
id3Track = this._id3Track,
|
||
|
videoId = videoTrack.pid,
|
||
|
audioId = audioTrack.pid,
|
||
|
id3Id = id3Track.pid,
|
||
|
pmtId = this._pmtId,
|
||
|
videoData = videoTrack.pesData,
|
||
|
audioData = audioTrack.pesData,
|
||
|
id3Data = id3Track.pesData,
|
||
|
parsePAT = this._parsePAT,
|
||
|
parsePMT = this._parsePMT,
|
||
|
parsePES = this._parsePES;
|
||
|
|
||
|
const syncOffset = MTSDemuxer._syncOffset(data);
|
||
|
|
||
|
// Don't parse last TS packet if incomplete.
|
||
|
len -= (len + syncOffset) % 188;
|
||
|
|
||
|
// Loop through TS packets.
|
||
|
for (start = syncOffset; start < len; start += 188) {
|
||
|
if (data[start] === 0x47) {
|
||
|
pusi = !!(data[start + 1] & 0x40);
|
||
|
// pid is a 13-bit field starting at the last bit of TS[1].
|
||
|
pid = ((data[start + 1] & 0x1f) << 8) + data[start + 2];
|
||
|
afc = (data[start + 3] & 0x30) >> 4;
|
||
|
// If an adaption field is present, its length is specified by the fifth byte of the TS packet header.
|
||
|
if (afc > 1) {
|
||
|
offset = start + 5 + data[start + 4];
|
||
|
// Continue if there is only adaptation field.
|
||
|
if (offset === (start + 188)) {
|
||
|
continue;
|
||
|
}
|
||
|
} else {
|
||
|
offset = start + 4;
|
||
|
}
|
||
|
switch (pid) {
|
||
|
case videoId:
|
||
|
if (pusi) {
|
||
|
if (videoData && (pes = parsePES(videoData)) && pes.pts !== undefined) {
|
||
|
videoTrack.data.push(pes.data);
|
||
|
// TODO: here pes contains data, pts, dts and len. Are all these needed?
|
||
|
}
|
||
|
videoData = { data: [], size: 0 };
|
||
|
}
|
||
|
if (videoData) {
|
||
|
videoData.data.push(data.subarray(offset, start + 188));
|
||
|
videoData.size += start + 188 - offset;
|
||
|
}
|
||
|
break;
|
||
|
case audioId:
|
||
|
if (pusi) {
|
||
|
if (audioData && (pes = parsePES(audioData)) && pes.pts !== undefined) {
|
||
|
audioTrack.data.push(pes.data);
|
||
|
}
|
||
|
audioData = { data: [], size: 0 };
|
||
|
}
|
||
|
if (audioData) {
|
||
|
audioData.data.push(data.subarray(offset, start + 188));
|
||
|
audioData.size += start + 188 - offset;
|
||
|
}
|
||
|
break;
|
||
|
case id3Id:
|
||
|
if (pusi) {
|
||
|
if (id3Data && (pes = parsePES(id3Data)) && pes.pts !== undefined) {
|
||
|
id3Track.data.push(pes.data);
|
||
|
}
|
||
|
id3Data = { data: [], size: 0 };
|
||
|
}
|
||
|
if (id3Data) {
|
||
|
id3Data.data.push(data.subarray(offset, start + 188));
|
||
|
id3Data.size += start + 188 - offset;
|
||
|
}
|
||
|
break;
|
||
|
case 0:
|
||
|
if (pusi) {
|
||
|
offset += data[offset] + 1;
|
||
|
}
|
||
|
|
||
|
pmtId = this._pmtId = parsePAT(data, offset);
|
||
|
break;
|
||
|
case pmtId:
|
||
|
if (pusi) {
|
||
|
offset += data[offset] + 1;
|
||
|
}
|
||
|
|
||
|
let parsedPIDs = parsePMT(data, offset);
|
||
|
|
||
|
// Only update track id if track PID found while parsing PMT.
|
||
|
// This is to avoid resetting the PID to -1 in case track PID transiently disappears from the stream,
|
||
|
// this could happen in case of transient missing audio samples for example.
|
||
|
videoId = parsedPIDs.video;
|
||
|
if (videoId > 0) {
|
||
|
videoTrack.pid = videoId;
|
||
|
}
|
||
|
audioId = parsedPIDs.audio;
|
||
|
if (audioId > 0) {
|
||
|
audioTrack.pid = audioId;
|
||
|
}
|
||
|
id3Id = parsedPIDs.id3;
|
||
|
if (id3Id > 0) {
|
||
|
id3Track.pid = id3Id;
|
||
|
}
|
||
|
|
||
|
if (unknownPIDs && !pmtParsed) {
|
||
|
// Reparse from beginning.
|
||
|
unknownPIDs = false;
|
||
|
// We set it to -188, the += 188 in the for loop will reset start to 0.
|
||
|
start = syncOffset - 188;
|
||
|
}
|
||
|
pmtParsed = this.pmtParsed = true;
|
||
|
break;
|
||
|
default:
|
||
|
unknownPIDs = true;
|
||
|
break;
|
||
|
}
|
||
|
} else {
|
||
|
console.error('TS packet did not start with 0x47');
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// Try to parse last PES packets.
|
||
|
if (videoData && (pes = parsePES(videoData)) && pes.pts !== undefined) {
|
||
|
videoTrack.data.push(pes.data);
|
||
|
videoTrack.pesData = null;
|
||
|
} else {
|
||
|
// Either pesPkts null or PES truncated, keep it for next frag parsing.
|
||
|
videoTrack.pesData = videoData;
|
||
|
}
|
||
|
|
||
|
if (audioData && (pes = parsePES(audioData)) && pes.pts !== undefined) {
|
||
|
audioTrack.data.push(pes.data);
|
||
|
audioTrack.pesData = null;
|
||
|
} else {
|
||
|
// Either pesPkts null or PES truncated, keep it for next frag parsing.
|
||
|
audioTrack.pesData = audioData;
|
||
|
}
|
||
|
|
||
|
if (id3Data && (pes = parsePES(id3Data)) && pes.pts !== undefined) {
|
||
|
id3Track.data.push(pes.data);
|
||
|
id3Track.pesData = null;
|
||
|
} else {
|
||
|
// Either pesPkts null or PES truncated, keep it for next frag parsing.
|
||
|
id3Track.pesData = id3Data;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
_parsePAT(data, offset) {
|
||
|
// Skip the PSI header and parse the first PMT entry.
|
||
|
return (data[offset + 10] & 0x1F) << 8 | data[offset + 11];
|
||
|
// console.log('PMT PID:' + this._pmtId);
|
||
|
}
|
||
|
|
||
|
_parsePMT(data, offset) {
|
||
|
let programInfoLength, pid, result = { audio: -1, video: -1, id3: -1 },
|
||
|
sectionLength = (data[offset + 1] & 0x0f) << 8 | data[offset + 2],
|
||
|
tableEnd = offset + 3 + sectionLength - 4;
|
||
|
// To determine where the table is, we have to figure out how
|
||
|
// long the program info descriptors are.
|
||
|
programInfoLength = (data[offset + 10] & 0x0f) << 8 | data[offset + 11];
|
||
|
// Advance the offset to the first entry in the mapping table.
|
||
|
offset += 12 + programInfoLength;
|
||
|
while (offset < tableEnd) {
|
||
|
pid = (data[offset + 1] & 0x1F) << 8 | data[offset + 2];
|
||
|
switch (data[offset]) {
|
||
|
case 0x1c: // MJPEG
|
||
|
case 0xdb: // SAMPLE-AES AVC.
|
||
|
case 0x1b: // ITU-T Rec. H.264 and ISO/IEC 14496-10 (lower bit-rate video).
|
||
|
if (result.video === -1) {
|
||
|
result.video = pid;
|
||
|
}
|
||
|
break;
|
||
|
case 0xcf: // SAMPLE-AES AAC.
|
||
|
case 0x0f: // ISO/IEC 13818-7 ADTS AAC (MPEG-2 lower bit-rate audio).
|
||
|
case 0xd2: // ADPCM audio.
|
||
|
case 0x03: // ISO/IEC 11172-3 (MPEG-1 audio).
|
||
|
case 0x24:
|
||
|
// console.warn('HEVC stream type found, not supported for now');
|
||
|
case 0x04: // or ISO/IEC 13818-3 (MPEG-2 halved sample rate audio).
|
||
|
if (result.audio === -1) {
|
||
|
result.audio = pid;
|
||
|
}
|
||
|
break;
|
||
|
case 0x15: // Packetized metadata (ID3)
|
||
|
// console.log('ID3 PID:' + pid);
|
||
|
if (result.id3 === -1) {
|
||
|
result.id3 = pid;
|
||
|
}
|
||
|
break;
|
||
|
default:
|
||
|
// console.log('unknown stream type:' + data[offset]);
|
||
|
break;
|
||
|
}
|
||
|
// Move to the next table entry, skip past the elementary stream descriptors, if present.
|
||
|
offset += ((data[offset + 3] & 0x0F) << 8 | data[offset + 4]) + 5;
|
||
|
}
|
||
|
return result;
|
||
|
}
|
||
|
|
||
|
_parsePES(stream) {
|
||
|
let i = 0, frag, pesFlags, pesPrefix, pesLen, pesHdrLen, pesData, pesPts, pesDts, payloadStartOffset, data = stream.data;
|
||
|
// Safety check.
|
||
|
if (!stream || stream.size === 0) {
|
||
|
return null;
|
||
|
}
|
||
|
|
||
|
// We might need up to 19 bytes to read PES header.
|
||
|
// If first chunk of data is less than 19 bytes, let's merge it with following ones until we get 19 bytes.
|
||
|
// Usually only one merge is needed (and this is rare ...).
|
||
|
while (data[0].length < 19 && data.length > 1) {
|
||
|
let newData = new Uint8Array(data[0].length + data[1].length);
|
||
|
newData.set(data[0]);
|
||
|
newData.set(data[1], data[0].length);
|
||
|
data[0] = newData;
|
||
|
data.splice(1, 1);
|
||
|
}
|
||
|
// Retrieve PTS/DTS from first fragment.
|
||
|
frag = data[0];
|
||
|
pesPrefix = (frag[0] << 16) + (frag[1] << 8) + frag[2];
|
||
|
if (pesPrefix === 1) {
|
||
|
pesLen = (frag[4] << 8) + frag[5];
|
||
|
// If PES parsed length is not zero and greater than total received length, stop parsing. PES might be truncated.
|
||
|
// Minus 6 : PES header size.
|
||
|
if (pesLen && pesLen > stream.size - 6) {
|
||
|
return null;
|
||
|
}
|
||
|
|
||
|
pesFlags = frag[7];
|
||
|
if (pesFlags & 0xC0) {
|
||
|
// PES header described here : http://dvd.sourceforge.net/dvdinfo/pes-hdr.html
|
||
|
// As PTS / DTS is 33 bit we cannot use bitwise operator in JS,
|
||
|
// as Bitwise operators treat their operands as a sequence of 32 bits.
|
||
|
pesPts = (frag[9] & 0x0E) * 536870912 +// 1 << 29
|
||
|
(frag[10] & 0xFF) * 4194304 +// 1 << 22
|
||
|
(frag[11] & 0xFE) * 16384 +// 1 << 14
|
||
|
(frag[12] & 0xFF) * 128 +// 1 << 7
|
||
|
(frag[13] & 0xFE) / 2;
|
||
|
// Check if greater than 2^32 -1.
|
||
|
if (pesPts > 4294967295) {
|
||
|
// Decrement 2^33.
|
||
|
pesPts -= 8589934592;
|
||
|
}
|
||
|
if (pesFlags & 0x40) {
|
||
|
pesDts = (frag[14] & 0x0E) * 536870912 +// 1 << 29
|
||
|
(frag[15] & 0xFF) * 4194304 +// 1 << 22
|
||
|
(frag[16] & 0xFE) * 16384 +// 1 << 14
|
||
|
(frag[17] & 0xFF) * 128 +// 1 << 7
|
||
|
(frag[18] & 0xFE) / 2;
|
||
|
// Check if greater than 2^32 -1.
|
||
|
if (pesDts > 4294967295) {
|
||
|
// Decrement 2^33.
|
||
|
pesDts -= 8589934592;
|
||
|
}
|
||
|
if (pesPts - pesDts > 60 * 90000) {
|
||
|
// console.warn(`${Math.round((pesPts - pesDts) / 90000)}s delta between PTS and DTS, align them`);
|
||
|
pesPts = pesDts;
|
||
|
}
|
||
|
} else {
|
||
|
pesDts = pesPts;
|
||
|
}
|
||
|
}
|
||
|
pesHdrLen = frag[8];
|
||
|
// 9 bytes : 6 bytes for PES header + 3 bytes for PES extension.
|
||
|
payloadStartOffset = pesHdrLen + 9;
|
||
|
|
||
|
stream.size -= payloadStartOffset;
|
||
|
// Reassemble PES packet.
|
||
|
pesData = new Uint8Array(stream.size);
|
||
|
for (let j = 0, dataLen = data.length; j < dataLen; j++) {
|
||
|
frag = data[j];
|
||
|
let len = frag.byteLength;
|
||
|
if (payloadStartOffset) {
|
||
|
if (payloadStartOffset > len) {
|
||
|
// Trim full frag if PES header bigger than frag.
|
||
|
payloadStartOffset -= len;
|
||
|
continue;
|
||
|
} else {
|
||
|
// Trim partial frag if PES header smaller than frag.
|
||
|
frag = frag.subarray(payloadStartOffset);
|
||
|
len -= payloadStartOffset;
|
||
|
payloadStartOffset = 0;
|
||
|
}
|
||
|
}
|
||
|
pesData.set(frag, i);
|
||
|
i += len;
|
||
|
}
|
||
|
if (pesLen) {
|
||
|
// Payload size : remove PES header + PES extension.
|
||
|
pesLen -= pesHdrLen + 3;
|
||
|
}
|
||
|
return { data: pesData, pts: pesPts, dts: pesDts, len: pesLen };
|
||
|
} else {
|
||
|
return null;
|
||
|
}
|
||
|
}
|
||
|
}
|