123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299 |
- /**
- * mux.js
- *
- * Copyright (c) Brightcove
- * Licensed Apache-2.0 https://github.com/videojs/mux.js/blob/master/LICENSE
- *
- * Utilities to detect basic properties and metadata about TS Segments.
- */
- 'use strict';
- var StreamTypes = require('./stream-types.js');
- var parsePid = function parsePid(packet) {
- var pid = packet[1] & 0x1f;
- pid <<= 8;
- pid |= packet[2];
- return pid;
- };
- var parsePayloadUnitStartIndicator = function parsePayloadUnitStartIndicator(packet) {
- return !!(packet[1] & 0x40);
- };
- var parseAdaptionField = function parseAdaptionField(packet) {
- var offset = 0; // if an adaption field is present, its length is specified by the
- // fifth byte of the TS packet header. The adaptation field is
- // used to add stuffing to PES packets that don't fill a complete
- // TS packet, and to specify some forms of timing and control data
- // that we do not currently use.
- if ((packet[3] & 0x30) >>> 4 > 0x01) {
- offset += packet[4] + 1;
- }
- return offset;
- };
- var parseType = function parseType(packet, pmtPid) {
- var pid = parsePid(packet);
- if (pid === 0) {
- return 'pat';
- } else if (pid === pmtPid) {
- return 'pmt';
- } else if (pmtPid) {
- return 'pes';
- }
- return null;
- };
- var parsePat = function parsePat(packet) {
- var pusi = parsePayloadUnitStartIndicator(packet);
- var offset = 4 + parseAdaptionField(packet);
- if (pusi) {
- offset += packet[offset] + 1;
- }
- return (packet[offset + 10] & 0x1f) << 8 | packet[offset + 11];
- };
- var parsePmt = function parsePmt(packet) {
- var programMapTable = {};
- var pusi = parsePayloadUnitStartIndicator(packet);
- var payloadOffset = 4 + parseAdaptionField(packet);
- if (pusi) {
- payloadOffset += packet[payloadOffset] + 1;
- } // PMTs can be sent ahead of the time when they should actually
- // take effect. We don't believe this should ever be the case
- // for HLS but we'll ignore "forward" PMT declarations if we see
- // them. Future PMT declarations have the current_next_indicator
- // set to zero.
- if (!(packet[payloadOffset + 5] & 0x01)) {
- return;
- }
- var sectionLength, tableEnd, programInfoLength; // the mapping table ends at the end of the current section
- sectionLength = (packet[payloadOffset + 1] & 0x0f) << 8 | packet[payloadOffset + 2];
- tableEnd = 3 + sectionLength - 4; // to determine where the table is, we have to figure out how
- // long the program info descriptors are
- programInfoLength = (packet[payloadOffset + 10] & 0x0f) << 8 | packet[payloadOffset + 11]; // advance the offset to the first entry in the mapping table
- var offset = 12 + programInfoLength;
- while (offset < tableEnd) {
- var i = payloadOffset + offset; // add an entry that maps the elementary_pid to the stream_type
- programMapTable[(packet[i + 1] & 0x1F) << 8 | packet[i + 2]] = packet[i]; // move to the next table entry
- // skip past the elementary stream descriptors, if present
- offset += ((packet[i + 3] & 0x0F) << 8 | packet[i + 4]) + 5;
- }
- return programMapTable;
- };
- var parsePesType = function parsePesType(packet, programMapTable) {
- var pid = parsePid(packet);
- var type = programMapTable[pid];
- switch (type) {
- case StreamTypes.H264_STREAM_TYPE:
- return 'video';
- case StreamTypes.ADTS_STREAM_TYPE:
- return 'audio';
- case StreamTypes.METADATA_STREAM_TYPE:
- return 'timed-metadata';
- default:
- return null;
- }
- };
- var parsePesTime = function parsePesTime(packet) {
- var pusi = parsePayloadUnitStartIndicator(packet);
- if (!pusi) {
- return null;
- }
- var offset = 4 + parseAdaptionField(packet);
- if (offset >= packet.byteLength) {
- // From the H 222.0 MPEG-TS spec
- // "For transport stream packets carrying PES packets, stuffing is needed when there
- // is insufficient PES packet data to completely fill the transport stream packet
- // payload bytes. Stuffing is accomplished by defining an adaptation field longer than
- // the sum of the lengths of the data elements in it, so that the payload bytes
- // remaining after the adaptation field exactly accommodates the available PES packet
- // data."
- //
- // If the offset is >= the length of the packet, then the packet contains no data
- // and instead is just adaption field stuffing bytes
- return null;
- }
- var pes = null;
- var ptsDtsFlags; // PES packets may be annotated with a PTS value, or a PTS value
- // and a DTS value. Determine what combination of values is
- // available to work with.
- ptsDtsFlags = packet[offset + 7]; // PTS and DTS are normally stored as a 33-bit number. Javascript
- // performs all bitwise operations on 32-bit integers but javascript
- // supports a much greater range (52-bits) of integer using standard
- // mathematical operations.
- // We construct a 31-bit value using bitwise operators over the 31
- // most significant bits and then multiply by 4 (equal to a left-shift
- // of 2) before we add the final 2 least significant bits of the
- // timestamp (equal to an OR.)
- if (ptsDtsFlags & 0xC0) {
- pes = {}; // the PTS and DTS are not written out directly. For information
- // on how they are encoded, see
- // http://dvd.sourceforge.net/dvdinfo/pes-hdr.html
- pes.pts = (packet[offset + 9] & 0x0E) << 27 | (packet[offset + 10] & 0xFF) << 20 | (packet[offset + 11] & 0xFE) << 12 | (packet[offset + 12] & 0xFF) << 5 | (packet[offset + 13] & 0xFE) >>> 3;
- pes.pts *= 4; // Left shift by 2
- pes.pts += (packet[offset + 13] & 0x06) >>> 1; // OR by the two LSBs
- pes.dts = pes.pts;
- if (ptsDtsFlags & 0x40) {
- pes.dts = (packet[offset + 14] & 0x0E) << 27 | (packet[offset + 15] & 0xFF) << 20 | (packet[offset + 16] & 0xFE) << 12 | (packet[offset + 17] & 0xFF) << 5 | (packet[offset + 18] & 0xFE) >>> 3;
- pes.dts *= 4; // Left shift by 2
- pes.dts += (packet[offset + 18] & 0x06) >>> 1; // OR by the two LSBs
- }
- }
- return pes;
- };
- var parseNalUnitType = function parseNalUnitType(type) {
- switch (type) {
- case 0x05:
- return 'slice_layer_without_partitioning_rbsp_idr';
- case 0x06:
- return 'sei_rbsp';
- case 0x07:
- return 'seq_parameter_set_rbsp';
- case 0x08:
- return 'pic_parameter_set_rbsp';
- case 0x09:
- return 'access_unit_delimiter_rbsp';
- default:
- return null;
- }
- };
- var videoPacketContainsKeyFrame = function videoPacketContainsKeyFrame(packet) {
- var offset = 4 + parseAdaptionField(packet);
- var frameBuffer = packet.subarray(offset);
- var frameI = 0;
- var frameSyncPoint = 0;
- var foundKeyFrame = false;
- var nalType; // advance the sync point to a NAL start, if necessary
- for (; frameSyncPoint < frameBuffer.byteLength - 3; frameSyncPoint++) {
- if (frameBuffer[frameSyncPoint + 2] === 1) {
- // the sync point is properly aligned
- frameI = frameSyncPoint + 5;
- break;
- }
- }
- while (frameI < frameBuffer.byteLength) {
- // look at the current byte to determine if we've hit the end of
- // a NAL unit boundary
- switch (frameBuffer[frameI]) {
- case 0:
- // skip past non-sync sequences
- if (frameBuffer[frameI - 1] !== 0) {
- frameI += 2;
- break;
- } else if (frameBuffer[frameI - 2] !== 0) {
- frameI++;
- break;
- }
- if (frameSyncPoint + 3 !== frameI - 2) {
- nalType = parseNalUnitType(frameBuffer[frameSyncPoint + 3] & 0x1f);
- if (nalType === 'slice_layer_without_partitioning_rbsp_idr') {
- foundKeyFrame = true;
- }
- } // drop trailing zeroes
- do {
- frameI++;
- } while (frameBuffer[frameI] !== 1 && frameI < frameBuffer.length);
- frameSyncPoint = frameI - 2;
- frameI += 3;
- break;
- case 1:
- // skip past non-sync sequences
- if (frameBuffer[frameI - 1] !== 0 || frameBuffer[frameI - 2] !== 0) {
- frameI += 3;
- break;
- }
- nalType = parseNalUnitType(frameBuffer[frameSyncPoint + 3] & 0x1f);
- if (nalType === 'slice_layer_without_partitioning_rbsp_idr') {
- foundKeyFrame = true;
- }
- frameSyncPoint = frameI - 2;
- frameI += 3;
- break;
- default:
- // the current byte isn't a one or zero, so it cannot be part
- // of a sync sequence
- frameI += 3;
- break;
- }
- }
- frameBuffer = frameBuffer.subarray(frameSyncPoint);
- frameI -= frameSyncPoint;
- frameSyncPoint = 0; // parse the final nal
- if (frameBuffer && frameBuffer.byteLength > 3) {
- nalType = parseNalUnitType(frameBuffer[frameSyncPoint + 3] & 0x1f);
- if (nalType === 'slice_layer_without_partitioning_rbsp_idr') {
- foundKeyFrame = true;
- }
- }
- return foundKeyFrame;
- };
- module.exports = {
- parseType: parseType,
- parsePat: parsePat,
- parsePmt: parsePmt,
- parsePayloadUnitStartIndicator: parsePayloadUnitStartIndicator,
- parsePesType: parsePesType,
- parsePesTime: parsePesTime,
- videoPacketContainsKeyFrame: videoPacketContainsKeyFrame
- };
|