5#include <packager/media/base/container_names.h>
13#include <absl/log/check.h>
14#include <absl/log/log.h>
15#include <libxml/parser.h>
16#include <libxml/tree.h>
18#include <packager/media/base/bit_reader.h>
19#include <packager/mpd/base/xml/scoped_xml_ptr.h>
24#define TAG(a, b, c, d) \
25 ((static_cast<uint32_t>(static_cast<uint8_t>(a)) << 24) | \
26 (static_cast<uint8_t>(b) << 16) | (static_cast<uint8_t>(c) << 8) | \
27 (static_cast<uint8_t>(d)))
35#define UTF8_BYTE_ORDER_MARK "\xef\xbb\xbf"
38static int Read16(
const uint8_t* p) {
39 return p[0] << 8 | p[1];
43static uint32_t Read24(
const uint8_t* p) {
44 return p[0] << 16 | p[1] << 8 | p[2];
48static uint32_t Read32(
const uint8_t* p) {
49 return p[0] << 24 | p[1] << 16 | p[2] << 8 | p[3];
53static uint32_t Read32LE(
const uint8_t* p) {
54 return p[3] << 24 | p[2] << 16 | p[1] << 8 | p[0];
59static bool StartsWith(
const uint8_t* buffer,
62 size_t prefix_size = strlen(prefix);
63 return (prefix_size <= buffer_size &&
64 memcmp(buffer, prefix, prefix_size) == 0);
69static bool StartsWith(
const uint8_t* buffer,
71 const uint8_t* prefix,
73 return (prefix_size <= buffer_size &&
74 memcmp(buffer, prefix, prefix_size) == 0);
78static uint64_t ReadBits(BitReader* reader,
int num_bits) {
79 DCHECK_GE(
static_cast<int>(reader->bits_available()), num_bits);
80 DCHECK((num_bits > 0) && (num_bits <= 64));
82 reader->ReadBits(num_bits, &value);
86const int kAc3FrameSizeTable[38][3] = {
87 {128, 138, 192}, {128, 140, 192}, {160, 174, 240},
88 {160, 176, 240}, {192, 208, 288}, {192, 210, 288},
89 {224, 242, 336}, {224, 244, 336}, {256, 278, 384},
90 {256, 280, 384}, {320, 348, 480}, {320, 350, 480},
91 {384, 416, 576}, {384, 418, 576}, {448, 486, 672},
92 {448, 488, 672}, {512, 556, 768}, {512, 558, 768},
93 {640, 696, 960}, {640, 698, 960}, {768, 834, 1152},
94 {768, 836, 1152}, {896, 974, 1344}, {896, 976, 1344},
95 {1024, 1114, 1536}, {1024, 1116, 1536}, {1280, 1392, 1920},
96 {1280, 1394, 1920}, {1536, 1670, 2304}, {1536, 1672, 2304},
97 {1792, 1950, 2688}, {1792, 1952, 2688}, {2048, 2228, 3072},
98 {2048, 2230, 3072}, {2304, 2506, 3456}, {2304, 2508, 3456},
99 {2560, 2768, 3840}, {2560, 2770, 3840}};
102static bool CheckAac(
const uint8_t* buffer,
int buffer_size) {
105 RCHECK(buffer_size > 6);
108 while (offset + 6 < buffer_size) {
109 BitReader reader(buffer + offset, 6);
112 RCHECK(ReadBits(&reader, 12) == 0xfff);
118 RCHECK(ReadBits(&reader, 2) == 0);
121 reader.SkipBits(1 + 2);
124 RCHECK(ReadBits(&reader, 4) != 15);
128 reader.SkipBits(1 + 3 + 1 + 1 + 1 + 1);
131 int size = ReadBits(&reader, 13);
138const uint16_t kAc3SyncWord = 0x0b77;
141static bool CheckAc3(
const uint8_t* buffer,
int buffer_size) {
147 RCHECK(buffer_size > 6);
150 while (offset + 6 < buffer_size) {
151 BitReader reader(buffer + offset, 6);
154 RCHECK(ReadBits(&reader, 16) == kAc3SyncWord);
160 int sample_rate_code = ReadBits(&reader, 2);
161 RCHECK(sample_rate_code != 3);
164 int frame_size_code = ReadBits(&reader, 6);
165 RCHECK(frame_size_code < 38);
168 RCHECK(ReadBits(&reader, 5) < 10);
170 offset += kAc3FrameSizeTable[frame_size_code][sample_rate_code];
176static bool CheckEac3(
const uint8_t* buffer,
int buffer_size) {
182 RCHECK(buffer_size > 6);
185 while (offset + 6 < buffer_size) {
186 BitReader reader(buffer + offset, 6);
189 RCHECK(ReadBits(&reader, 16) == kAc3SyncWord);
192 RCHECK(ReadBits(&reader, 2) != 3);
198 int frame_size = (ReadBits(&reader, 11) + 1) * 2;
199 RCHECK(frame_size >= 7);
202 reader.SkipBits(2 + 2 + 3 + 1);
205 int bit_stream_id = ReadBits(&reader, 5);
206 RCHECK(bit_stream_id >= 11 && bit_stream_id <= 16);
208 offset += frame_size;
214static bool CheckBink(
const uint8_t* buffer,
int buffer_size) {
216 RCHECK(buffer_size >= 44);
219 RCHECK(Read32LE(buffer + 8) > 0);
222 int width = Read32LE(buffer + 20);
223 RCHECK(width > 0 && width <= 32767);
226 int height = Read32LE(buffer + 24);
227 RCHECK(height > 0 && height <= 32767);
230 RCHECK(Read32LE(buffer + 28) > 0);
233 RCHECK(Read32LE(buffer + 32) > 0);
236 return (Read32LE(buffer + 40) <= 256);
240static bool CheckCaf(
const uint8_t* buffer,
int buffer_size) {
243 RCHECK(buffer_size >= 52);
244 BitReader reader(buffer, buffer_size);
247 RCHECK(ReadBits(&reader, 32) == TAG(
'c',
'a',
'f',
'f'));
250 RCHECK(ReadBits(&reader, 16) == 1);
256 RCHECK(ReadBits(&reader, 32) == TAG(
'd',
'e',
's',
'c'));
257 RCHECK(ReadBits(&reader, 64) == 32);
260 RCHECK(ReadBits(&reader, 64) != 0);
263 RCHECK(ReadBits(&reader, 32) != 0);
266 reader.SkipBits(32 + 32);
269 RCHECK(ReadBits(&reader, 32) != 0);
273static bool kSamplingFrequencyValid[16] = {
274 false,
true,
true,
true,
false,
false,
true,
true,
275 true,
false,
false,
true,
true,
true,
false,
false};
276static bool kExtAudioIdValid[8] = {
true,
false,
true,
false,
277 false,
false,
true,
false};
280static bool CheckDts(
const uint8_t* buffer,
int buffer_size) {
283 RCHECK(buffer_size > 11);
286 while (offset + 11 < buffer_size) {
287 BitReader reader(buffer + offset, 11);
290 RCHECK(ReadBits(&reader, 32) == 0x7ffe8001);
293 reader.SkipBits(1 + 5);
296 RCHECK(ReadBits(&reader, 1) == 0);
299 RCHECK(ReadBits(&reader, 7) >= 5);
302 int frame_size = ReadBits(&reader, 14);
303 RCHECK(frame_size >= 95);
309 RCHECK(kSamplingFrequencyValid[ReadBits(&reader, 4)]);
312 RCHECK(ReadBits(&reader, 5) <= 25);
315 RCHECK(ReadBits(&reader, 1) == 0);
318 reader.SkipBits(1 + 1 + 1 + 1);
321 RCHECK(kExtAudioIdValid[ReadBits(&reader, 3)]);
324 reader.SkipBits(1 + 1);
327 RCHECK(ReadBits(&reader, 2) != 3);
329 offset += frame_size + 1;
335static bool CheckDV(
const uint8_t* buffer,
int buffer_size) {
338 RCHECK(buffer_size > 11);
341 int current_sequence_number = -1;
342 int last_block_number[6];
343 while (offset + 11 < buffer_size) {
344 BitReader reader(buffer + offset, 11);
347 int section = ReadBits(&reader, 3);
351 RCHECK(ReadBits(&reader, 1) == 1);
356 int sequence_number = ReadBits(&reader, 4);
362 RCHECK(ReadBits(&reader, 3) == 7);
364 int block_number = ReadBits(&reader, 8);
369 RCHECK(ReadBits(&reader, 1) == 0);
370 RCHECK(ReadBits(&reader, 11) == 0x7ff);
372 RCHECK(ReadBits(&reader, 4) == 0xf);
374 RCHECK(ReadBits(&reader, 4) == 0xf);
376 RCHECK(ReadBits(&reader, 4) == 0xf);
378 RCHECK(ReadBits(&reader, 24) == 0xffffff);
379 current_sequence_number = sequence_number;
380 for (
size_t i = 0; i < std::size(last_block_number); ++i)
381 last_block_number[i] = -1;
384 RCHECK(sequence_number == current_sequence_number);
386 RCHECK(block_number > last_block_number[section]);
387 last_block_number[section] = block_number;
397static bool CheckGsm(
const uint8_t* buffer,
int buffer_size) {
402 RCHECK(buffer_size >= 1024);
405 while (offset < buffer_size) {
407 RCHECK((buffer[offset] & 0xf0) == 0xd0);
418static bool AdvanceToStartCode(
const uint8_t* buffer,
423 uint32_t start_code) {
424 DCHECK_GE(bytes_needed, 3);
425 DCHECK_LE(num_bits, 24);
428 uint32_t bits_to_shift = 24 - num_bits;
429 uint32_t mask = (1 << num_bits) - 1;
430 while (*offset + bytes_needed < buffer_size) {
431 uint32_t next = Read24(buffer + *offset);
432 if (((next >> bits_to_shift) & mask) == start_code)
440static bool CheckH261(
const uint8_t* buffer,
int buffer_size) {
443 RCHECK(buffer_size > 16);
446 bool seen_start_code =
false;
449 if (!AdvanceToStartCode(buffer, buffer_size, &offset, 4, 20, 0x10)) {
452 return seen_start_code;
457 BitReader reader(buffer + offset, buffer_size - offset);
458 RCHECK(ReadBits(&reader, 20) == 0x10);
461 reader.SkipBits(5 + 6);
465 int extra = ReadBits(&reader, 1);
467 if (!reader.SkipBits(8))
468 return seen_start_code;
469 if (!reader.ReadBits(1, &extra))
470 return seen_start_code;
477 if (!reader.ReadBits(16, &next))
478 return seen_start_code;
482 seen_start_code =
true;
488static bool CheckH263(
const uint8_t* buffer,
int buffer_size) {
492 RCHECK(buffer_size > 16);
495 bool seen_start_code =
false;
498 if (!AdvanceToStartCode(buffer, buffer_size, &offset, 9, 22, 0x20)) {
501 return seen_start_code;
506 BitReader reader(buffer + offset, 9);
507 RCHECK(ReadBits(&reader, 22) == 0x20);
513 RCHECK(ReadBits(&reader, 2) == 2);
517 reader.SkipBits(1 + 1 + 1);
520 int format = ReadBits(&reader, 3);
521 RCHECK(format != 0 && format != 6);
525 int ufep = ReadBits(&reader, 3);
528 format = ReadBits(&reader, 3);
529 RCHECK(format != 0 && format != 7);
532 RCHECK(ReadBits(&reader, 4) == 8);
538 int picture_type_code = ReadBits(&reader, 3);
539 RCHECK(picture_type_code != 6 && picture_type_code != 7);
543 reader.SkipBits(1 + 1 + 1);
546 RCHECK(ReadBits(&reader, 3) == 1);
550 seen_start_code =
true;
556static bool CheckH264(
const uint8_t* buffer,
int buffer_size) {
560 RCHECK(buffer_size > 4);
563 int parameter_count = 0;
566 if (!AdvanceToStartCode(buffer, buffer_size, &offset, 4, 24, 1)) {
569 return parameter_count > 0;
574 BitReader reader(buffer + offset, 4);
575 RCHECK(ReadBits(&reader, 24) == 1);
578 RCHECK(ReadBits(&reader, 1) == 0);
581 int nal_ref_idc = ReadBits(&reader, 2);
582 int nal_unit_type = ReadBits(&reader, 5);
584 switch (nal_unit_type) {
586 RCHECK(nal_ref_idc != 0);
593 RCHECK(nal_ref_idc == 0);
606static const char kHlsSignature[] =
"#EXTM3U";
607static const char kHls1[] =
"#EXT-X-STREAM-INF:";
608static const char kHls2[] =
"#EXT-X-TARGETDURATION:";
609static const char kHls3[] =
"#EXT-X-MEDIA-SEQUENCE:";
612static bool CheckHls(
const uint8_t* buffer,
int buffer_size) {
617 if (StartsWith(buffer, buffer_size, kHlsSignature)) {
622 int offset = strlen(kHlsSignature);
623 while (offset < buffer_size) {
624 if (buffer[offset] ==
'#') {
625 if (StartsWith(buffer + offset, buffer_size - offset, kHls1) ||
626 StartsWith(buffer + offset, buffer_size - offset, kHls2) ||
627 StartsWith(buffer + offset, buffer_size - offset, kHls3)) {
638static bool CheckMJpeg(
const uint8_t* buffer,
int buffer_size) {
641 RCHECK(buffer_size >= 16);
644 int last_restart = -1;
646 while (offset + 5 < buffer_size) {
648 RCHECK(buffer[offset] == 0xff);
649 uint8_t code = buffer[offset + 1];
650 RCHECK(code >= 0xc0 || code == 1);
663 if (code == 0xd8 || code == 1) {
666 }
else if (code >= 0xd0 && code <= 0xd7) {
668 int restart = code & 0x07;
669 if (last_restart >= 0)
670 RCHECK(restart == (last_restart + 1) % 8);
671 last_restart = restart;
675 int length = Read16(buffer + offset + 2) + 2;
681 int number_components = buffer[offset + 4];
682 RCHECK(length == 8 + 2 * number_components);
686 while (offset + 2 < buffer_size) {
687 if (buffer[offset] == 0xff && buffer[offset + 1] != 0)
698 return (num_codes > 1);
701enum Mpeg2StartCodes { PROGRAM_END_CODE = 0xb9, PACK_START_CODE = 0xba };
704static bool CheckMpeg2ProgramStream(
const uint8_t* buffer,
int buffer_size) {
706 RCHECK(buffer_size > 14);
709 while (offset + 14 < buffer_size) {
710 BitReader reader(buffer + offset, 14);
713 RCHECK(ReadBits(&reader, 24) == 1);
714 RCHECK(ReadBits(&reader, 8) == PACK_START_CODE);
717 int mpeg_version = ReadBits(&reader, 2);
718 if (mpeg_version == 0) {
721 RCHECK(ReadBits(&reader, 2) == 2);
723 RCHECK(mpeg_version == 1);
730 RCHECK(ReadBits(&reader, 1) == 1);
736 RCHECK(ReadBits(&reader, 1) == 1);
742 RCHECK(ReadBits(&reader, 1) == 1);
744 if (mpeg_version == 0) {
746 RCHECK(ReadBits(&reader, 1) == 1);
752 RCHECK(ReadBits(&reader, 1) == 1);
762 RCHECK(ReadBits(&reader, 2) == 3);
768 int pack_stuffing_length = ReadBits(&reader, 3);
769 offset += 14 + pack_stuffing_length;
773 while (offset + 6 < buffer_size && Read24(buffer + offset) == 1) {
775 int stream_id = buffer[offset + 3];
778 if (mpeg_version == 0)
779 RCHECK(stream_id != 0xbc && stream_id < 0xf0);
781 RCHECK(stream_id != 0xfc && stream_id != 0xfd && stream_id != 0xfe);
784 if (stream_id == PACK_START_CODE)
786 if (stream_id == PROGRAM_END_CODE)
789 int pes_length = Read16(buffer + offset + 4);
790 RCHECK(pes_length > 0);
791 offset = offset + 6 + pes_length;
799const uint8_t kMpeg2SyncWord = 0x47;
802static bool CheckMpeg2TransportStream(
const uint8_t* buffer,
int buffer_size) {
808 RCHECK(buffer_size >= 250);
811 int packet_length = -1;
812 while (buffer[offset] != kMpeg2SyncWord && offset < 20) {
817 while (offset + 6 < buffer_size) {
818 BitReader reader(buffer + offset, 6);
821 RCHECK(ReadBits(&reader, 8) == kMpeg2SyncWord);
825 reader.SkipBits(1 + 1 + 1);
828 int pid = ReadBits(&reader, 13);
829 RCHECK(pid < 3 || pid > 15);
836 int adaptation_field_control = ReadBits(&reader, 2);
837 RCHECK(adaptation_field_control != 0);
840 if (adaptation_field_control >= 2) {
845 int adaptation_field_length = ReadBits(&reader, 8);
846 if (adaptation_field_control == 2)
847 RCHECK(adaptation_field_length == 183);
849 RCHECK(adaptation_field_length <= 182);
854 if (packet_length < 0) {
855 if (buffer[offset + 188] == kMpeg2SyncWord)
857 else if (buffer[offset + 192] == kMpeg2SyncWord)
859 else if (buffer[offset + 204] == kMpeg2SyncWord)
864 offset += packet_length;
869enum Mpeg4StartCodes {
870 VISUAL_OBJECT_SEQUENCE_START_CODE = 0xb0,
871 VISUAL_OBJECT_SEQUENCE_END_CODE = 0xb1,
872 VISUAL_OBJECT_START_CODE = 0xb5,
873 VOP_START_CODE = 0xb6
877static bool CheckMpeg4BitStream(
const uint8_t* buffer,
int buffer_size) {
881 RCHECK(buffer_size > 4);
884 int sequence_start_count = 0;
885 int sequence_end_count = 0;
886 int visual_object_count = 0;
890 if (!AdvanceToStartCode(buffer, buffer_size, &offset, 6, 24, 1)) {
893 return (sequence_start_count > 0 && visual_object_count > 0);
898 BitReader reader(buffer + offset, 6);
899 RCHECK(ReadBits(&reader, 24) == 1);
901 int start_code = ReadBits(&reader, 8);
902 RCHECK(start_code < 0x30 || start_code > 0xaf);
903 RCHECK(start_code < 0xb7 || start_code > 0xb9);
905 switch (start_code) {
906 case VISUAL_OBJECT_SEQUENCE_START_CODE: {
907 ++sequence_start_count;
909 int profile = ReadBits(&reader, 8);
911 RCHECK(profile < 0x04 || profile > 0x10);
912 RCHECK(profile < 0x13 || profile > 0x20);
913 RCHECK(profile < 0x23 || profile > 0x31);
914 RCHECK(profile < 0x35 || profile > 0x41);
915 RCHECK(profile < 0x43 || profile > 0x60);
916 RCHECK(profile < 0x65 || profile > 0x70);
917 RCHECK(profile < 0x73 || profile > 0x80);
918 RCHECK(profile < 0x83 || profile > 0x90);
919 RCHECK(profile < 0x95 || profile > 0xa0);
920 RCHECK(profile < 0xa4 || profile > 0xb0);
921 RCHECK(profile < 0xb5 || profile > 0xc0);
922 RCHECK(profile < 0xc3 || profile > 0xd0);
923 RCHECK(profile < 0xe4);
927 case VISUAL_OBJECT_SEQUENCE_END_CODE:
928 RCHECK(++sequence_end_count == sequence_start_count);
931 case VISUAL_OBJECT_START_CODE: {
932 ++visual_object_count;
933 if (ReadBits(&reader, 1) == 1) {
934 int visual_object_verid = ReadBits(&reader, 4);
935 RCHECK(visual_object_verid > 0 && visual_object_verid < 3);
936 RCHECK(ReadBits(&reader, 3) != 0);
938 int visual_object_type = ReadBits(&reader, 4);
939 RCHECK(visual_object_type > 0 && visual_object_type < 6);
944 RCHECK(++vop_count <= visual_object_count);
953static bool CheckMov(
const uint8_t* buffer,
int buffer_size) {
956 RCHECK(buffer_size > 8);
960 while (offset + 8 < buffer_size) {
961 int atomsize = Read32(buffer + offset);
962 uint32_t atomtype = Read32(buffer + offset + 4);
965 case TAG(
'f',
't',
'y',
'p'):
966 case TAG(
'p',
'd',
'i',
'n'):
967 case TAG(
'b',
'l',
'o',
'c'):
968 case TAG(
'm',
'o',
'o',
'v'):
969 case TAG(
'm',
'o',
'o',
'f'):
970 case TAG(
'm',
'f',
'r',
'a'):
971 case TAG(
'm',
'd',
'a',
't'):
972 case TAG(
'f',
'r',
'e',
'e'):
973 case TAG(
's',
'k',
'i',
'p'):
974 case TAG(
'm',
'e',
't',
'a'):
975 case TAG(
'm',
'e',
'c',
'o'):
976 case TAG(
's',
't',
'y',
'p'):
977 case TAG(
's',
'i',
'd',
'x'):
978 case TAG(
's',
's',
'i',
'x'):
979 case TAG(
'p',
'r',
'f',
't'):
980 case TAG(
'u',
'u',
'i',
'd'):
985 if (++boxes_seen >= 2)
994 if (offset + 16 > buffer_size)
996 if (Read32(buffer + offset + 8) != 0)
998 atomsize = Read32(buffer + offset + 12);
1007enum MPEGVersion { VERSION_25 = 0, VERSION_RESERVED, VERSION_2, VERSION_1 };
1008enum MPEGLayer { L_RESERVED = 0, LAYER_3, LAYER_2, LAYER_1 };
1010static int kSampleRateTable[4][4] = {
1011 {11025, 12000, 8000, 0},
1013 {22050, 24000, 16000, 0},
1014 {44100, 48000, 32000, 0}
1017static int kBitRateTableV1L1[16] = {0, 32, 64, 96, 128, 160, 192, 224,
1018 256, 288, 320, 352, 384, 416, 448, 0};
1019static int kBitRateTableV1L2[16] = {0, 32, 48, 56, 64, 80, 96, 112,
1020 128, 160, 192, 224, 256, 320, 384, 0};
1021static int kBitRateTableV1L3[16] = {0, 32, 40, 48, 56, 64, 80, 96,
1022 112, 128, 160, 192, 224, 256, 320, 0};
1023static int kBitRateTableV2L1[16] = {0, 32, 48, 56, 64, 80, 96, 112,
1024 128, 144, 160, 176, 192, 224, 256, 0};
1025static int kBitRateTableV2L23[16] = {0, 8, 16, 24, 32, 40, 48, 56,
1026 64, 80, 96, 112, 128, 144, 160, 0};
1028static bool ValidMpegAudioFrameHeader(
const uint8_t* header,
1032 DCHECK_GE(header_size, 4);
1034 BitReader reader(header, 4);
1037 RCHECK(ReadBits(&reader, 11) == 0x7ff);
1040 int version = ReadBits(&reader, 2);
1041 RCHECK(version != 1);
1044 int layer = ReadBits(&reader, 2);
1051 int bitrate_index = ReadBits(&reader, 4);
1052 RCHECK(bitrate_index != 0xf);
1055 int sampling_index = ReadBits(&reader, 2);
1056 RCHECK(sampling_index != 3);
1059 int padding = ReadBits(&reader, 1);
1065 int sampling_rate = kSampleRateTable[version][sampling_index];
1067 if (version == VERSION_1) {
1068 if (layer == LAYER_1)
1069 bitrate = kBitRateTableV1L1[bitrate_index];
1070 else if (layer == LAYER_2)
1071 bitrate = kBitRateTableV1L2[bitrate_index];
1073 bitrate = kBitRateTableV1L3[bitrate_index];
1075 if (layer == LAYER_1)
1076 bitrate = kBitRateTableV2L1[bitrate_index];
1078 bitrate = kBitRateTableV2L23[bitrate_index];
1080 if (layer == LAYER_1)
1081 *framesize = ((12000 * bitrate) / sampling_rate + padding) * 4;
1083 *framesize = (144000 * bitrate) / sampling_rate + padding;
1084 return (bitrate > 0 && sampling_rate > 0);
1088static int GetMp3HeaderSize(
const uint8_t* buffer,
int buffer_size) {
1089 DCHECK_GE(buffer_size, 9);
1090 int size = ((buffer[6] & 0x7f) << 21) + ((buffer[7] & 0x7f) << 14) +
1091 ((buffer[8] & 0x7f) << 7) + (buffer[9] & 0x7f) + 10;
1092 if (buffer[5] & 0x10)
1098static bool CheckMp3(
const uint8_t* buffer,
int buffer_size,
bool seenHeader) {
1099 RCHECK(buffer_size >= 10);
1105 offset = GetMp3HeaderSize(buffer, buffer_size);
1108 while (offset < buffer_size && buffer[offset] == 0)
1112 while (offset + 3 < buffer_size) {
1113 RCHECK(ValidMpegAudioFrameHeader(buffer + offset, buffer_size - offset,
1119 offset += framesize;
1129static bool VerifyNumber(
const uint8_t* buffer,
1133 RCHECK(*offset < buffer_size);
1136 while (isspace(buffer[*offset])) {
1138 RCHECK(*offset < buffer_size);
1143 while (--max_digits >= 0 && isdigit(buffer[*offset])) {
1146 if (*offset >= buffer_size)
1151 return (numSeen > 0);
1157static inline bool VerifyCharacters(
const uint8_t* buffer,
1162 RCHECK(*offset < buffer_size);
1163 char c =
static_cast<char>(buffer[(*offset)++]);
1164 return (c == c1 || (c == c2 && c2 != 0));
1168static bool CheckSrt(
const uint8_t* buffer,
int buffer_size) {
1170 RCHECK(buffer_size > 20);
1173 int offset = StartsWith(buffer, buffer_size, UTF8_BYTE_ORDER_MARK) ? 3 : 0;
1174 RCHECK(VerifyNumber(buffer, buffer_size, &offset, 100));
1175 RCHECK(VerifyCharacters(buffer, buffer_size, &offset,
'\n',
'\r'));
1178 while (VerifyCharacters(buffer, buffer_size, &offset,
'\n',
'\r')) {
1185 RCHECK(VerifyNumber(buffer, buffer_size, &offset, 100));
1186 RCHECK(VerifyCharacters(buffer, buffer_size, &offset,
':', 0));
1187 RCHECK(VerifyNumber(buffer, buffer_size, &offset, 2));
1188 RCHECK(VerifyCharacters(buffer, buffer_size, &offset,
':', 0));
1189 RCHECK(VerifyNumber(buffer, buffer_size, &offset, 2));
1190 RCHECK(VerifyCharacters(buffer, buffer_size, &offset,
',',
'.'));
1191 RCHECK(VerifyNumber(buffer, buffer_size, &offset, 3));
1192 RCHECK(VerifyCharacters(buffer, buffer_size, &offset,
' ', 0));
1193 RCHECK(VerifyCharacters(buffer, buffer_size, &offset,
'-', 0));
1194 RCHECK(VerifyCharacters(buffer, buffer_size, &offset,
'-', 0));
1195 RCHECK(VerifyCharacters(buffer, buffer_size, &offset,
'>', 0));
1196 RCHECK(VerifyCharacters(buffer, buffer_size, &offset,
' ', 0));
1197 RCHECK(VerifyNumber(buffer, buffer_size, &offset, 100));
1198 RCHECK(VerifyCharacters(buffer, buffer_size, &offset,
':', 0));
1199 RCHECK(VerifyNumber(buffer, buffer_size, &offset, 2));
1200 RCHECK(VerifyCharacters(buffer, buffer_size, &offset,
':', 0));
1201 RCHECK(VerifyNumber(buffer, buffer_size, &offset, 2));
1202 RCHECK(VerifyCharacters(buffer, buffer_size, &offset,
',',
'.'));
1203 RCHECK(VerifyNumber(buffer, buffer_size, &offset, 3));
1208static int GetElementId(BitReader* reader) {
1212 if (reader->bits_available() >= 8) {
1213 int num_bits_to_read = 0;
1214 static int prefix[] = {0x80, 0x4000, 0x200000, 0x10000000};
1215 for (
int i = 0; i < 4; ++i) {
1216 num_bits_to_read += 7;
1217 if (ReadBits(reader, 1) == 1) {
1218 if (
static_cast<int>(reader->bits_available()) < num_bits_to_read)
1221 return ReadBits(reader, num_bits_to_read) | prefix[i];
1230static uint64_t GetVint(BitReader* reader) {
1234 if (reader->bits_available() >= 8) {
1235 int num_bits_to_read = 0;
1236 for (
int i = 0; i < 8; ++i) {
1237 num_bits_to_read += 7;
1238 if (ReadBits(reader, 1) == 1) {
1239 if (
static_cast<int>(reader->bits_available()) < num_bits_to_read)
1241 return ReadBits(reader, num_bits_to_read);
1248 return (reader->bits_available() / 8) + 2;
1252static bool CheckWebm(
const uint8_t* buffer,
int buffer_size) {
1254 RCHECK(buffer_size > 12);
1256 BitReader reader(buffer, buffer_size);
1259 RCHECK(GetElementId(&reader) == 0x1a45dfa3);
1262 int header_size = GetVint(&reader);
1263 RCHECK(
static_cast<int>(reader.bits_available()) / 8 >= header_size);
1266 while (reader.bits_available() > 0) {
1267 int tag = GetElementId(&reader);
1268 int tagsize = GetVint(&reader);
1278 RCHECK(reader.SkipBits(tagsize * 8));
1283 switch (ReadBits(&reader, 32)) {
1284 case TAG(
'w',
'e',
'b',
'm'):
1286 case TAG(
'm',
'a',
't',
'r'):
1287 return (ReadBits(&reader, 32) == TAG(
'o',
's',
'k',
'a'));
1299 VC1_FRAME_START_CODE = 0x0d,
1300 VC1_ENTRY_POINT_START_CODE = 0x0e,
1301 VC1_SEQUENCE_START_CODE = 0x0f
1305static bool CheckVC1(
const uint8_t* buffer,
int buffer_size) {
1312 RCHECK(buffer_size >= 24);
1315 if (buffer[0] == 0xc5 && Read32(buffer + 4) == 0x04 &&
1316 Read32(buffer + 20) == 0x0c) {
1318 BitReader reader(buffer + 8, 12);
1320 int profile = ReadBits(&reader, 4);
1321 if (profile == 0 || profile == 4) {
1323 reader.SkipBits(3 + 5 + 1);
1326 RCHECK(ReadBits(&reader, 1) == 0);
1332 RCHECK(ReadBits(&reader, 1) == 1);
1335 reader.SkipBits(1 + 1 + 2 + 1);
1338 RCHECK(ReadBits(&reader, 1) == 0);
1342 reader.SkipBits(1 + 1 + 1 + 3 + 2 + 1);
1345 RCHECK(ReadBits(&reader, 1) == 1);
1348 RCHECK(profile == 12);
1349 RCHECK(ReadBits(&reader, 28) == 0);
1353 RCHECK(ReadBits(&reader, 32) <= 8192);
1354 RCHECK(ReadBits(&reader, 32) <= 8192);
1360 int sequence_start_code = 0;
1361 int frame_start_code = 0;
1364 if (!AdvanceToStartCode(buffer, buffer_size, &offset, 5, 24, 1)) {
1368 return (sequence_start_code > 0 && frame_start_code > 0);
1373 BitReader reader(buffer + offset, 5);
1374 RCHECK(ReadBits(&reader, 24) == 1);
1377 switch (ReadBits(&reader, 8)) {
1378 case VC1_SEQUENCE_START_CODE: {
1379 ++sequence_start_code;
1380 switch (ReadBits(&reader, 2)) {
1383 RCHECK(ReadBits(&reader, 2) == 0);
1388 RCHECK(ReadBits(&reader, 3) <= 4);
1389 RCHECK(ReadBits(&reader, 2) == 1);
1395 case VC1_ENTRY_POINT_START_CODE:
1398 RCHECK(sequence_start_code > 0);
1401 case VC1_FRAME_START_CODE:
1413static const char kAmrSignature[] =
"#!AMR";
1414static const uint8_t kAsfSignature[] = {0x30, 0x26, 0xb2, 0x75, 0x8e, 0x66,
1415 0xcf, 0x11, 0xa6, 0xd9, 0x00, 0xaa,
1416 0x00, 0x62, 0xce, 0x6c};
1417static const char kAssSignature[] =
"[Script Info]";
1418static const char kAssBomSignature[] = UTF8_BYTE_ORDER_MARK
"[Script Info]";
1419static const uint8_t kWtvSignature[] = {0xb7, 0xd8, 0x00, 0x20, 0x37, 0x49,
1420 0xda, 0x11, 0xa6, 0x4e, 0x00, 0x07,
1421 0xe9, 0x5e, 0xad, 0x8d};
1426static MediaContainerName LookupContainerByFirst4(
const uint8_t* buffer,
1429 if (buffer_size < 12)
1430 return CONTAINER_UNKNOWN;
1432 uint32_t first4 = Read32(buffer);
1435 if (CheckWebm(buffer, buffer_size))
1436 return CONTAINER_WEBM;
1440 if (StartsWith(buffer, buffer_size, kAsfSignature,
1441 sizeof(kAsfSignature))) {
1442 return CONTAINER_ASF;
1446 case TAG(
'#',
'!',
'A',
'M'):
1447 if (StartsWith(buffer, buffer_size, kAmrSignature))
1448 return CONTAINER_AMR;
1451 case TAG(
'#',
'E',
'X',
'T'):
1452 if (CheckHls(buffer, buffer_size))
1453 return CONTAINER_HLS;
1456 case TAG(
'.',
'R',
'M',
'F'):
1457 if (buffer[4] == 0 && buffer[5] == 0)
1458 return CONTAINER_RM;
1461 case TAG(
'.',
'r',
'a',
'\xfd'):
1462 return CONTAINER_RM;
1464 case TAG(
'B',
'I',
'K',
'b'):
1465 case TAG(
'B',
'I',
'K',
'd'):
1466 case TAG(
'B',
'I',
'K',
'f'):
1467 case TAG(
'B',
'I',
'K',
'g'):
1468 case TAG(
'B',
'I',
'K',
'h'):
1469 case TAG(
'B',
'I',
'K',
'i'):
1470 if (CheckBink(buffer, buffer_size))
1471 return CONTAINER_BINK;
1474 case TAG(
'c',
'a',
'f',
'f'):
1475 if (CheckCaf(buffer, buffer_size))
1476 return CONTAINER_CAF;
1479 case TAG(
'D',
'E',
'X',
'A'):
1480 if (buffer_size > 15 && Read16(buffer + 11) <= 2048 &&
1481 Read16(buffer + 13) <= 2048) {
1482 return CONTAINER_DXA;
1486 case TAG(
'D',
'T',
'S',
'H'):
1487 if (Read32(buffer + 4) == TAG(
'D',
'H',
'D',
'R'))
1488 return CONTAINER_DTSHD;
1498 if (Read32(buffer + 4) != 0 && Read32(buffer + 8) != 0)
1499 return CONTAINER_IRCAM;
1502 case TAG(
'f',
'L',
'a',
'C'):
1503 return CONTAINER_FLAC;
1505 case TAG(
'F',
'L',
'V', 0):
1506 case TAG(
'F',
'L',
'V', 1):
1507 case TAG(
'F',
'L',
'V', 2):
1508 case TAG(
'F',
'L',
'V', 3):
1509 case TAG(
'F',
'L',
'V', 4):
1510 if (buffer[5] == 0 && Read32(buffer + 5) > 8)
1511 return CONTAINER_FLV;
1514 case TAG(
'F',
'O',
'R',
'M'):
1515 switch (Read32(buffer + 8)) {
1516 case TAG(
'A',
'I',
'F',
'F'):
1517 case TAG(
'A',
'I',
'F',
'C'):
1518 return CONTAINER_AIFF;
1522 case TAG(
'M',
'A',
'C',
' '):
1523 return CONTAINER_APE;
1525 case TAG(
'O',
'N',
'2',
' '):
1526 if (Read32(buffer + 8) == TAG(
'O',
'N',
'2',
'f'))
1527 return CONTAINER_AVI;
1530 case TAG(
'O',
'g',
'g',
'S'):
1532 return CONTAINER_OGG;
1535 case TAG(
'R',
'F',
'6',
'4'):
1536 if (buffer_size > 16 && Read32(buffer + 12) == TAG(
'd',
's',
'6',
'4'))
1537 return CONTAINER_WAV;
1540 case TAG(
'R',
'I',
'F',
'F'):
1541 switch (Read32(buffer + 8)) {
1542 case TAG(
'A',
'V',
'I',
' '):
1543 case TAG(
'A',
'V',
'I',
'X'):
1544 case TAG(
'A',
'V',
'I',
'\x19'):
1545 case TAG(
'A',
'M',
'V',
' '):
1546 return CONTAINER_AVI;
1547 case TAG(
'W',
'A',
'V',
'E'):
1548 return CONTAINER_WAV;
1552 case TAG(
'[',
'S',
'c',
'r'):
1553 if (StartsWith(buffer, buffer_size, kAssSignature))
1554 return CONTAINER_ASS;
1557 case TAG(
'\xef',
'\xbb',
'\xbf',
'['):
1558 if (StartsWith(buffer, buffer_size, kAssBomSignature))
1559 return CONTAINER_ASS;
1566 if (CheckDts(buffer, buffer_size))
1567 return CONTAINER_DTS;
1571 if (StartsWith(buffer, buffer_size, kWtvSignature,
1572 sizeof(kWtvSignature))) {
1573 return CONTAINER_WTV;
1577 return CONTAINER_MPEG2PS;
1582 uint32_t first3 = first4 & 0xffffff00;
1584 case TAG(
'C',
'W',
'S', 0):
1585 case TAG(
'F',
'W',
'S', 0):
1586 return CONTAINER_SWF;
1588 case TAG(
'I',
'D',
'3', 0):
1589 if (CheckMp3(buffer, buffer_size, true))
1590 return CONTAINER_MP3;
1595 uint32_t first2 = Read16(buffer);
1598 if (CheckAc3(buffer, buffer_size))
1599 return CONTAINER_AC3;
1600 if (CheckEac3(buffer, buffer_size))
1601 return CONTAINER_EAC3;
1608 if (CheckAac(buffer, buffer_size))
1609 return CONTAINER_AAC;
1614 if (CheckMp3(buffer, buffer_size,
false))
1615 return CONTAINER_MP3;
1617 return CONTAINER_UNKNOWN;
1621const char kWebVtt[] =
"WEBVTT";
1623bool CheckWebVtt(
const uint8_t* buffer,
int buffer_size) {
1625 StartsWith(buffer, buffer_size, UTF8_BYTE_ORDER_MARK) ? 3 : 0;
1627 return StartsWith(buffer + offset, buffer_size - offset,
1628 reinterpret_cast<const uint8_t*
>(kWebVtt),
1629 std::size(kWebVtt) - 1);
1632bool CheckTtml(
const uint8_t* buffer,
int buffer_size) {
1634 if (!StartsWith(buffer, buffer_size,
"<?xml"))
1640 xml::scoped_xml_ptr<xmlDoc> doc(
1641 xmlParseMemory(
reinterpret_cast<const char*
>(buffer), buffer_size));
1645 xmlNodePtr root_node = xmlDocGetRootElement(doc.get());
1646 std::string root_node_name(
reinterpret_cast<const char*
>(root_node->name));
1648 return root_node_name ==
"tt";
1654MediaContainerName DetermineContainer(
const uint8_t* buffer,
int buffer_size) {
1658 if (CheckMov(buffer, buffer_size))
1659 return CONTAINER_MOV;
1663 MediaContainerName result = LookupContainerByFirst4(buffer, buffer_size);
1664 if (result != CONTAINER_UNKNOWN)
1668 if (CheckWebVtt(buffer, buffer_size))
1669 return CONTAINER_WEBVTT;
1672 if (CheckMpeg2ProgramStream(buffer, buffer_size))
1673 return CONTAINER_MPEG2PS;
1674 if (CheckMpeg2TransportStream(buffer, buffer_size))
1675 return CONTAINER_MPEG2TS;
1676 if (CheckMJpeg(buffer, buffer_size))
1677 return CONTAINER_MJPEG;
1678 if (CheckDV(buffer, buffer_size))
1679 return CONTAINER_DV;
1680 if (CheckH261(buffer, buffer_size))
1681 return CONTAINER_H261;
1682 if (CheckH263(buffer, buffer_size))
1683 return CONTAINER_H263;
1684 if (CheckH264(buffer, buffer_size))
1685 return CONTAINER_H264;
1686 if (CheckMpeg4BitStream(buffer, buffer_size))
1687 return CONTAINER_MPEG4BS;
1688 if (CheckVC1(buffer, buffer_size))
1689 return CONTAINER_VC1;
1690 if (CheckSrt(buffer, buffer_size))
1691 return CONTAINER_SRT;
1692 if (CheckGsm(buffer, buffer_size))
1693 return CONTAINER_GSM;
1698 if (AdvanceToStartCode(buffer, buffer_size, &offset, 4, 16, kAc3SyncWord)) {
1699 if (CheckAc3(buffer + offset, buffer_size - offset))
1700 return CONTAINER_AC3;
1701 if (CheckEac3(buffer + offset, buffer_size - offset))
1702 return CONTAINER_EAC3;
1707 if (CheckTtml(buffer, buffer_size))
1708 return CONTAINER_TTML;
1710 return CONTAINER_UNKNOWN;
1713MediaContainerName DetermineContainerFromFormatName(
1714 const std::string& format_name) {
1715 std::string normalized_format_name = format_name;
1716 std::transform(format_name.begin(), format_name.end(),
1717 normalized_format_name.begin(), ::tolower);
1719 if (normalized_format_name ==
"aac" || normalized_format_name ==
"adts") {
1720 return CONTAINER_AAC;
1721 }
else if (normalized_format_name ==
"ac3") {
1722 return CONTAINER_AC3;
1723 }
else if (normalized_format_name ==
"ec3" ||
1724 normalized_format_name ==
"eac3") {
1725 return CONTAINER_EAC3;
1726 }
else if (normalized_format_name ==
"mp3") {
1727 return CONTAINER_MP3;
1728 }
else if (normalized_format_name ==
"webm") {
1729 return CONTAINER_WEBM;
1730 }
else if (normalized_format_name ==
"cmfa" ||
1731 normalized_format_name ==
"cmft" ||
1732 normalized_format_name ==
"cmfv" ||
1733 normalized_format_name ==
"m4a" ||
1734 normalized_format_name ==
"m4s" ||
1735 normalized_format_name ==
"m4v" ||
1736 normalized_format_name ==
"mov" ||
1737 normalized_format_name ==
"mp4" ||
1738 normalized_format_name ==
"ttml+mp4" ||
1739 normalized_format_name ==
"webvtt+mp4" ||
1740 normalized_format_name ==
"vtt+mp4") {
1741 return CONTAINER_MOV;
1742 }
else if (normalized_format_name ==
"ts" ||
1743 normalized_format_name ==
"mpeg2ts") {
1744 return CONTAINER_MPEG2TS;
1745 }
else if (normalized_format_name ==
"wvm") {
1746 return CONTAINER_WVM;
1747 }
else if (normalized_format_name ==
"vtt" ||
1748 normalized_format_name ==
"webvtt") {
1749 return CONTAINER_WEBVTT;
1750 }
else if (normalized_format_name ==
"ttml" ||
1752 normalized_format_name ==
"xml") {
1753 return CONTAINER_TTML;
1755 return CONTAINER_UNKNOWN;
1758MediaContainerName DetermineContainerFromFileName(
1759 const std::string& file_name) {
1760 const size_t pos = file_name.rfind(
'.');
1761 if (pos == std::string::npos)
1762 return CONTAINER_UNKNOWN;
1763 const std::string& file_extension = file_name.substr(pos + 1);
1764 return DetermineContainerFromFormatName(file_extension);
All the methods that are virtual are virtual for mocking.