5#include <packager/media/formats/mp2t/es_parser_h26x.h>
9#include <absl/log/check.h>
10#include <absl/log/log.h>
12#include <packager/macros/logging.h>
13#include <packager/media/base/media_sample.h>
14#include <packager/media/base/offset_byte_queue.h>
15#include <packager/media/base/timestamp.h>
16#include <packager/media/base/video_stream_info.h>
17#include <packager/media/codecs/h26x_byte_to_unit_stream_converter.h>
18#include <packager/media/formats/mp2t/mp2t_common.h>
26const int kStartCodeSize = 3;
27const int kH264NaluHeaderSize = 1;
28const int kH265NaluHeaderSize = 2;
32EsParserH26x::EsParserH26x(
34 std::unique_ptr<H26xByteToUnitStreamConverter> stream_converter,
36 const EmitSampleCB& emit_sample_cb)
38 emit_sample_cb_(emit_sample_cb),
40 es_queue_(new media::OffsetByteQueue()),
41 stream_converter_(std::move(stream_converter)) {}
43EsParserH26x::~EsParserH26x() {}
45bool EsParserH26x::Parse(
const uint8_t* buf,
58 if (pts == kNoTimestamp) {
59 DVLOG(1) <<
"Each video PES should have a PTS";
61 TimingDesc timing_desc;
62 timing_desc.pts = pts;
63 timing_desc.dts = (dts != kNoTimestamp) ? dts : pts;
66 timing_desc_list_.push_back(
67 std::pair<int64_t, TimingDesc>(es_queue_->tail(), timing_desc));
71 const size_t kWarningSize =
73 LOG_IF(WARNING, timing_desc_list_.size() >= kWarningSize)
74 <<
"Unusually large number of cached timestamps ("
75 << timing_desc_list_.size() <<
").";
79 es_queue_->Push(buf, size);
80 return ParseInternal();
83bool EsParserH26x::Flush() {
84 DVLOG(1) <<
"EsParserH26x::Flush";
91 if (type_ == Nalu::kH264) {
92 const uint8_t aud[] = {0x00, 0x00, 0x01, 0x09, 0x00, 0x00, 0x01, 0x09};
93 es_queue_->Push(aud,
sizeof(aud));
95 DCHECK_EQ(Nalu::kH265, type_);
96 const uint8_t aud[] = {0x00, 0x00, 0x01, 0x46, 0x01,
97 0x00, 0x00, 0x01, 0x46, 0x01};
98 es_queue_->Push(aud,
sizeof(aud));
101 RCHECK(ParseInternal());
103 if (pending_sample_) {
105 if (!pending_sample_duration_) {
106 pending_sample_duration_ =
107 CalculateSampleDuration(pending_sample_pps_id_);
109 pending_sample_->set_duration(pending_sample_duration_);
110 emit_sample_cb_(std::move(pending_sample_));
115void EsParserH26x::Reset() {
116 es_queue_.reset(
new media::OffsetByteQueue());
117 current_search_position_ = 0;
118 current_access_unit_position_ = 0;
119 current_video_slice_info_.valid =
false;
120 next_access_unit_position_set_ =
false;
121 next_access_unit_position_ = 0;
122 current_nalu_info_.reset();
123 timing_desc_list_.clear();
124 pending_sample_ = std::shared_ptr<MediaSample>();
125 pending_sample_duration_ = 0;
126 waiting_for_key_frame_ =
true;
129bool EsParserH26x::SearchForNalu(uint64_t* position, Nalu* nalu) {
132 es_queue_->PeekAt(current_search_position_, &es, &es_size);
135 uint64_t start_code_offset;
136 uint8_t start_code_size;
137 const bool start_code_found = NaluReader::FindStartCode(
138 es, es_size, &start_code_offset, &start_code_size);
140 if (!start_code_found) {
142 if (es_size > kStartCodeSize)
143 current_search_position_ += es_size - kStartCodeSize;
148 const uint8_t* next_nalu_ptr = es + start_code_offset + start_code_size;
150 const int64_t next_nalu_size = es_size - start_code_offset - start_code_size;
152 (type_ == Nalu::kH264 ? kH264NaluHeaderSize : kH265NaluHeaderSize)) {
158 current_search_position_ += start_code_offset + start_code_size;
162 if (!next_nalu_info_)
163 next_nalu_info_.reset(
new NaluInfo);
164 if (!next_nalu_info_->nalu.Initialize(type_, next_nalu_ptr, next_nalu_size)) {
166 return SearchForNalu(position, nalu);
168 next_nalu_info_->position = current_search_position_ - start_code_size;
169 next_nalu_info_->start_code_size = start_code_size;
171 const bool current_nalu_set = current_nalu_info_ ? true :
false;
172 if (current_nalu_info_) {
174 *position = current_nalu_info_->position;
176 const uint8_t* current_nalu_ptr =
178 (current_nalu_info_->position + current_nalu_info_->start_code_size) -
179 current_search_position_;
180 const uint64_t current_nalu_size = next_nalu_info_->position -
181 current_nalu_info_->position -
182 current_nalu_info_->start_code_size;
183 CHECK(nalu->Initialize(type_, current_nalu_ptr, current_nalu_size));
185 current_nalu_info_.swap(next_nalu_info_);
186 return current_nalu_set ? true : SearchForNalu(position, nalu);
189bool EsParserH26x::ParseInternal() {
192 VideoSliceInfo video_slice_info;
193 while (SearchForNalu(&position, &nalu)) {
203 if (nalu.can_start_access_unit()) {
204 if (!next_access_unit_position_set_) {
205 next_access_unit_position_set_ =
true;
206 next_access_unit_position_ = position;
208 RCHECK(ProcessNalu(nalu, &video_slice_info));
209 if (nalu.is_vcl() && !video_slice_info.valid) {
212 DCHECK(!current_video_slice_info_.valid);
213 next_access_unit_position_set_ =
false;
216 }
else if (nalu.is_vcl()) {
219 next_access_unit_position_set_ =
false;
227 RCHECK(EmitCurrentAccessUnit());
233 if (!video_slice_info.valid)
238 bool is_first_vcl_nalu =
true;
239 if (type_ == Nalu::kH264) {
240 if (current_video_slice_info_.valid) {
244 video_slice_info.frame_num != current_video_slice_info_.frame_num ||
245 video_slice_info.pps_id != current_video_slice_info_.pps_id;
248 if (!is_first_vcl_nalu) {
251 next_access_unit_position_set_ =
false;
255 DCHECK(next_access_unit_position_set_);
256 RCHECK(EmitCurrentAccessUnit());
259 es_queue_->Trim(next_access_unit_position_);
261 current_access_unit_position_ = next_access_unit_position_;
262 current_video_slice_info_ = video_slice_info;
263 next_access_unit_position_set_ =
false;
268bool EsParserH26x::EmitCurrentAccessUnit() {
269 if (current_video_slice_info_.valid) {
270 if (current_video_slice_info_.is_key_frame)
271 waiting_for_key_frame_ =
false;
272 if (!waiting_for_key_frame_) {
274 EmitFrame(current_access_unit_position_,
275 next_access_unit_position_ - current_access_unit_position_,
276 current_video_slice_info_.is_key_frame,
277 current_video_slice_info_.pps_id));
279 current_video_slice_info_.valid =
false;
284bool EsParserH26x::EmitFrame(int64_t access_unit_pos,
285 int access_unit_size,
289 TimingDesc current_timing_desc = {kNoTimestamp, kNoTimestamp};
290 while (!timing_desc_list_.empty() &&
291 timing_desc_list_.front().first <= access_unit_pos) {
292 current_timing_desc = timing_desc_list_.front().second;
293 timing_desc_list_.pop_front();
295 if (current_timing_desc.pts == kNoTimestamp)
299 DVLOG(LOG_LEVEL_ES) <<
"Emit frame: stream_pos=" << access_unit_pos
300 <<
" size=" << access_unit_size <<
" pts "
301 << current_timing_desc.pts <<
" timing_desc_list size "
302 << timing_desc_list_.size();
305 es_queue_->PeekAt(access_unit_pos, &es, &es_size);
308 std::vector<uint8_t> converted_frame;
309 if (!stream_converter_->ConvertByteStreamToNalUnitStream(es, access_unit_size,
311 DLOG(ERROR) <<
"Failure to convert video frame to unit stream format.";
316 RCHECK(UpdateVideoDecoderConfig(pps_id));
320 std::shared_ptr<MediaSample> media_sample = MediaSample::CopyFrom(
321 converted_frame.data(), converted_frame.size(), is_key_frame);
322 media_sample->set_dts(current_timing_desc.dts);
323 media_sample->set_pts(current_timing_desc.pts);
324 if (pending_sample_) {
325 if (media_sample->dts() <= pending_sample_->dts()) {
326 LOG(WARNING) <<
"[MPEG-2 TS] PID " << pid() <<
" dts "
327 << media_sample->dts()
328 <<
" less than or equal to previous dts "
329 << pending_sample_->dts();
332 const int64_t kArbitrarySmallDuration = 0.001 * kMpeg2Timescale;
333 pending_sample_->set_duration(kArbitrarySmallDuration);
335 int64_t sample_duration = media_sample->dts() - pending_sample_->dts();
336 pending_sample_->set_duration(sample_duration);
338 const int kArbitraryGapScale = 10;
339 if (pending_sample_duration_ &&
340 sample_duration > kArbitraryGapScale * pending_sample_duration_) {
341 LOG(WARNING) <<
"[MPEG-2 TS] PID " << pid() <<
" Possible GAP at dts "
342 << pending_sample_->dts() <<
" with next sample at dts "
343 << media_sample->dts() <<
" (difference "
344 << sample_duration <<
")";
347 pending_sample_duration_ = sample_duration;
349 emit_sample_cb_(std::move(pending_sample_));
351 pending_sample_ = media_sample;
352 pending_sample_pps_id_ = pps_id;
All the methods that are virtual are virtual for mocking.