Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(53)

Side by Side Diff: media/filters/ffmpeg_demuxer.cc

Issue 23702007: Render inband text tracks in the media pipeline (Closed) Base URL: http://git.chromium.org/chromium/src.git@master
Patch Set: modified ffmpeg demuxer unittest Created 7 years, 1 month ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
OLD | NEW
1 // Copyright (c) 2012 The Chromium Authors. All rights reserved. 1 // Copyright (c) 2012 The Chromium Authors. All rights reserved.
2 // Use of this source code is governed by a BSD-style license that can be 2 // Use of this source code is governed by a BSD-style license that can be
3 // found in the LICENSE file. 3 // found in the LICENSE file.
4 4
5 #include "media/filters/ffmpeg_demuxer.h" 5 #include "media/filters/ffmpeg_demuxer.h"
6 6
7 #include <algorithm> 7 #include <algorithm>
8 #include <string> 8 #include <string>
9 9
10 #include "base/base64.h" 10 #include "base/base64.h"
11 #include "base/bind.h" 11 #include "base/bind.h"
12 #include "base/callback.h" 12 #include "base/callback.h"
13 #include "base/callback_helpers.h" 13 #include "base/callback_helpers.h"
14 #include "base/command_line.h"
15 #include "base/memory/scoped_ptr.h" 14 #include "base/memory/scoped_ptr.h"
16 #include "base/message_loop/message_loop.h" 15 #include "base/message_loop/message_loop.h"
17 #include "base/metrics/sparse_histogram.h" 16 #include "base/metrics/sparse_histogram.h"
18 #include "base/stl_util.h"
19 #include "base/strings/string_util.h" 17 #include "base/strings/string_util.h"
20 #include "base/strings/stringprintf.h" 18 #include "base/strings/stringprintf.h"
21 #include "base/task_runner_util.h" 19 #include "base/task_runner_util.h"
22 #include "base/time/time.h" 20 #include "base/time/time.h"
23 #include "media/base/audio_decoder_config.h" 21 #include "media/base/audio_decoder_config.h"
24 #include "media/base/bind_to_loop.h" 22 #include "media/base/bind_to_loop.h"
25 #include "media/base/decoder_buffer.h" 23 #include "media/base/decoder_buffer.h"
26 #include "media/base/decrypt_config.h" 24 #include "media/base/decrypt_config.h"
27 #include "media/base/limits.h" 25 #include "media/base/limits.h"
28 #include "media/base/media_log.h" 26 #include "media/base/media_log.h"
29 #include "media/base/media_switches.h"
30 #include "media/base/video_decoder_config.h" 27 #include "media/base/video_decoder_config.h"
31 #include "media/ffmpeg/ffmpeg_common.h" 28 #include "media/ffmpeg/ffmpeg_common.h"
32 #include "media/filters/ffmpeg_glue.h" 29 #include "media/filters/ffmpeg_glue.h"
33 #include "media/filters/ffmpeg_h264_to_annex_b_bitstream_converter.h" 30 #include "media/filters/ffmpeg_h264_to_annex_b_bitstream_converter.h"
31 #include "media/filters/webvtt_util.h"
34 #include "media/webm/webm_crypto_helpers.h" 32 #include "media/webm/webm_crypto_helpers.h"
35 33
36 namespace media { 34 namespace media {
37 35
38 // 36 //
39 // FFmpegDemuxerStream 37 // FFmpegDemuxerStream
40 // 38 //
41 FFmpegDemuxerStream::FFmpegDemuxerStream( 39 FFmpegDemuxerStream::FFmpegDemuxerStream(
42 FFmpegDemuxer* demuxer, 40 FFmpegDemuxer* demuxer,
43 AVStream* stream) 41 AVStream* stream)
(...skipping 13 matching lines...) Expand all
57 case AVMEDIA_TYPE_AUDIO: 55 case AVMEDIA_TYPE_AUDIO:
58 type_ = AUDIO; 56 type_ = AUDIO;
59 AVStreamToAudioDecoderConfig(stream, &audio_config_, true); 57 AVStreamToAudioDecoderConfig(stream, &audio_config_, true);
60 is_encrypted = audio_config_.is_encrypted(); 58 is_encrypted = audio_config_.is_encrypted();
61 break; 59 break;
62 case AVMEDIA_TYPE_VIDEO: 60 case AVMEDIA_TYPE_VIDEO:
63 type_ = VIDEO; 61 type_ = VIDEO;
64 AVStreamToVideoDecoderConfig(stream, &video_config_, true); 62 AVStreamToVideoDecoderConfig(stream, &video_config_, true);
65 is_encrypted = video_config_.is_encrypted(); 63 is_encrypted = video_config_.is_encrypted();
66 break; 64 break;
65 case AVMEDIA_TYPE_SUBTITLE:
66 type_ = TEXT;
67 break;
67 default: 68 default:
68 NOTREACHED(); 69 NOTREACHED();
69 break; 70 break;
70 } 71 }
71 72
72 // Calculate the duration. 73 // Calculate the duration.
73 duration_ = ConvertStreamTimestamp(stream->time_base, stream->duration); 74 duration_ = ConvertStreamTimestamp(stream->time_base, stream->duration);
74 75
75 if (stream_->codec->codec_id == AV_CODEC_ID_H264) { 76 if (stream_->codec->codec_id == AV_CODEC_ID_H264) {
76 bitstream_converter_.reset( 77 bitstream_converter_.reset(
(...skipping 26 matching lines...) Expand all
103 NOTREACHED() << "Attempted to enqueue packet on a stopped stream"; 104 NOTREACHED() << "Attempted to enqueue packet on a stopped stream";
104 return; 105 return;
105 } 106 }
106 107
107 // Convert the packet if there is a bitstream filter. 108 // Convert the packet if there is a bitstream filter.
108 if (packet->data && bitstream_converter_enabled_ && 109 if (packet->data && bitstream_converter_enabled_ &&
109 !bitstream_converter_->ConvertPacket(packet.get())) { 110 !bitstream_converter_->ConvertPacket(packet.get())) {
110 LOG(ERROR) << "Format conversion failed."; 111 LOG(ERROR) << "Format conversion failed.";
111 } 112 }
112 113
113 // Get side data if any. For now, the only type of side_data is VP8 Alpha. We 114 scoped_refptr<DecoderBuffer> buffer;
114 // keep this generic so that other side_data types in the future can be 115
115 // handled the same way as well. 116 // Get side data if any. For now, the only types of side_data are VP8 Alpha,
117 // and WebVTT id and settings. We keep this generic so that other side_data
118 // types in the future can be handled the same way as well.
116 av_packet_split_side_data(packet.get()); 119 av_packet_split_side_data(packet.get());
117 int side_data_size = 0; 120 if (type() == DemuxerStream::TEXT) {
118 uint8* side_data = av_packet_get_side_data( 121 int id_size = 0;
119 packet.get(), 122 uint8* id_data = av_packet_get_side_data(
120 AV_PKT_DATA_MATROSKA_BLOCKADDITIONAL, 123 packet.get(),
121 &side_data_size); 124 AV_PKT_DATA_WEBVTT_IDENTIFIER,
125 &id_size);
122 126
123 // If a packet is returned by FFmpeg's av_parser_parse2() the packet will 127 int settings_size = 0;
124 // reference inner memory of FFmpeg. As such we should transfer the packet 128 uint8* settings_data = av_packet_get_side_data(
125 // into memory we control. 129 packet.get(),
126 scoped_refptr<DecoderBuffer> buffer; 130 AV_PKT_DATA_WEBVTT_SETTINGS,
127 if (side_data_size > 0) { 131 &settings_size);
132
133 std::vector<uint8> side_data;
134 MakeSideData(id_data, id_data + id_size,
135 settings_data, settings_data + settings_size,
136 &side_data);
137
128 buffer = DecoderBuffer::CopyFrom(packet.get()->data, packet.get()->size, 138 buffer = DecoderBuffer::CopyFrom(packet.get()->data, packet.get()->size,
129 side_data, side_data_size); 139 side_data.data(), side_data.size());
130 } else { 140 } else {
131 buffer = DecoderBuffer::CopyFrom(packet.get()->data, packet.get()->size); 141 int side_data_size = 0;
142 uint8* side_data = av_packet_get_side_data(
143 packet.get(),
144 AV_PKT_DATA_MATROSKA_BLOCKADDITIONAL,
145 &side_data_size);
146
147 // If a packet is returned by FFmpeg's av_parser_parse2() the packet will
148 // reference inner memory of FFmpeg. As such we should transfer the packet
149 // into memory we control.
150 if (side_data_size > 0) {
151 buffer = DecoderBuffer::CopyFrom(packet.get()->data, packet.get()->size,
152 side_data, side_data_size);
153 } else {
154 buffer = DecoderBuffer::CopyFrom(packet.get()->data, packet.get()->size);
155 }
132 } 156 }
133 157
134 if ((type() == DemuxerStream::AUDIO && audio_config_.is_encrypted()) || 158 if ((type() == DemuxerStream::AUDIO && audio_config_.is_encrypted()) ||
135 (type() == DemuxerStream::VIDEO && video_config_.is_encrypted())) { 159 (type() == DemuxerStream::VIDEO && video_config_.is_encrypted())) {
136 scoped_ptr<DecryptConfig> config(WebMCreateDecryptConfig( 160 scoped_ptr<DecryptConfig> config(WebMCreateDecryptConfig(
137 packet->data, packet->size, 161 packet->data, packet->size,
138 reinterpret_cast<const uint8*>(encryption_key_id_.data()), 162 reinterpret_cast<const uint8*>(encryption_key_id_.data()),
139 encryption_key_id_.size())); 163 encryption_key_id_.size()));
140 if (!config) 164 if (!config)
141 LOG(ERROR) << "Creation of DecryptConfig failed."; 165 LOG(ERROR) << "Creation of DecryptConfig failed.";
142 buffer->set_decrypt_config(config.Pass()); 166 buffer->set_decrypt_config(config.Pass());
143 } 167 }
144 168
145 buffer->set_timestamp(ConvertStreamTimestamp( 169 buffer->set_timestamp(ConvertStreamTimestamp(
146 stream_->time_base, packet->pts)); 170 stream_->time_base, packet->pts));
147 buffer->set_duration(ConvertStreamTimestamp( 171 buffer->set_duration(ConvertStreamTimestamp(
(...skipping 117 matching lines...) Expand 10 before | Expand all | Expand 10 after
265 // TODO(scherkus): Remove early return and reenable time-based capacity 289 // TODO(scherkus): Remove early return and reenable time-based capacity
266 // after our data sources support canceling/concurrent reads, see 290 // after our data sources support canceling/concurrent reads, see
267 // http://crbug.com/165762 for details. 291 // http://crbug.com/165762 for details.
268 return !read_cb_.is_null(); 292 return !read_cb_.is_null();
269 293
270 // Try to have one second's worth of encoded data per stream. 294 // Try to have one second's worth of encoded data per stream.
271 const base::TimeDelta kCapacity = base::TimeDelta::FromSeconds(1); 295 const base::TimeDelta kCapacity = base::TimeDelta::FromSeconds(1);
272 return buffer_queue_.IsEmpty() || buffer_queue_.Duration() < kCapacity; 296 return buffer_queue_.IsEmpty() || buffer_queue_.Duration() < kCapacity;
273 } 297 }
274 298
299 TextKind FFmpegDemuxerStream::GetTextKind() const {
300 DCHECK_EQ(type_, DemuxerStream::TEXT);
301
302 if (stream_->disposition & AV_DISPOSITION_CAPTIONS)
303 return kTextCaptions;
304
305 if (stream_->disposition & AV_DISPOSITION_DESCRIPTIONS)
306 return kTextDescriptions;
307
308 if (stream_->disposition & AV_DISPOSITION_METADATA)
309 return kTextMetadata;
310
311 return kTextSubtitles;
312 }
313
314 std::string FFmpegDemuxerStream::GetMetadata(const char* key) const {
315 const AVDictionaryEntry* entry =
316 av_dict_get(stream_->metadata, key, NULL, 0);
317 return (entry == NULL || entry->value == NULL) ? "" : entry->value;
318 }
319
275 // static 320 // static
276 base::TimeDelta FFmpegDemuxerStream::ConvertStreamTimestamp( 321 base::TimeDelta FFmpegDemuxerStream::ConvertStreamTimestamp(
277 const AVRational& time_base, int64 timestamp) { 322 const AVRational& time_base, int64 timestamp) {
278 if (timestamp == static_cast<int64>(AV_NOPTS_VALUE)) 323 if (timestamp == static_cast<int64>(AV_NOPTS_VALUE))
279 return kNoTimestamp(); 324 return kNoTimestamp();
280 325
281 return ConvertFromTimeBase(time_base, timestamp); 326 return ConvertFromTimeBase(time_base, timestamp);
282 } 327 }
283 328
284 // 329 //
285 // FFmpegDemuxer 330 // FFmpegDemuxer
286 // 331 //
287 FFmpegDemuxer::FFmpegDemuxer( 332 FFmpegDemuxer::FFmpegDemuxer(
288 const scoped_refptr<base::MessageLoopProxy>& message_loop, 333 const scoped_refptr<base::MessageLoopProxy>& message_loop,
289 DataSource* data_source, 334 DataSource* data_source,
290 const NeedKeyCB& need_key_cb, 335 const NeedKeyCB& need_key_cb,
336 bool text_enabled,
291 const scoped_refptr<MediaLog>& media_log) 337 const scoped_refptr<MediaLog>& media_log)
292 : host_(NULL), 338 : host_(NULL),
293 message_loop_(message_loop), 339 message_loop_(message_loop),
294 weak_factory_(this), 340 weak_factory_(this),
295 blocking_thread_("FFmpegDemuxer"), 341 blocking_thread_("FFmpegDemuxer"),
296 pending_read_(false), 342 pending_read_(false),
297 pending_seek_(false), 343 pending_seek_(false),
298 data_source_(data_source), 344 data_source_(data_source),
299 media_log_(media_log), 345 media_log_(media_log),
300 bitrate_(0), 346 bitrate_(0),
301 start_time_(kNoTimestamp()), 347 start_time_(kNoTimestamp()),
302 audio_disabled_(false), 348 audio_disabled_(false),
349 text_enabled_(text_enabled),
303 duration_known_(false), 350 duration_known_(false),
304 url_protocol_(data_source, BindToLoop(message_loop_, base::Bind( 351 url_protocol_(data_source, BindToLoop(message_loop_, base::Bind(
305 &FFmpegDemuxer::OnDataSourceError, base::Unretained(this)))), 352 &FFmpegDemuxer::OnDataSourceError, base::Unretained(this)))),
306 need_key_cb_(need_key_cb) { 353 need_key_cb_(need_key_cb) {
307 DCHECK(message_loop_.get()); 354 DCHECK(message_loop_.get());
308 DCHECK(data_source_); 355 DCHECK(data_source_);
309 } 356 }
310 357
311 FFmpegDemuxer::~FFmpegDemuxer() {} 358 FFmpegDemuxer::~FFmpegDemuxer() {}
312 359
(...skipping 84 matching lines...) Expand 10 before | Expand all | Expand 10 after
397 } 444 }
398 } 445 }
399 return NULL; 446 return NULL;
400 } 447 }
401 448
402 base::TimeDelta FFmpegDemuxer::GetStartTime() const { 449 base::TimeDelta FFmpegDemuxer::GetStartTime() const {
403 DCHECK(message_loop_->BelongsToCurrentThread()); 450 DCHECK(message_loop_->BelongsToCurrentThread());
404 return start_time_; 451 return start_time_;
405 } 452 }
406 453
454 void FFmpegDemuxer::AddTextStreams() {
455 DCHECK(message_loop_->BelongsToCurrentThread());
456
457 for (StreamVector::size_type idx = 0; idx < streams_.size(); ++idx) {
458 FFmpegDemuxerStream* stream = streams_[idx];
459 if (stream == NULL || stream->type() != DemuxerStream::TEXT)
460 continue;
461
462 TextKind kind = stream->GetTextKind();
463 std::string title = stream->GetMetadata("title");
464 std::string language = stream->GetMetadata("language");
465
466 host_->AddTextStream(stream, TextTrackConfig(kind, title, language));
467 }
468 }
469
407 // Helper for calculating the bitrate of the media based on information stored 470 // Helper for calculating the bitrate of the media based on information stored
408 // in |format_context| or failing that the size and duration of the media. 471 // in |format_context| or failing that the size and duration of the media.
409 // 472 //
410 // Returns 0 if a bitrate could not be determined. 473 // Returns 0 if a bitrate could not be determined.
411 static int CalculateBitrate( 474 static int CalculateBitrate(
412 AVFormatContext* format_context, 475 AVFormatContext* format_context,
413 const base::TimeDelta& duration, 476 const base::TimeDelta& duration,
414 int64 filesize_in_bytes) { 477 int64 filesize_in_bytes) {
415 // If there is a bitrate set on the container, use it. 478 // If there is a bitrate set on the container, use it.
416 if (format_context->bit_rate > 0) 479 if (format_context->bit_rate > 0)
(...skipping 98 matching lines...) Expand 10 before | Expand all | Expand 10 after
515 // Log the codec detected, whether it is supported or not. 578 // Log the codec detected, whether it is supported or not.
516 UMA_HISTOGRAM_SPARSE_SLOWLY("Media.DetectedVideoCodec", 579 UMA_HISTOGRAM_SPARSE_SLOWLY("Media.DetectedVideoCodec",
517 codec_context->codec_id); 580 codec_context->codec_id);
518 // Ensure the codec is supported. IsValidConfig() also checks that the 581 // Ensure the codec is supported. IsValidConfig() also checks that the
519 // frame size and visible size are valid. 582 // frame size and visible size are valid.
520 AVStreamToVideoDecoderConfig(stream, &video_config, false); 583 AVStreamToVideoDecoderConfig(stream, &video_config, false);
521 584
522 if (!video_config.IsValidConfig()) 585 if (!video_config.IsValidConfig())
523 continue; 586 continue;
524 video_stream = stream; 587 video_stream = stream;
588 } else if (codec_type == AVMEDIA_TYPE_SUBTITLE) {
589 if (codec_context->codec_id != AV_CODEC_ID_WEBVTT || !text_enabled_) {
590 continue;
591 }
525 } else { 592 } else {
526 continue; 593 continue;
527 } 594 }
528 595
529 streams_[i] = new FFmpegDemuxerStream(this, stream); 596 streams_[i] = new FFmpegDemuxerStream(this, stream);
530 max_duration = std::max(max_duration, streams_[i]->duration()); 597 max_duration = std::max(max_duration, streams_[i]->duration());
531 598
532 if (stream->first_dts != static_cast<int64_t>(AV_NOPTS_VALUE)) { 599 if (stream->first_dts != static_cast<int64_t>(AV_NOPTS_VALUE)) {
533 const base::TimeDelta first_dts = ConvertFromTimeBase( 600 const base::TimeDelta first_dts = ConvertFromTimeBase(
534 stream->time_base, stream->first_dts); 601 stream->time_base, stream->first_dts);
535 if (start_time_ == kNoTimestamp() || first_dts < start_time_) 602 if (start_time_ == kNoTimestamp() || first_dts < start_time_)
536 start_time_ = first_dts; 603 start_time_ = first_dts;
537 } 604 }
538 } 605 }
539 606
540 if (!audio_stream && !video_stream) { 607 if (!audio_stream && !video_stream) {
541 status_cb.Run(DEMUXER_ERROR_NO_SUPPORTED_STREAMS); 608 status_cb.Run(DEMUXER_ERROR_NO_SUPPORTED_STREAMS);
542 return; 609 return;
543 } 610 }
544 611
612 if (text_enabled_)
613 AddTextStreams();
614
545 if (format_context->duration != static_cast<int64_t>(AV_NOPTS_VALUE)) { 615 if (format_context->duration != static_cast<int64_t>(AV_NOPTS_VALUE)) {
546 // If there is a duration value in the container use that to find the 616 // If there is a duration value in the container use that to find the
547 // maximum between it and the duration from A/V streams. 617 // maximum between it and the duration from A/V streams.
548 const AVRational av_time_base = {1, AV_TIME_BASE}; 618 const AVRational av_time_base = {1, AV_TIME_BASE};
549 max_duration = 619 max_duration =
550 std::max(max_duration, 620 std::max(max_duration,
551 ConvertFromTimeBase(av_time_base, format_context->duration)); 621 ConvertFromTimeBase(av_time_base, format_context->duration));
552 } else { 622 } else {
553 // The duration is unknown, in which case this is likely a live stream. 623 // The duration is unknown, in which case this is likely a live stream.
554 max_duration = kInfiniteDuration(); 624 max_duration = kInfiniteDuration();
(...skipping 274 matching lines...) Expand 10 before | Expand all | Expand 10 after
829 } 899 }
830 for (size_t i = 0; i < buffered.size(); ++i) 900 for (size_t i = 0; i < buffered.size(); ++i)
831 host_->AddBufferedTimeRange(buffered.start(i), buffered.end(i)); 901 host_->AddBufferedTimeRange(buffered.start(i), buffered.end(i));
832 } 902 }
833 903
834 void FFmpegDemuxer::OnDataSourceError() { 904 void FFmpegDemuxer::OnDataSourceError() {
835 host_->OnDemuxerError(PIPELINE_ERROR_READ); 905 host_->OnDemuxerError(PIPELINE_ERROR_READ);
836 } 906 }
837 907
838 } // namespace media 908 } // namespace media
OLD | NEW

Powered by Google App Engine
This is Rietveld 408576698