content/common/gpu/media/vt_video_encode_accelerator.cc - Issue 1636083003: H264 HW encode using VideoToolbox

Unified Diff: content/common/gpu/media/vt_video_encode_accelerator.cc

Issue 1636083003: H264 HW encode using VideoToolbox (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master

Patch Set: miu@ comments. Created 4 years, 10 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

« content/common/gpu/media/vt_video_encode_accelerator.h ('K') | « content/common/gpu/media/vt_video_encode_accelerator.h ('k') | content/content_common.gypi » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Hide Comments ('s')

Index: content/common/gpu/media/vt_video_encode_accelerator.cc

diff --git a/content/common/gpu/media/vt_video_encode_accelerator.cc b/content/common/gpu/media/vt_video_encode_accelerator.cc

new file mode 100644

index 0000000000000000000000000000000000000000..466c6c4179fee98885971ccf8877060bdc638bb3

--- /dev/null

+++ b/content/common/gpu/media/vt_video_encode_accelerator.cc

@@ -0,0 +1,328 @@

+// Use of this source code is governed by a BSD-style license that can be

+// found in the LICENSE file.

+#include "content/common/gpu/media/vt_video_encode_accelerator.h"

+#include "base/thread_task_runner_handle.h"

+#include "media/base/mac/coremedia_glue.h"

+#include "media/base/mac/corevideo_glue.h"

+#include "media/base/mac/video_frame_mac.h"

+namespace content {

+namespace {

+// Subjectively chosen.

+// TODO(emircan): Check if we can find the actual system capabilities via

+// creating VTCompressionSessions with varying requirements.

+// See crbug.com/584784.

+const size_t kNumInputBuffers = 4;

+const size_t kMaxFrameRateNumerator = 30;

+const size_t kMaxFrameRateDenominator = 1;

+const size_t kMaxResolutionWidth = 4096;

+const size_t kMaxResolutionHeight = 2160;

+// The ratio of |input_visible_size| area to the max expected output

+// BitstreamBuffer size in bytes. VideoToolbox returns variable sized encoded

+// data whereas media::VideoEncodeAccelerator provides a uniform BitstreamBuffer

+// size to fill this data into. This ratio is used to determine a size that

+// would ideally be big enough to fit all frames.

+const size_t kOutputBufferSizeRatio = 10;

+// Container for the associated data of a video frame being processed.

+struct InProgressFrameEncode {

Pawel Osciak 2016/02/08 04:33:42 Could this be a private substruct of VTVEA?

emircan 2016/02/08 23:41:23 Done.

+ const base::TimeDelta timestamp;

+ const base::TimeTicks reference_time;

+ InProgressFrameEncode(base::TimeDelta rtp_timestamp, base::TimeTicks ref_time)

+ : timestamp(rtp_timestamp), reference_time(ref_time) {}

+ private:

+ DISALLOW_IMPLICIT_CONSTRUCTORS(InProgressFrameEncode);

+};

+} // namespace

+struct VTVideoEncodeAccelerator::BitstreamBufferRef {

+ BitstreamBufferRef(int32_t id,

+ scoped_ptr<base::SharedMemory> shm,

Pawel Osciak 2016/02/08 04:33:42 const& perhaps?

emircan 2016/02/08 23:41:23 I cannot use std::move on const scoped_ptr&.

+ size_t size)

+ : id(id), shm(std::move(shm)), size(size) {}

+ const int32_t id;

+ const scoped_ptr<base::SharedMemory> shm;

+ const size_t size;

+ private:

+ DISALLOW_IMPLICIT_CONSTRUCTORS(BitstreamBufferRef);

+};

+VTVideoEncodeAccelerator::VTVideoEncodeAccelerator()

+ : videotoolbox_glue_(VideoToolboxGlue::Get()),

Pawel Osciak 2016/02/08 04:33:43 We used to check this for != nullptr (https://code

emircan 2016/02/08 23:41:23 Hmm, we don't have a similar IsSupported() call thou

+ client_task_runner_(base::ThreadTaskRunnerHandle::Get()) {

+VTVideoEncodeAccelerator::~VTVideoEncodeAccelerator() {

+ DCHECK(thread_checker_.CalledOnValidThread());

+media::VideoEncodeAccelerator::SupportedProfiles

+VTVideoEncodeAccelerator::GetSupportedProfiles() {

+ DVLOG(3) << __FUNCTION__;

+ DCHECK(thread_checker_.CalledOnValidThread());

+ SupportedProfiles profiles;

+ SupportedProfile profile;

+ profile.profile = media::H264PROFILE_BASELINE;

+ profile.max_framerate_numerator = kMaxFrameRateNumerator;

+ profile.max_framerate_denominator = kMaxFrameRateDenominator;

+ profile.max_resolution = gfx::Size(kMaxResolutionWidth, kMaxResolutionHeight);

+ profiles.push_back(profile);

+ return profiles;

+bool VTVideoEncodeAccelerator::Initialize(

+ media::VideoPixelFormat format,

+ const gfx::Size& input_visible_size,

+ media::VideoCodecProfile output_profile,

+ uint32_t initial_bitrate,

+ Client* client) {

+ DVLOG(3) << __FUNCTION__

+ << ": input_format=" << media::VideoPixelFormatToString(format)

+ << ", input_visible_size=" << input_visible_size.ToString()

+ << ", output_profile=" << output_profile

+ << ", initial_bitrate=" << initial_bitrate;

+ DCHECK(thread_checker_.CalledOnValidThread());

+ DCHECK(client);

+ DCHECK_EQ(media::PIXEL_FORMAT_I420, format);

Pawel Osciak 2016/02/08 04:33:42 I'd suggest if()s and careful check for argument v

emircan 2016/02/08 23:41:23 Done.

+ DCHECK_EQ(media::H264PROFILE_BASELINE, output_profile);

Pawel Osciak 2016/02/08 04:33:42 I'd prefer we if()'d profile here nevertheless. Th

emircan 2016/02/08 23:41:24 Done.

+ bitrate_ = initial_bitrate;

+ input_visible_size_ = input_visible_size;

+ if (!ResetCompressionSession()) {

+ DLOG(ERROR) << "Failed creating compression session";

+ return false;

+ }

+ client_ptr_factory_.reset(new base::WeakPtrFactory<Client>(client));

Pawel Osciak 2016/02/08 04:33:42 I'd suggest doing this before calling any methods,

emircan 2016/02/08 23:41:23 Ok, moving it right after the initial ifs.

+ client_ = client_ptr_factory_->GetWeakPtr();

+ client_->RequireBitstreamBuffers(

+ kNumInputBuffers, input_visible_size_,

+ input_visible_size_.GetArea() / kOutputBufferSizeRatio);

+ return true;

+void VTVideoEncodeAccelerator::Encode(

+ const scoped_refptr<media::VideoFrame>& frame,

+ bool force_keyframe) {

+ DVLOG(3) << __FUNCTION__;

+ DCHECK(thread_checker_.CalledOnValidThread());

+ DCHECK(compression_session_);

+ DCHECK(frame);

+ base::TimeTicks ref_time;

+ if (!frame->metadata()->GetTimeTicks(

+ media::VideoFrameMetadata::REFERENCE_TIME, &ref_time)) {

+ ref_time = base::TimeTicks::Now();

+ }

+ auto timestamp_cm = CoreMediaGlue::CMTimeMake(

+ frame->timestamp().InMicroseconds(), USEC_PER_SEC);

+ // Wrap information we'll need after the frame is encoded in a heap object.

+ // We'll get the pointer back from the VideoToolbox completion callback.

+ scoped_ptr<InProgressFrameEncode> request(new InProgressFrameEncode(

+ frame->timestamp(), ref_time));

+ // TODO(emircan): See if we can eliminate a copy here by using

+ // CVPixelBufferPool for the allocation of incoming VideoFrames.

+ base::ScopedCFTypeRef<CVPixelBufferRef> pixel_buffer =

+ media::WrapVideoFrameInCVPixelBuffer(*frame);

+ base::ScopedCFTypeRef<CFDictionaryRef> frame_props =

+ media::video_toolbox::DictionaryWithKeyValue(

+ videotoolbox_glue_->kVTEncodeFrameOptionKey_ForceKeyFrame(),

+ force_keyframe ? kCFBooleanTrue : kCFBooleanFalse);

+ OSStatus status = videotoolbox_glue_->VTCompressionSessionEncodeFrame(

+ compression_session_, pixel_buffer, timestamp_cm,

+ CoreMediaGlue::CMTime{0, 0, 0, 0}, frame_props,

+ reinterpret_cast<void*>(request.release()), nullptr);

+ DLOG_IF(ERROR, status != noErr)

Pawel Osciak 2016/02/08 04:33:42 No need to NOTIFY_ERROR? Can we continue from next

emircan 2016/02/08 23:41:23 Thanks for pointing out. I realize I haven't used

+ << " VTCompressionSessionEncodeFrame failed: " << status;

+void VTVideoEncodeAccelerator::UseOutputBitstreamBuffer(

+ const media::BitstreamBuffer& buffer) {

+ DVLOG(3) << __FUNCTION__;

+ DCHECK(thread_checker_.CalledOnValidThread());

+ DCHECK_GE(buffer.size(), static_cast<size_t>(input_visible_size_.GetArea() /

Pawel Osciak 2016/02/08 04:33:42 I think it'd be better to if() here please.

emircan 2016/02/08 23:41:23 Done.

+ kOutputBufferSizeRatio));

+ scoped_ptr<base::SharedMemory> shm(

+ new base::SharedMemory(buffer.handle(), false));

+ if (!shm->Map(buffer.size())) {

+ DLOG(ERROR) << "Failed mapping shared memory.";

Pawel Osciak 2016/02/08 04:33:42 NOTIFY_ERROR?

emircan 2016/02/08 23:41:23 Done.

+ return;

+ }

+ scoped_ptr<BitstreamBufferRef> buffer_ref(

+ new BitstreamBufferRef(buffer.id(), std::move(shm), buffer.size()));

+ encoder_output_queue_.push_back(std::move(buffer_ref));

Pawel Osciak 2016/02/08 04:33:42 Do we need to wake something up here? If we got En

emircan 2016/02/08 23:41:23 Replied to the later comment.

+void VTVideoEncodeAccelerator::RequestEncodingParametersChange(

+ uint32_t bitrate,

+ uint32_t framerate) {

Pawel Osciak 2016/02/08 04:33:42 If this class cannot handle changing framerate, sh

emircan 2016/02/08 23:41:23 Actually both changes aren't supported, but at lea

+ DVLOG(3) << __FUNCTION__;

+ DCHECK(thread_checker_.CalledOnValidThread());

+ bitrate_ = bitrate;

Pawel Osciak 2016/02/08 04:33:42 We should preferably check input values here.

emircan 2016/02/08 23:41:24 What kind of checks? I found (bitrate < 1) checks

+ if (!compression_session_)

Pawel Osciak 2016/02/08 04:33:42 NOTIFY_ERROR?

emircan 2016/02/08 23:41:24 Done.

+ return;

+ session_property_setter_->SetSessionProperty(

Pawel Osciak 2016/02/08 04:33:42 SetSessionProperty() methods are bool, but we are

emircan 2016/02/08 23:41:24 I will go through them.

+ videotoolbox_glue_->kVTCompressionPropertyKey_AverageBitRate(),

+ static_cast<int32_t>(bitrate_));

+void VTVideoEncodeAccelerator::Destroy() {

+ DVLOG(3) << __FUNCTION__;

+ DCHECK(thread_checker_.CalledOnValidThread());

+ DestroyCompressionSession();

+ delete this;

+// static

+void VTVideoEncodeAccelerator::CompressionCallback(void* encoder_opaque,

Pawel Osciak 2016/02/08 04:33:42 Do we know what thread this is called on? Should

emircan 2016/02/08 23:41:23 No. To quote the documentation: "This function may

+ void* request_opaque,

+ OSStatus status,

+ VTEncodeInfoFlags info,

+ CMSampleBufferRef sbuf) {

+ DVLOG(3) << __FUNCTION__;

+ if (status != noErr)

+ DLOG(ERROR) << " encode failed: " << status;

Pawel Osciak 2016/02/08 04:33:43 NOTIFY_ERROR?

emircan 2016/02/08 23:41:23 Done.

+ if (info & VideoToolboxGlue::kVTEncodeInfo_FrameDropped) {

+ DVLOG(2) << " frame dropped";

+ return;

+ }

+ auto sample_attachments = static_cast<CFDictionaryRef>(CFArrayGetValueAtIndex(

+ CoreMediaGlue::CMSampleBufferGetSampleAttachmentsArray(sbuf, true), 0));

+ const bool keyframe =

+ !CFDictionaryContainsKey(sample_attachments,

+ CoreMediaGlue::kCMSampleAttachmentKey_NotSync());

+ auto encoder = reinterpret_cast<VTVideoEncodeAccelerator*>(encoder_opaque);

+ DCHECK(encoder);

+ if (encoder->encoder_output_queue_.empty()) {

+ DLOG(ERROR) << "No more bitstream buffer to encode into.";

Pawel Osciak 2016/02/08 04:33:42 Please see my previous comment, but I think this c

emircan 2016/02/08 23:41:23 Thanks for pointing out. I didn't know Encode() an

+ encoder->client_task_runner_->PostTask(

+ FROM_HERE, base::Bind(&Client::NotifyError, encoder->client_,

+ kPlatformFailureError));

+ return;

+ }

+ scoped_ptr<VTVideoEncodeAccelerator::BitstreamBufferRef> buffer_ref =

+ std::move(encoder->encoder_output_queue_.front());

+ encoder->encoder_output_queue_.pop_front();

+ size_t used_buffer_size = 0;

+ const bool copy_rv = media::video_toolbox::CopySampleBufferToAnnexBBuffer(

+ sbuf, reinterpret_cast<uint8_t*>(buffer_ref->shm->memory()),

+ buffer_ref->size, keyframe, &used_buffer_size);

+ if (!copy_rv) {

+ DLOG(ERROR) << "Cannot copy output from SampleBuffer to AnnexBBuffer.";

+ encoder->encoder_output_queue_.push_back(std::move(buffer_ref));

+ return;

+ }

+ // This method is NOT called on |client_task_runner_|, so we still need to

Pawel Osciak 2016/02/08 04:33:42 Uhh, if so, I don't think we can access encoder at

emircan 2016/02/08 23:41:23 I am posting a task as you suggest. But why woul

Pawel Osciak 2016/02/18 11:16:14 Concurrent read-only calls to containers are ok, b

+ // post a task back to it to reach |client_|.

+ encoder->client_task_runner_->PostTask(

+ FROM_HERE, base::Bind(&Client::BitstreamBufferReady, encoder->client_,

+ buffer_ref->id, used_buffer_size, keyframe));

+bool VTVideoEncodeAccelerator::ResetCompressionSession() {

+ DCHECK(thread_checker_.CalledOnValidThread());

+ DestroyCompressionSession();

+ base::ScopedCFTypeRef<CFDictionaryRef> encoder_spec =

+ media::video_toolbox::DictionaryWithKeyValue(videotoolbox_glue_

+ ->kVTVideoEncoderSpecification_EnableHardwareAcceleratedVideoEncoder(),

+ kCFBooleanTrue);

+ // Keep these in-sync with those in ConfigureSession().

Pawel Osciak 2016/02/08 04:33:42 Where is ConfigureSession() ?

emircan 2016/02/08 23:41:23 Changed it to ConfigureCompressionSession().

+ CFTypeRef attributes_keys[] = {

+#if defined(OS_IOS)

+ kCVPixelBufferOpenGLESCompatibilityKey,

+#else

+ kCVPixelBufferOpenGLCompatibilityKey,

+#endif

+ kCVPixelBufferIOSurfacePropertiesKey,

+ kCVPixelBufferPixelFormatTypeKey

+ };

+ const int format[] = {

Pawel Osciak 2016/02/08 04:33:42 Is this a fourcc? If so uint32_t please.

emircan 2016/02/08 23:41:24 We need to create CFArrayRef<int> from it.

+ CoreVideoGlue::kCVPixelFormatType_420YpCbCr8BiPlanarVideoRange};

+ CFTypeRef attributes_values[] = {

+ kCFBooleanTrue,

+ media::video_toolbox::DictionaryWithKeysAndValues(nullptr, nullptr, 0)

+ .release(),

+ media::video_toolbox::ArrayWithIntegers(format, arraysize(format))

+ .release()};

+ const base::ScopedCFTypeRef<CFDictionaryRef> attributes =

+ media::video_toolbox::DictionaryWithKeysAndValues(

+ attributes_keys, attributes_values, arraysize(attributes_keys));

+ for (auto& v : attributes_values)

+ CFRelease(v);

+ // Create the compression session.

+ OSStatus status = videotoolbox_glue_->VTCompressionSessionCreate(

+ kCFAllocatorDefault,

+ input_visible_size_.width(),

+ input_visible_size_.height(),

+ CoreMediaGlue::kCMVideoCodecType_H264,

+ encoder_spec,

+ attributes,

+ nullptr /* compressedDataAllocator */,

+ &VTVideoEncodeAccelerator::CompressionCallback,

+ reinterpret_cast<void*>(this),

+ compression_session_.InitializeInto());

+ if (status != noErr) {

+ DLOG(ERROR) << " VTCompressionSessionCreate failed: " << status;

+ return false;

+ }

+ ConfigureCompressionSession();

+ return true;

+void VTVideoEncodeAccelerator::ConfigureCompressionSession() {

+ DCHECK(thread_checker_.CalledOnValidThread());

+ DCHECK(compression_session_);

+ session_property_setter_.reset(

+ new media::video_toolbox::SessionPropertySetter(compression_session_,

+ videotoolbox_glue_));

+ session_property_setter_->SetSessionProperty(

+ videotoolbox_glue_->kVTCompressionPropertyKey_ProfileLevel(),

+ videotoolbox_glue_->kVTProfileLevel_H264_Baseline_AutoLevel());

Pawel Osciak 2016/02/08 04:33:42 Is baseline preferred by us? Normally constrained

emircan 2016/02/08 23:41:24 I discussed this with WebRTC people. I learned tha

Pawel Osciak 2016/02/18 11:16:14 Are we sure that was Baseline, and not Constrained

emircan 2016/03/03 19:18:19 As far as I got answers from WebRTC folks, it is B

+ session_property_setter_->SetSessionProperty(

+ videotoolbox_glue_->kVTCompressionPropertyKey_RealTime(), true);

+ session_property_setter_->SetSessionProperty(

+ videotoolbox_glue_->kVTCompressionPropertyKey_AverageBitRate(),

+ static_cast<int32_t>(bitrate_));

+ session_property_setter_->SetSessionProperty(

+ videotoolbox_glue_->kVTCompressionPropertyKey_AllowFrameReordering(),

+ false);

+void VTVideoEncodeAccelerator::DestroyCompressionSession() {

+ DCHECK(thread_checker_.CalledOnValidThread());

+ if (compression_session_) {

+ videotoolbox_glue_->VTCompressionSessionInvalidate(compression_session_);

+ compression_session_.reset();

+ }

+} // namespace content