Index: media/cast/sender/h264_vt_encoder.cc
diff --git a/media/cast/sender/h264_vt_encoder.cc b/media/cast/sender/h264_vt_encoder.cc
new file mode 100644
index 0000000000000000000000000000000000000000..190de2c6249db2b89b2a3264c9edf67ce091f0d5
--- /dev/null
+++ b/media/cast/sender/h264_vt_encoder.cc
@@ -0,0 +1,813 @@
+// Copyright 2014 The Chromium Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style license that can be
+// found in the LICENSE file.
+
+#include "media/cast/sender/h264_vt_encoder.h"
+
+#include <algorithm>
+#include <ostream>
+#include <string>
+#include <vector>
+
+#include "base/big_endian.h"
+#include "base/bind.h"
+#include "base/bind_helpers.h"
+#include "base/location.h"
+#include "base/logging.h"
+
+namespace media {
+namespace cast {
+
+static const char* GetCVErrorString(CVReturn error) {
+  switch (error) {
+    case kCVReturnSuccess:
+      return "success";
+    case kCVReturnError:
+      return "error";
+    case kCVReturnInvalidArgument:
+      return "invalid argument";
+    case kCVReturnAllocationFailed:
+      return "allocation failed";
+    case kCVReturnInvalidDisplay:
+      return "invalid display";
+    case kCVReturnDisplayLinkAlreadyRunning:
+      return "display link already running";
+    case kCVReturnDisplayLinkNotRunning:
+      return "display link not running";
+    case kCVReturnDisplayLinkCallbacksNotSet:
+      return "display link callback not set";
+    case kCVReturnInvalidPixelFormat:
+      return "invalid pixel format";
+    case kCVReturnInvalidSize:
+      return "invalid size";
+    case kCVReturnInvalidPixelBufferAttributes:
+      return "invalid pixel buffer attributes";
+    case kCVReturnPixelBufferNotOpenGLCompatible:
+      return "pixel buffer not OpenGL compatible";
+    case kCVReturnWouldExceedAllocationThreshold:
+      return "would exceed allocation threshold";
+    case kCVReturnPoolAllocationFailed:
+      return "pool allocation failed";
+    case kCVReturnInvalidPoolAttributes:
+      return "invalid pool attributes";
+    default:
+      return "unknown error";
+  }
+}
+
+static const char* GetVTErrorString(OSStatus error) {
+  switch (error) {
+    case kVTPropertyNotSupportedErr:
+      return "property not supported";
+    case kVTPropertyReadOnlyErr:
+      return "read only property";
+    case kVTParameterErr:
+      return "invalid parameter";
+    case kVTInvalidSessionErr:
+      return "invalid session";
+    case kVTAllocationFailedErr:
+      return "allocation failed";
+    case kVTPixelTransferNotSupportedErr:
+      return "pixel transfer not supported";
+    case kVTCouldNotFindVideoDecoderErr:
+      return "could not find video decoder";
+    case kVTCouldNotCreateInstanceErr:
+      return "could not create instance";
+    case kVTCouldNotFindVideoEncoderErr:
+      return "could not find video encoder";
+    case kVTVideoDecoderBadDataErr:
+      return "video decoder bad data";
+    case kVTVideoDecoderUnsupportedDataFormatErr:
+      return "video decoder unsupported data format";
+    case kVTVideoDecoderMalfunctionErr:
+      return "video decoder malfunction";
+    case kVTVideoEncoderMalfunctionErr:
+      return "video encoder malfunction";
+    case kVTVideoDecoderNotAvailableNowErr:
+      return "video decoder not available";
+    case kVTImageRotationNotSupportedErr:
+      return "image rotation not supported";
+    case kVTVideoEncoderNotAvailableNowErr:
+      return "video encoder not available now";
+    case kVTFormatDescriptionChangeNotSupportedErr:
+      return "format description change not supported";
+    case kVTInsufficientSourceColorDataErr:
+      return "insufficient source color data";
+    case kVTCouldNotCreateColorCorrectionDataErr:
+      return "could not create color correction data";
+    case kVTColorSyncTransformConvertFailedErr:
+      return "ColorSync transform convert failed";
+    case kVTVideoDecoderAuthorizationErr:
+      return "video decoder authorization error";
+    case kVTVideoEncoderAuthorizationErr:
+      return "video encoder authorization error";
+    case kVTColorCorrectionPixelTransferFailedErr:
+      return "color correction pixel transfer failed";
+    case kVTMultiPassStorageIdentifierMismatchErr:
+      return "multi-pass storage identifier mismatch";
+    case kVTMultiPassStorageInvalidErr:
+      return "invalid multi-pass storage";
+    case kVTFrameSiloInvalidTimeStampErr:
+      return "invalid frame silo timestamp";
+    case kVTFrameSiloInvalidTimeRangeErr:
+      return "invalid frame silo time range";
+    case kVTCouldNotFindTemporalFilterErr:
+      return "could not find temporal filter";
+    case kVTPixelTransferNotPermittedErr:
+      return "pixel transfer not permitted";
+    default:
+      return "unknown error";
+  }
+}
+
+#pragma mark -
Robert Sesek
2014/08/07 22:49:23
Chrome doesn't typically do this.
jfroy
2014/08/07 23:06:11
Acknowledged.
+
+// Utility functions to log CFTypes.
+
+std::ostream& operator<<(std::ostream& out, const CFStringRef& cfstring) {
Robert Sesek
2014/08/07 22:49:22
All these ostream functions are just to support DLOG/DVLOG?
jfroy
2014/08/07 23:06:11
Acknowledged.
+  if (!cfstring) {
+    return out << "null";
+  }
+
+  const char* c_str;
+  c_str = CFStringGetCStringPtr(cfstring, kCFStringEncodingASCII);
+  if (c_str) {
+    return out << c_str;
+  }
+  c_str = CFStringGetCStringPtr(cfstring, kCFStringEncodingUTF8);
+  if (c_str) {
+    return out << c_str;
+  }
+
+  CFIndex length = CFStringGetLength(cfstring);
+  size_t size =
+      CFStringGetMaximumSizeForEncoding(length, kCFStringEncodingUTF8) + 1;
+  // Size the buffer up front: CFStringGetCString writes up to |size| bytes,
+  // so reserve() alone would be undefined behavior.
+  std::vector<char> c_str_buf(size);
+  CFStringGetCString(cfstring, c_str_buf.data(), size, kCFStringEncodingUTF8);
+  return out << c_str_buf.data();
+}
+
+std::ostream& operator<<(std::ostream& out, const CFNumberRef& cfnumber) {
+  if (!cfnumber) {
+    return out << "null";
+  }
+
+  base::ScopedCFTypeRef<CFNumberFormatterRef> formatter(CFNumberFormatterCreate(
+      kCFAllocatorDefault, CFLocaleGetSystem(), kCFNumberFormatterNoStyle));
+  base::ScopedCFTypeRef<CFStringRef> as_str(
+      CFNumberFormatterCreateStringWithNumber(
+          kCFAllocatorDefault, formatter, cfnumber));
+  return out << as_str;
+}
+
+std::ostream& operator<<(std::ostream& out, const CFBooleanRef& cfboolean) {
+  if (!cfboolean) {
+    return out << "null";
+  }
+
+  base::ScopedCFTypeRef<CFStringRef> as_str(
+      CFBooleanGetValue(cfboolean) ? CFSTR("true") : CFSTR("false"));
+  return out << as_str;
+}
+
+struct CFTypeEmittable {
+  explicit CFTypeEmittable(CFTypeRef cfobject) : cfobject_(cfobject) {}
+  explicit operator bool() const { return cfobject_ != nullptr; }
+  operator CFTypeRef() const { return cfobject_; }
+  CFTypeRef get() const { return cfobject_; }
+  friend std::ostream& operator<<(std::ostream&, const CFTypeEmittable&);
+  CFTypeRef cfobject_;
+};
+
+std::ostream& operator<<(std::ostream& out, const CFTypeEmittable& emittable) {
+  if (!emittable) {
+    return out << "null";
+  }
+
+  if (CFGetTypeID(emittable) == CFStringGetTypeID()) {
+    return out << static_cast<CFStringRef>(emittable.get());
+  } else if (CFGetTypeID(emittable) == CFNumberGetTypeID()) {
+    return out << static_cast<CFNumberRef>(emittable.get());
+  } else if (CFGetTypeID(emittable) == CFBooleanGetTypeID()) {
+    return out << static_cast<CFBooleanRef>(emittable.get());
+  }
+  base::ScopedCFTypeRef<CFStringRef> as_str(CFCopyDescription(emittable));
+  return out << as_str;
+}
+
+std::ostream& operator<<(std::ostream& out, const CMTime& time) {
+  return out << "{value=" << time.value << ", timescale=" << time.timescale
+             << ", flags=" << time.flags << ", epoch=" << time.epoch << "}";
+}
+
+std::ostream& operator<<(std::ostream& out,
+                         const CMSampleTimingInfo& timing_info) {
+  return out << "{duration=" << timing_info.duration
+             << ", pts=" << timing_info.presentationTimeStamp
+             << ", dts=" << timing_info.decodeTimeStamp << "}";
+}
+
+#pragma mark -
+
+template <typename T>
+bool SetSessionProperty(VTSessionRef session,
Robert Sesek
2014/08/07 22:49:22
Is this really templatized for just logging purposes?
jfroy
2014/08/07 23:06:11
Mostly yes, but it's also nice to have setters with typed values.
+                        CFStringRef key,
+                        T value,
+                        CFTypeRef cfvalue) {
+  DVLOG(3) << __func__ << ": " << key << "=" << value;
+  OSStatus status = VTSessionSetProperty(session, key, cfvalue);
+  if (status != noErr) {
+    DLOG(ERROR) << __func__
+                << " VTSessionSetProperty failed: " << GetVTErrorString(status)
+                << " (" << status << ") " << key << "=" << value;
+  }
+  return status == noErr;
+}
+
+static bool SetSessionProperty(VTSessionRef session,
+                               CFStringRef key,
+                               uint32_t value) {
+  base::ScopedCFTypeRef<CFNumberRef> cfvalue(
+      CFNumberCreate(nullptr, kCFNumberSInt32Type, &value));
+  return SetSessionProperty(session, key, value, cfvalue);
+}
+
+static bool SetSessionProperty(VTSessionRef session,
+                               CFStringRef key,
+                               bool value) {
+  CFBooleanRef cfvalue = (value) ? kCFBooleanTrue : kCFBooleanFalse;
+  return SetSessionProperty(session, key, value, cfvalue);
+}
+
+static bool SetSessionProperty(VTSessionRef session,
+                               CFStringRef key,
+                               CFStringRef value) {
+  return SetSessionProperty(session, key, value, value);
+}
+
+static base::ScopedCFTypeRef<CFDictionaryRef> DictionaryWithKeyValue(
+    CFTypeRef key,
+    CFTypeRef value) {
+  CFTypeRef keys[1] = {key};
+  CFTypeRef values[1] = {value};
+  return base::ScopedCFTypeRef<CFDictionaryRef>(
+      CFDictionaryCreate(kCFAllocatorDefault,
+                         keys,
+                         values,
+                         1,
+                         &kCFTypeDictionaryKeyCallBacks,
+                         &kCFTypeDictionaryValueCallBacks));
+}
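
DictionaryWithKeyValue relies on the standard kCFType callbacks, so the
dictionary retains its key and value and releases them when it is destroyed.
A minimal standalone sketch of the same pattern (CoreFoundation only; main()
and the literal key and value are illustrative, not part of this patch):

    #include <CoreFoundation/CoreFoundation.h>
    #include <cassert>

    int main() {
      CFTypeRef keys[1] = {CFSTR("AverageBitRate")};
      int bitrate = 2000000;
      CFNumberRef value =
          CFNumberCreate(kCFAllocatorDefault, kCFNumberIntType, &bitrate);
      CFTypeRef values[1] = {value};
      CFDictionaryRef dict =
          CFDictionaryCreate(kCFAllocatorDefault, keys, values, 1,
                             &kCFTypeDictionaryKeyCallBacks,
                             &kCFTypeDictionaryValueCallBacks);
      // The kCFType callbacks retained |value|, so the dictionary keeps its
      // own reference and ours can be dropped.
      CFRelease(value);
      int out = 0;
      CFNumberGetValue(static_cast<CFNumberRef>(CFDictionaryGetValue(
                           dict, CFSTR("AverageBitRate"))),
                       kCFNumberIntType, &out);
      assert(out == 2000000);
      CFRelease(dict);
      return 0;
    }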
+
+#pragma mark -
+
+struct H264VideoToolboxEncoder::FrameContext {
+  base::TimeTicks capture_time;
+  FrameEncodedCallback frame_encoded_callback;
+};
+
+H264VideoToolboxEncoder::H264VideoToolboxEncoder(
+    scoped_refptr<CastEnvironment> cast_environment,
+    const VideoSenderConfig& video_config)
+    : cast_environment_(cast_environment),
+      cast_config_(video_config),
+      frame_id_(kStartFrameId),
+      last_keyframe_id_(kStartFrameId),
+      encode_next_frame_as_keyframe_(false) {
+  Initialize();
Robert Sesek
2014/08/07 22:49:23
You only call this here, so why is it a separate method?
jfroy
2014/08/07 23:06:11
The current code doesn't do it, but I have a suspicion it will need to be called from elsewhere eventually.
+}
+
+H264VideoToolboxEncoder::~H264VideoToolboxEncoder() {
+  Teardown();
Robert Sesek
2014/08/07 22:49:22
Same.
jfroy
2014/08/07 23:06:11
See my reply above.
+}
+
+CVPixelBufferPoolRef H264VideoToolboxEncoder::cv_pixel_buffer_pool() const {
+  DCHECK(thread_checker_.CalledOnValidThread());
+  DCHECK(compression_session_);
+  return VTCompressionSessionGetPixelBufferPool(compression_session_);
+}
+
+void H264VideoToolboxEncoder::Initialize() {
+  DCHECK(thread_checker_.CalledOnValidThread());
+  DCHECK(!compression_session_);
+
+  DVLOG(3) << __func__ << " width: " << cast_config_.width
+           << ", height: " << cast_config_.height
+           << ", start_bitrate: " << cast_config_.start_bitrate
+           << ", max_frame_rate: " << cast_config_.max_frame_rate;
+
+  // Note that the encoder object is given to the compression session as the
+  // callback context using a raw pointer. The C API does not allow us to use
+  // a smart pointer, nor is this encoder ref counted. However, this is still
+  // safe because 1) we own the compression session and 2) we tear it down
+  // safely. When destructing the encoder, the compression session is flushed
+  // and invalidated. Internally, VideoToolbox will join all of its threads
+  // before returning to the client. Therefore, when control returns to us, we
+  // are guaranteed that the output callback will not execute again.
+
+  // On OS X, allow the hardware encoder, but don't require it: it does not
+  // support all configurations (some of which are used for testing).
+  DictionaryPtr encoder_spec(nullptr);
+#if !defined(OS_IOS)
+  encoder_spec = DictionaryWithKeyValue(
+      kVTVideoEncoderSpecification_EnableHardwareAcceleratedVideoEncoder,
+      kCFBooleanTrue);
+#endif
+
+  VTCompressionSessionRef session;
+  OSStatus status =
+      VTCompressionSessionCreate(kCFAllocatorDefault,
+                                 cast_config_.width,
+                                 cast_config_.height,
+                                 kCMVideoCodecType_H264,
+                                 encoder_spec,
+                                 nullptr /* sourceImageBufferAttributes */,
+                                 nullptr /* compressedDataAllocator */,
+                                 CompressionCallback,
+                                 reinterpret_cast<void*>(this),
+                                 &session);
+  if (status != noErr) {
+    DLOG(ERROR) << __func__ << " VTCompressionSessionCreate failed: "
+                << GetVTErrorString(status) << " (" << status << ")";
+    return;
+  }
+  compression_session_.reset(session);
+
+#if defined(OS_IOS)
+  using_hardware_ = true;
+#else
+  CFBooleanRef using_hardware_cf = nullptr;
+  status = VTSessionCopyProperty(
+      session,
+      kVTCompressionPropertyKey_UsingHardwareAcceleratedVideoEncoder,
+      kCFAllocatorDefault,
+      &using_hardware_cf);
+  if (status == noErr) {
+    using_hardware_ = CFBooleanGetValue(using_hardware_cf);
+    CFRelease(using_hardware_cf);
+  }
+  DVLOG(3) << __func__ << " using hardware: " << using_hardware_;
+#endif
+
+  ConfigureSession();
+}
+
+static void SetConfigurationApplier(CFStringRef key,
+                                    CFTypeRef value,
+                                    VTCompressionSessionRef session) {
+  SetSessionProperty(session, key, CFTypeEmittable(value), value);
+}
+
+void H264VideoToolboxEncoder::ConfigureSession() {
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_ProfileLevel,
+                     kVTProfileLevel_H264_Main_AutoLevel);
+
+  SetSessionProperty(
+      compression_session_, kVTCompressionPropertyKey_RealTime, true);
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_AllowFrameReordering,
+                     false);
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_MaxKeyFrameInterval,
+                     240u);
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_MaxKeyFrameIntervalDuration,
+                     240u);
+
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_AverageBitRate,
+                     static_cast<uint32_t>(cast_config_.start_bitrate));
+
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_ExpectedFrameRate,
+                     static_cast<uint32_t>(cast_config_.max_frame_rate));
+
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_ColorPrimaries,
+                     kCVImageBufferColorPrimaries_ITU_R_709_2);
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_TransferFunction,
+                     kCVImageBufferTransferFunction_ITU_R_709_2);
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_YCbCrMatrix,
+                     kCVImageBufferYCbCrMatrix_ITU_R_709_2);
+
+  if (compression_properties_) {
+    CFDictionaryApplyFunction(
+        compression_properties_,
+        reinterpret_cast<CFDictionaryApplierFunction>(SetConfigurationApplier),
+        compression_session_.get());
+  }
+}
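
SetSessionProperty only logs failures, so nothing above confirms that a
property actually took effect. Where that matters, the value can be read back
with VTSessionCopyProperty. A hedged sketch (the helper name
VerifyUint32Property is illustrative, not part of this patch):

    static bool VerifyUint32Property(VTSessionRef session,
                                     CFStringRef key,
                                     uint32_t expected) {
      CFNumberRef cfvalue = nullptr;
      OSStatus status =
          VTSessionCopyProperty(session, key, kCFAllocatorDefault, &cfvalue);
      if (status != noErr || !cfvalue)
        return false;
      uint32_t actual = 0;
      CFNumberGetValue(cfvalue, kCFNumberSInt32Type, &actual);
      CFRelease(cfvalue);
      return actual == expected;
    }

For example, calling it with kVTCompressionPropertyKey_AverageBitRate after
ConfigureSession() would confirm whether the bitrate request was accepted.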
+
+void H264VideoToolboxEncoder::Teardown() {
+  DCHECK(thread_checker_.CalledOnValidThread());
+
+  // If the compression session exists, invalidate it. This blocks until all
+  // pending output callbacks have returned and any internal threads have
+  // joined, ensuring no output callback ever sees a dangling encoder pointer.
+  if (compression_session_) {
+    VTCompressionSessionInvalidate(compression_session_);
+    compression_session_.reset();
+  }
+}
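
The raw-pointer callback context set up in Initialize() is only safe because
this invalidate-before-destroy ordering blocks until every pending callback
has returned. A self-contained analog of that contract, with a toy session
standing in for VideoToolbox (all names here are illustrative):

    #include <thread>

    // Toy stand-in for a C API that invokes a callback on its own thread.
    struct ToySession {
      void (*callback)(void* ctx);
      void* ctx;
      std::thread worker;
      void Start() { worker = std::thread([this] { callback(ctx); }); }
      // Like VTCompressionSessionInvalidate: joins the worker thread, so no
      // callback can run after this returns.
      void Invalidate() {
        if (worker.joinable())
          worker.join();
      }
    };

    struct Encoder {
      ToySession session;
      Encoder() {
        session.callback = [](void* ctx) {
          static_cast<Encoder*>(ctx)->OnOutput();
        };
        session.ctx = this;  // Raw pointer, exactly as in Initialize().
        session.Start();
      }
      // Invalidate() runs before members are destroyed, so |this| outlives
      // every callback.
      ~Encoder() { session.Invalidate(); }
      void OnOutput() {}
    };

    int main() {
      Encoder encoder;
      return 0;
    }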
+
+#pragma mark -
+
+bool H264VideoToolboxEncoder::EncodeVideoFrame(
+    const scoped_refptr<media::VideoFrame>& video_frame,
+    const base::TimeTicks& capture_time,
+    const FrameEncodedCallback& frame_encoded_callback) {
+  DCHECK(thread_checker_.CalledOnValidThread());
+
+  if (!compression_session_) {
+    DLOG(ERROR) << __func__ << " compression session is null";
+    return false;
+  }
+
+  PixelBufferPtr pixel_buffer(video_frame->cv_pixel_buffer(),
+                              base::scoped_policy::RETAIN);
+  if (!pixel_buffer) {
+    pixel_buffer = WrapVideoFrame(video_frame);
+    if (!pixel_buffer) {
+      return false;
+    }
+  }
+
+  CMTime timestamp_cm;
+  if (capture_time.is_null()) {
+    timestamp_cm = kCMTimeInvalid;
+  } else {
+    timestamp_cm = CMTimeMake(capture_time.ToInternalValue(), USEC_PER_SEC);
+  }
+
+  FrameContext* fc = new FrameContext();
+  fc->capture_time = capture_time;
+  fc->frame_encoded_callback = frame_encoded_callback;
+
+  DVLOG(3) << __func__ << " pts: " << timestamp_cm;
+
+  DictionaryPtr frame_props(nullptr);
+  if (encode_next_frame_as_keyframe_) {
+    frame_props = DictionaryWithKeyValue(kVTEncodeFrameOptionKey_ForceKeyFrame,
+                                         kCFBooleanTrue);
+    encode_next_frame_as_keyframe_ = false;
+  }
+
+  VTEncodeInfoFlags info;
+  OSStatus status = VTCompressionSessionEncodeFrame(compression_session_,
+                                                    pixel_buffer,
+                                                    timestamp_cm,
+                                                    kCMTimeInvalid,
+                                                    frame_props,
+                                                    reinterpret_cast<void*>(fc),
+                                                    &info);
+  if (status != noErr) {
+    DLOG(ERROR) << __func__ << " VTCompressionSessionEncodeFrame failed: "
+                << GetVTErrorString(status) << " (" << status << ")";
+    // The output callback will never run for this frame, so free the context
+    // here to avoid leaking it.
+    delete fc;
+    return false;
+  }
+  if ((info & kVTEncodeInfo_FrameDropped)) {
+    DLOG(ERROR) << __func__ << " frame dropped";
+    return false;
+  }
+
+  return true;
+}
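
The CMTimeMake call above maps base::TimeTicks' internal microsecond count
onto a CMTime with a microseconds-per-second timescale. A standalone check of
that mapping (CoreMedia only; the sample value and the local kUsecPerSec
constant, equal to USEC_PER_SEC, are illustrative):

    #include <CoreMedia/CoreMedia.h>
    #include <cassert>
    #include <cstdint>

    int main() {
      const int32_t kUsecPerSec = 1000000;  // Same value as USEC_PER_SEC.
      // 2.5 seconds expressed in microseconds, as TimeTicks stores it.
      const int64_t ticks_us = 2500000;
      CMTime t = CMTimeMake(ticks_us, kUsecPerSec);
      // CMTimeGetSeconds recovers the original duration exactly here.
      assert(CMTimeGetSeconds(t) == 2.5);
      return 0;
    }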
+
+void H264VideoToolboxEncoder::SetBitRate(int new_bit_rate) {
+  DCHECK(thread_checker_.CalledOnValidThread());
+  // NOTE: VideoToolbox does not seem to support bitrate reconfiguration.
+}
+
+void H264VideoToolboxEncoder::GenerateKeyFrame() {
+  DCHECK(thread_checker_.CalledOnValidThread());
+  DCHECK(compression_session_);
+
+  encode_next_frame_as_keyframe_ = true;
+}
+
+void H264VideoToolboxEncoder::LatestFrameIdToReference(uint32 /*frame_id*/) {
+}
+
+#pragma mark -
+
+static void VideoFramePixelBufferReleaseCallback(void* frame_ref,
+                                                 const void* data,
+                                                 size_t size,
+                                                 size_t num_planes,
+                                                 const void* planes[]) {
+  free(const_cast<void*>(data));
+  reinterpret_cast<media::VideoFrame*>(frame_ref)->Release();
+}
+
+H264VideoToolboxEncoder::PixelBufferPtr H264VideoToolboxEncoder::WrapVideoFrame(
+    const scoped_refptr<media::VideoFrame>& frame) {
+  static const size_t MAX_PLANES = 3;
+
+  media::VideoFrame::Format format = frame->format();
+  size_t num_planes = media::VideoFrame::NumPlanes(format);
+  gfx::Size coded_size = frame->coded_size();
+
+  // media::VideoFrame only supports YUV formats, so there is no way to
+  // leverage VideoToolbox's ability to convert RGBA formats automatically. In
+  // addition, most of the media::VideoFrame formats are YVU, which VT does not
+  // support. Finally, media::VideoFrame formats do not carry any information
+  // about the color space, transform or any other colorimetric information
+  // that is generally needed to fully specify the input data. So essentially
+  // require that the input be YCbCr 4:2:0 (either planar or biplanar) and
+  // assume the standard video dynamic range for samples (although most modern
+  // HDTVs support full-range video these days).
+  OSType pixel_format;
+  if (format == media::VideoFrame::Format::I420) {
+    pixel_format = kCVPixelFormatType_420YpCbCr8Planar;
+  } else if (format == media::VideoFrame::Format::NV12) {
+    pixel_format = kCVPixelFormatType_420YpCbCr8BiPlanarVideoRange;
+  } else {
+    DLOG(ERROR) << __func__ << " unsupported frame format: " << format;
+    return PixelBufferPtr(nullptr);
+  }
+
+  // TODO(jfroy): Support extended pixels (i.e. padding).
+  if (frame->coded_size() != frame->visible_rect().size()) {
+    DLOG(ERROR) << __func__ << " frame with extended pixels not supported:"
+                << " coded_size: " << coded_size.ToString()
+                << ", visible_rect: " << frame->visible_rect().ToString();
+    return PixelBufferPtr(nullptr);
+  }
+
+  DCHECK_LE(num_planes, MAX_PLANES);
+  void* plane_ptrs[MAX_PLANES];
+  size_t plane_widths[MAX_PLANES];
+  size_t plane_heights[MAX_PLANES];
+  size_t plane_bytes_per_row[MAX_PLANES];
+  for (size_t plane_i = 0; plane_i < num_planes; ++plane_i) {
+    plane_ptrs[plane_i] = frame->data(plane_i);
+    gfx::Size plane_size =
+        media::VideoFrame::PlaneSize(format, plane_i, coded_size);
+    plane_widths[plane_i] = plane_size.width();
+    plane_heights[plane_i] = plane_size.height();
+    plane_bytes_per_row[plane_i] = frame->stride(plane_i);
+  }
+
+  // CVPixelBufferCreateWithPlanarBytes needs a dummy plane descriptor or the
+  // release callback will not execute. The descriptor is freed in the callback.
+  void* descriptor =
+      calloc(1,
+             std::max(sizeof(CVPlanarPixelBufferInfo_YCbCrPlanar),
+                      sizeof(CVPlanarPixelBufferInfo_YCbCrBiPlanar)));
+
+  // Wrap the frame's data in a CVPixelBuffer. Because this is a C API, we can't
+  // give it a smart pointer to the frame, so instead pass a raw pointer and
+  // increment the frame's reference count manually.
+  CVPixelBufferRef pixel_buffer;
+  CVReturn result =
+      CVPixelBufferCreateWithPlanarBytes(kCFAllocatorDefault,
+                                         coded_size.width(),
+                                         coded_size.height(),
+                                         pixel_format,
+                                         descriptor,
+                                         0,
+                                         num_planes,
+                                         plane_ptrs,
+                                         plane_widths,
+                                         plane_heights,
+                                         plane_bytes_per_row,
+                                         VideoFramePixelBufferReleaseCallback,
+                                         frame.get(),
+                                         nullptr,
+                                         &pixel_buffer);
+  if (result != kCVReturnSuccess) {
+    DLOG(ERROR) << __func__ << " CVPixelBufferCreateWithPlanarBytes failed: "
+                << GetCVErrorString(result) << " (" << result << ")";
+    return PixelBufferPtr(nullptr);
+  }
+
+  // The CVPixelBuffer now references the data of the frame, so increment its
+  // reference count manually. The release callback set on the pixel buffer will
+  // release the frame.
+  frame->AddRef();
+
+  return PixelBufferPtr(pixel_buffer);
+}
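
WrapVideoFrame relies on media::VideoFrame::PlaneSize reporting half-size
chroma planes for 4:2:0 input. A standalone sketch of that geometry (plain
arithmetic, no media:: dependencies; the 1280x720 figures are just an
example):

    #include <cassert>
    #include <cstddef>

    int main() {
      const size_t width = 1280, height = 720;
      // I420: a full-resolution Y plane, then Cb and Cr at half resolution
      // in both dimensions.
      const size_t plane_widths[3] = {width, width / 2, width / 2};
      const size_t plane_heights[3] = {height, height / 2, height / 2};
      size_t total = 0;
      for (int i = 0; i < 3; ++i)
        total += plane_widths[i] * plane_heights[i];
      // 4:2:0 sampling at 8 bits per sample averages 1.5 bytes per pixel.
      assert(total == width * height * 3 / 2);
      return 0;
    }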
+
+#pragma mark -
+
+void H264VideoToolboxEncoder::CompressionCallback(void* encoder_opaque,
+                                                  void* frame_opaque,
+                                                  OSStatus status,
+                                                  VTEncodeInfoFlags info,
+                                                  CMSampleBufferRef sbuf) {
+  H264VideoToolboxEncoder* encoder =
+      reinterpret_cast<H264VideoToolboxEncoder*>(encoder_opaque);
+  scoped_ptr<FrameContext> fc(reinterpret_cast<FrameContext*>(frame_opaque));
+
+  if (status != noErr) {
+    DLOG(ERROR) << __func__ << " encoding failed: " << GetVTErrorString(status)
+                << " (" << status << ")";
+    return;
+  }
+  if ((info & kVTEncodeInfo_FrameDropped)) {
+    DVLOG(2) << __func__ << " frame dropped";
+    return;
+  }
+  CMItemCount sample_count = CMSampleBufferGetNumSamples(sbuf);
+  if (sample_count != 1) {
+    DLOG(ERROR) << __func__
+                << " expected exactly one sample in sample buffer, got: "
+                << sample_count;
+    return;
+  }
+
+  CFDictionaryRef sample_attachments =
+      static_cast<CFDictionaryRef>(CFArrayGetValueAtIndex(
+          CMSampleBufferGetSampleAttachmentsArray(sbuf, true), 0));
+
+  // If the NotSync key is not present, it implies Sync, which indicates a
+  // keyframe (the VT documentation is sparse on this point). Could
+  // alternatively use kCMSampleAttachmentKey_DependsOnOthers == false, as
+  // sketched after this function.
+  bool keyframe =
+      CFDictionaryContainsKey(sample_attachments,
+                              kCMSampleAttachmentKey_NotSync) == false;
+
+  // Generate a frame id and update the last keyframe id if needed.
+  // NOTE: VideoToolbox calls the output callback serially, so this is safe.
+  uint32 frame_id = ++encoder->frame_id_;
+  if (keyframe) {
+    encoder->last_keyframe_id_ = frame_id;
+  }
+
+  CMSampleTimingInfo timing_info;
+  CMSampleBufferGetSampleTimingInfo(sbuf, 0, &timing_info);
+  DVLOG(3) << __func__ << ", timing info: " << timing_info
+           << ", keyframe: " << keyframe << ", frame id: " << frame_id;
+
+  scoped_ptr<EncodedFrame> encoded_frame(new EncodedFrame());
+  encoded_frame->frame_id = frame_id;
+  encoded_frame->reference_time = fc->capture_time;
+  encoded_frame->rtp_timestamp = GetVideoRtpTimestamp(fc->capture_time);
+  if (keyframe) {
+    encoded_frame->dependency = EncodedFrame::KEY;
+    encoded_frame->referenced_frame_id = frame_id;
+  } else {
+    encoded_frame->dependency = EncodedFrame::DEPENDENT;
+    // NOTE: Technically wrong, but without parsing the NALs our best guess is
+    // the last keyframe.
+    encoded_frame->referenced_frame_id = encoder->last_keyframe_id_;
+  }
+
+  CopySampleBufferToAnnexBBuffer(sbuf, &encoded_frame->data, keyframe);
+
+  encoder->cast_environment_->PostTask(
+      CastEnvironment::MAIN,
+      FROM_HERE,
+      base::Bind(fc->frame_encoded_callback, base::Passed(&encoded_frame)));
+}
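
The alternative keyframe test mentioned above, using
kCMSampleAttachmentKey_DependsOnOthers, would look roughly like this (a
sketch; the helper name is illustrative, not part of this patch):

    static bool IsKeyFrameByDependency(CFDictionaryRef sample_attachments) {
      // A sample that depends on no other samples is decodable on its own,
      // which is what a keyframe means here. A missing key is treated the
      // same as kCFBooleanFalse.
      CFBooleanRef depends = static_cast<CFBooleanRef>(CFDictionaryGetValue(
          sample_attachments, kCMSampleAttachmentKey_DependsOnOthers));
      return !depends || !CFBooleanGetValue(depends);
    }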
+
+template <typename NalSizeType>
+static void CopyNalsToAnnexB(char* avcc_buffer,
+                             const size_t avcc_size,
+                             std::string* annexb_buffer) {
+  static_assert(sizeof(NalSizeType) == 1 || sizeof(NalSizeType) == 2 ||
+                sizeof(NalSizeType) == 4,
+                "NAL size type has unsupported size");
+  static const char startcode_3[3] = {0, 0, 1};
+  DCHECK(avcc_buffer);
+  DCHECK(annexb_buffer);
+  size_t bytes_left = avcc_size;
+  while (bytes_left > 0) {
+    DCHECK_GT(bytes_left, sizeof(NalSizeType));
+    NalSizeType nal_size;
+    base::ReadBigEndian(avcc_buffer, &nal_size);
+    bytes_left -= sizeof(NalSizeType);
+    avcc_buffer += sizeof(NalSizeType);
+
+    DCHECK_GE(bytes_left, nal_size);
+    annexb_buffer->append(startcode_3, sizeof(startcode_3));
+    annexb_buffer->append(avcc_buffer, nal_size);
+    bytes_left -= nal_size;
+    avcc_buffer += nal_size;
+  }
+}
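
To make the AVCC-to-Annex-B rewrite concrete, here is a standalone round-trip
over a two-NAL buffer with 4-byte length headers (the big-endian read is
hand-rolled in place of base::ReadBigEndian, and all byte values are made
up):

    #include <cassert>
    #include <cstdint>
    #include <string>

    int main() {
      // Two NALs in AVCC form: a 2-byte NAL {0x65, 0xAA} and a 1-byte NAL
      // {0x41}, each preceded by a 4-byte big-endian length field.
      const char avcc[] = {0, 0, 0, 2, 0x65, '\xAA', 0, 0, 0, 1, 0x41};
      std::string annexb;
      size_t i = 0;
      while (i < sizeof(avcc)) {
        // Hand-rolled stand-in for base::ReadBigEndian<uint32_t>.
        uint32_t nal_size = 0;
        for (int b = 0; b < 4; ++b)
          nal_size = (nal_size << 8) | static_cast<uint8_t>(avcc[i++]);
        annexb.append("\x00\x00\x01", 3);  // 3-byte Annex B start code.
        annexb.append(&avcc[i], nal_size);
        i += nal_size;
      }
      // Expected output: 00 00 01 65 AA 00 00 01 41.
      assert(annexb.size() == 9);
      assert(static_cast<uint8_t>(annexb[3]) == 0x65);
      assert(static_cast<uint8_t>(annexb[8]) == 0x41);
      return 0;
    }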
+
+void H264VideoToolboxEncoder::CopySampleBufferToAnnexBBuffer(
+    CMSampleBufferRef sbuf,
+    std::string* annexb_buffer,
+    bool keyframe) {
+  // Perform two passes: one to figure out the total output size, and another
+  // to copy the data after having performed a single output allocation. Note
+  // that we'll allocate a bit more because we'll count 4 bytes instead of 3
+  // for video NALs.
+
+  // TODO(jfroy): There is a bug in
+  // CMVideoFormatDescriptionGetH264ParameterSetAtIndex; iterate until it
+  // fails instead of relying on the reported parameter set count.
+
+  OSStatus status;
+
+  // Get the sample buffer's block buffer and format description.
+  CMBlockBufferRef bb = CMSampleBufferGetDataBuffer(sbuf);
+  DCHECK(bb);
+  CMFormatDescriptionRef fdesc = CMSampleBufferGetFormatDescription(sbuf);
+  DCHECK(fdesc);
+
+  size_t bb_size = CMBlockBufferGetDataLength(bb);
+  size_t total_bytes = bb_size;
+
+  size_t pset_count;
+  int nal_size_field_bytes;
+  status = CMVideoFormatDescriptionGetH264ParameterSetAtIndex(
+      fdesc, 0, nullptr, nullptr, &pset_count, &nal_size_field_bytes);
+  if (status == kCMFormatDescriptionBridgeError_InvalidParameter) {
+    DLOG(WARNING) << __func__ << " assuming 2 parameter sets and 4 bytes NAL "
+                                 "length header";
+    pset_count = 2;
+    nal_size_field_bytes = 4;
+  } else if (status != noErr) {
+    DLOG(ERROR)
+        << __func__
+        << " CMVideoFormatDescriptionGetH264ParameterSetAtIndex failed: "
+        << status;
+    return;
+  }
+
+  if (keyframe) {
+    const uint8_t* pset;
+    size_t pset_size;
+    for (size_t pset_i = 0; pset_i < pset_count; ++pset_i) {
+      status = CMVideoFormatDescriptionGetH264ParameterSetAtIndex(
+          fdesc, pset_i, &pset, &pset_size, nullptr, nullptr);
+      if (status != noErr) {
+        DLOG(ERROR)
+            << __func__
+            << " CMVideoFormatDescriptionGetH264ParameterSetAtIndex failed: "
+            << status;
+        return;
+      }
+      total_bytes += pset_size + nal_size_field_bytes;
+    }
+  }
+
+  annexb_buffer->reserve(total_bytes);
+
+  // Copy all parameter sets before keyframes.
+  if (keyframe) {
+    const uint8_t* pset;
+    size_t pset_size;
+    for (size_t pset_i = 0; pset_i < pset_count; ++pset_i) {
+      status = CMVideoFormatDescriptionGetH264ParameterSetAtIndex(
+          fdesc, pset_i, &pset, &pset_size, nullptr, nullptr);
+      if (status != noErr) {
+        DLOG(ERROR)
+            << __func__
+            << " CMVideoFormatDescriptionGetH264ParameterSetAtIndex failed: "
+            << status;
+        return;
+      }
+      static const char startcode_4[4] = {0, 0, 0, 1};
+      annexb_buffer->append(startcode_4, sizeof(startcode_4));
+      annexb_buffer->append(reinterpret_cast<const char*>(pset), pset_size);
+    }
+  }
+
+  // Block buffers can be composed of non-contiguous chunks. For the sake of
+  // keeping this code simple, flatten non-contiguous block buffers.
+  base::ScopedCFTypeRef<CMBlockBufferRef> contiguous_bb(
+      bb, base::scoped_policy::RETAIN);
+  if (!CMBlockBufferIsRangeContiguous(bb, 0, 0)) {
+    DVLOG(3) << __func__ << " copying block buffer to contiguous buffer";
+    contiguous_bb.reset();
+    status = CMBlockBufferCreateContiguous(kCFAllocatorDefault,
+                                           bb,
+                                           kCFAllocatorDefault,
+                                           nullptr,
+                                           0,
+                                           0,
+                                           0,
+                                           contiguous_bb.InitializeInto());
+    if (status != noErr) {
+      DLOG(ERROR) << __func__
+                  << " CMBlockBufferCreateContiguous failed: " << status;
+      return;
+    }
+  }
+
+  // Copy all the NAL units. In the process convert them from AVCC format
+  // (length header) to AnnexB format (start code).
+  char* bb_data;
+  status =
+      CMBlockBufferGetDataPointer(contiguous_bb, 0, nullptr, nullptr, &bb_data);
+  if (status != noErr) {
+    DLOG(ERROR) << __func__
+                << " CMBlockBufferGetDataPointer failed: " << status;
+    return;
+  }
+
+  if (nal_size_field_bytes == 1) {
+    CopyNalsToAnnexB<uint8_t>(bb_data, bb_size, annexb_buffer);
+  } else if (nal_size_field_bytes == 2) {
+    CopyNalsToAnnexB<uint16_t>(bb_data, bb_size, annexb_buffer);
+  } else if (nal_size_field_bytes == 4) {
+    CopyNalsToAnnexB<uint32_t>(bb_data, bb_size, annexb_buffer);
+  }
+}
+
+}  // namespace cast
+}  // namespace media