Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(706)

Unified Diff: media/cast/sender/h264_vt_encoder.cc

Issue 450693006: VideoToolbox encoder for cast senders. (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master
Patch Set: Fix lint and formatting issues. Created 6 years, 4 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
« no previous file with comments | « media/cast/sender/h264_vt_encoder.h ('k') | no next file » | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
Index: media/cast/sender/h264_vt_encoder.cc
diff --git a/media/cast/sender/h264_vt_encoder.cc b/media/cast/sender/h264_vt_encoder.cc
new file mode 100644
index 0000000000000000000000000000000000000000..190de2c6249db2b89b2a3264c9edf67ce091f0d5
--- /dev/null
+++ b/media/cast/sender/h264_vt_encoder.cc
@@ -0,0 +1,813 @@
+// Copyright 2014 The Chromium Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style license that can be
+// found in the LICENSE file.
+
+#include "media/cast/sender/h264_vt_encoder.h"
+
+#include <algorithm>
+#include <vector>
+
+#include "base/big_endian.h"
+#include "base/bind.h"
+#include "base/bind_helpers.h"
+#include "base/location.h"
+#include "base/logging.h"
+
+namespace media {
+namespace cast {
+
+static const char* GetCVErrorString(CVReturn error) {
+ switch (error) {
+ case kCVReturnSuccess:
+ return "success";
+ case kCVReturnError:
+ return "error";
+ case kCVReturnInvalidArgument:
+ return "invalid argument";
+ case kCVReturnAllocationFailed:
+ return "allocation failed";
+ case kCVReturnInvalidDisplay:
+ return "invalid display";
+ case kCVReturnDisplayLinkAlreadyRunning:
+ return "display link already running";
+ case kCVReturnDisplayLinkNotRunning:
+ return "display link not running";
+ case kCVReturnDisplayLinkCallbacksNotSet:
+ return "display link callback not set";
+ case kCVReturnInvalidPixelFormat:
+ return "invalid pixel format";
+ case kCVReturnInvalidSize:
+ return "invalid size";
+ case kCVReturnInvalidPixelBufferAttributes:
+ return "invalid pixel buffer attributes";
+ case kCVReturnPixelBufferNotOpenGLCompatible:
+ return "pixel buffer not OpenGL compatible";
+ case kCVReturnWouldExceedAllocationThreshold:
+ return "would exceed allocation threshold";
+ case kCVReturnPoolAllocationFailed:
+ return "pool allocation failed";
+ case kCVReturnInvalidPoolAttributes:
+ return "invalid pool attributes";
+ default:
+ return "unknown error";
+ }
+}
+
+static const char* GetVTErrorString(OSStatus error) {
+ switch (error) {
+ case kVTPropertyNotSupportedErr:
+ return "property not supported";
+ case kVTPropertyReadOnlyErr:
+ return "read only property";
+ case kVTParameterErr:
+ return "invalid parameter";
+ case kVTInvalidSessionErr:
+ return "invalid session";
+ case kVTAllocationFailedErr:
+ return "allocation failed";
+ case kVTPixelTransferNotSupportedErr:
+ return "pixel transfer not supported";
+ case kVTCouldNotFindVideoDecoderErr:
+ return "could not find video decoder";
+ case kVTCouldNotCreateInstanceErr:
+ return "could not create instance";
+ case kVTCouldNotFindVideoEncoderErr:
+ return "could not find video encoder";
+ case kVTVideoDecoderBadDataErr:
+ return "video decoder bad data";
+ case kVTVideoDecoderUnsupportedDataFormatErr:
+ return "video decoder unsupported data format";
+ case kVTVideoDecoderMalfunctionErr:
+ return "video decoder malfunction";
+ case kVTVideoEncoderMalfunctionErr:
+ return "video encoder malfunction";
+ case kVTVideoDecoderNotAvailableNowErr:
+ return "video decoder not available";
+ case kVTImageRotationNotSupportedErr:
+ return "image rotation not supported";
+ case kVTVideoEncoderNotAvailableNowErr:
+ return "video encoder not available now";
+ case kVTFormatDescriptionChangeNotSupportedErr:
+ return "format description change not supported";
+ case kVTInsufficientSourceColorDataErr:
+ return "insufficient source color data";
+ case kVTCouldNotCreateColorCorrectionDataErr:
+ return "could not create color correction data";
+ case kVTColorSyncTransformConvertFailedErr:
+ return "ColorSync transform convert failed";
+ case kVTVideoDecoderAuthorizationErr:
+ return "video decoder authorization error";
+ case kVTVideoEncoderAuthorizationErr:
+ return "video encoder authorization error";
+ case kVTColorCorrectionPixelTransferFailedErr:
+ return "color correction pixel transfer failed";
+ case kVTMultiPassStorageIdentifierMismatchErr:
+ return "multi-pass storage identifier mismatch";
+ case kVTMultiPassStorageInvalidErr:
+ return "invalid multi-pass storage";
+ case kVTFrameSiloInvalidTimeStampErr:
+ return "invalid frame silo timestamp";
+ case kVTFrameSiloInvalidTimeRangeErr:
+ return "invalid frame silo time range";
+ case kVTCouldNotFindTemporalFilterErr:
+ return "could not find temporal filter";
+ case kVTPixelTransferNotPermittedErr:
+ return "pixel transfer not permitted";
+ default:
+ return "unknown error";
+ }
+}
+
+#pragma mark -
Robert Sesek 2014/08/07 22:49:23 Chrome doesn't typically do this.
jfroy 2014/08/07 23:06:11 Acknowledged.
+
+// utility to log CFTypes
+
+std::ostream& operator<<(std::ostream& out, const CFStringRef& cfstring) {
Robert Sesek 2014/08/07 22:49:22 All these osteram functions are just to support DL
jfroy 2014/08/07 23:06:11 Acknowledged.
+ if (!cfstring) {
+ return out << "null";
+ }
+
+ const char* c_str;
+ c_str = CFStringGetCStringPtr(cfstring, kCFStringEncodingASCII);
+ if (c_str) {
+ return out << c_str;
+ }
+ c_str = CFStringGetCStringPtr(cfstring, kCFStringEncodingUTF8);
+ if (c_str) {
+ return out << c_str;
+ }
+
+ CFIndex length = CFStringGetLength(cfstring);
+ size_t size =
+ CFStringGetMaximumSizeForEncoding(length, kCFStringEncodingUTF8) + 1;
+ std::vector<char> c_str_buf;
+ c_str_buf.reserve(size);
+ CFStringGetCString(cfstring, c_str_buf.data(), size, kCFStringEncodingUTF8);
+ return out << c_str_buf.data();
+}
+
+std::ostream& operator<<(std::ostream& out, const CFNumberRef& cfnumber) {
+ if (!cfnumber) {
+ return out << "null";
+ }
+
+ base::ScopedCFTypeRef<CFNumberFormatterRef> formatter(CFNumberFormatterCreate(
+ kCFAllocatorDefault, CFLocaleGetSystem(), kCFNumberFormatterNoStyle));
+ base::ScopedCFTypeRef<CFStringRef> as_str(
+ CFNumberFormatterCreateStringWithNumber(
+ kCFAllocatorDefault, formatter, cfnumber));
+ return out << as_str;
+}
+
+std::ostream& operator<<(std::ostream& out, const CFBooleanRef& cfboolean) {
+ if (!cfboolean) {
+ return out << "null";
+ }
+
+ base::ScopedCFTypeRef<CFStringRef> as_str(
+ CFBooleanGetValue(cfboolean) ? CFSTR("true") : CFSTR("false"));
+ return out << as_str;
+}
+
+struct CFTypeEmittable {
+ explicit CFTypeEmittable(CFTypeRef cfobject) : cfobject_(cfobject) {}
+ explicit operator bool() const { return cfobject_ != nullptr; }
+ operator CFTypeRef() const { return cfobject_; }
+ CFTypeRef get() const { return cfobject_; }
+ friend std::ostream& operator<<(std::ostream&, const CFTypeEmittable&);
+ CFTypeRef cfobject_;
+};
+
+std::ostream& operator<<(std::ostream& out, const CFTypeEmittable& emittable) {
+ if (!emittable) {
+ return out << "null";
+ }
+
+ if (CFGetTypeID(emittable) == CFStringGetTypeID()) {
+ return out << static_cast<CFStringRef>(emittable.get());
+ } else if (CFGetTypeID(emittable) == CFNumberGetTypeID()) {
+ return out << static_cast<CFNumberRef>(emittable.get());
+ } else if (CFGetTypeID(emittable) == CFBooleanGetTypeID()) {
+ return out << static_cast<CFBooleanRef>(emittable.get());
+ }
+ base::ScopedCFTypeRef<CFStringRef> as_str(CFCopyDescription(emittable));
+ return out << as_str;
+}
+
+std::ostream& operator<<(std::ostream& out, const CMTime& time) {
+ return out << "{value=" << time.value << ", timescale=" << time.timescale
+ << ", flags=" << time.flags << ", epoch=" << time.epoch << "}";
+}
+
+std::ostream& operator<<(std::ostream& out,
+ const CMSampleTimingInfo& timing_info) {
+ return out << "{duration=" << timing_info.duration
+ << ", pts=" << timing_info.presentationTimeStamp
+ << ", dts=" << timing_info.decodeTimeStamp << "}";
+}
+
+#pragma mark -
+
+template <typename T>
+bool SetSessionProperty(VTSessionRef session,
Robert Sesek 2014/08/07 22:49:22 Is this really templatized for just logging purpos
jfroy 2014/08/07 23:06:11 Mostly yes, but it's also nice to have setters wit
+ CFStringRef key,
+ T value,
+ CFTypeRef cfvalue) {
+ DVLOG(3) << __func__ << ": " << key << "=" << value;
+ OSStatus status = VTSessionSetProperty(session, key, cfvalue);
+ if (status != noErr) {
+ DLOG(ERROR) << __func__
+ << " VTSessionSetProperty failed: " << GetVTErrorString(status)
+ << " (" << status << ") " << key << "=" << value;
+ }
+ return status == noErr;
+}
+
+static bool SetSessionProperty(VTSessionRef session,
+ CFStringRef key,
+ uint32_t value) {
+ base::ScopedCFTypeRef<CFNumberRef> cfvalue(
+ CFNumberCreate(nullptr, kCFNumberSInt32Type, &value));
+ return SetSessionProperty(session, key, value, cfvalue);
+}
+
+static bool SetSessionProperty(VTSessionRef session,
+ CFStringRef key,
+ bool value) {
+ CFBooleanRef cfvalue = (value) ? kCFBooleanTrue : kCFBooleanFalse;
+ return SetSessionProperty(session, key, value, cfvalue);
+}
+
+static bool SetSessionProperty(VTSessionRef session,
+ CFStringRef key,
+ CFStringRef value) {
+ return SetSessionProperty(session, key, value, value);
+}
+
+static base::ScopedCFTypeRef<CFDictionaryRef> DictionaryWithKeyValue(
+ CFTypeRef key,
+ CFTypeRef value) {
+ CFTypeRef keys[1] = {key};
+ CFTypeRef values[1] = {value};
+ return base::ScopedCFTypeRef<CFDictionaryRef>(
+ CFDictionaryCreate(kCFAllocatorDefault,
+ keys,
+ values,
+ 1,
+ &kCFTypeDictionaryKeyCallBacks,
+ &kCFTypeDictionaryValueCallBacks));
+}
+
+#pragma mark -
+
+struct H264VideoToolboxEncoder::FrameContext {
+ base::TimeTicks capture_time;
+ FrameEncodedCallback frame_encoded_callback;
+};
+
+H264VideoToolboxEncoder::H264VideoToolboxEncoder(
+ scoped_refptr<CastEnvironment> cast_environment,
+ const VideoSenderConfig& video_config)
+ : cast_environment_(cast_environment),
+ cast_config_(video_config),
+ frame_id_(kStartFrameId),
+ last_keyframe_id_(kStartFrameId),
+ encode_next_frame_as_keyframe_(false) {
+ Initialize();
Robert Sesek 2014/08/07 22:49:23 You only call this here, so why is it a separate m
jfroy 2014/08/07 23:06:11 The current code doesn't do it, but I have a suspi
+}
+
+H264VideoToolboxEncoder::~H264VideoToolboxEncoder() {
+ Teardown();
Robert Sesek 2014/08/07 22:49:22 Same.
jfroy 2014/08/07 23:06:11 See my reply above.
+}
+
+CVPixelBufferPoolRef H264VideoToolboxEncoder::cv_pixel_buffer_pool() const {
+ DCHECK(thread_checker_.CalledOnValidThread());
+ DCHECK(compression_session_);
+ return VTCompressionSessionGetPixelBufferPool(compression_session_);
+}
+
+void H264VideoToolboxEncoder::Initialize() {
+ DCHECK(thread_checker_.CalledOnValidThread());
+ DCHECK(!compression_session_);
+
+ DVLOG(3) << __func__ << " width: " << cast_config_.width
+ << ", height: " << cast_config_.height
+ << ", start_bitrate: " << cast_config_.start_bitrate
+ << ", max_frame_rate:" << cast_config_.max_frame_rate;
+
+ // Note that the encoder object is given to the compression session as the
+ // callback context using a raw pointer. The C API does not allow us to use
+ // a smart pointer, nor is this encoder ref counted. However, this is still
+ // safe, because we 1) we own the compression session and 2) we tear it down
+ // safely. When destructing the encoder, the compression session is flushed
+ // and invalidated. Internally, VideoToolbox will join all of its threads
+ // before returning to the client. Therefore, when control returns to us, we
+ // are guaranteed that the output callback will not execute again.
+
+ // On OS X, allow the hardware encoder. Don't require it, it does not support
+ // all configurations (some of which are used for testing).
+ DictionaryPtr encoder_spec(nullptr);
+#if !defined(OS_IOS)
+ encoder_spec = DictionaryWithKeyValue(
+ kVTVideoEncoderSpecification_EnableHardwareAcceleratedVideoEncoder,
+ kCFBooleanTrue);
+#endif
+
+ VTCompressionSessionRef session;
+ OSStatus status =
+ VTCompressionSessionCreate(kCFAllocatorDefault,
+ cast_config_.width,
+ cast_config_.height,
+ kCMVideoCodecType_H264,
+ encoder_spec,
+ nullptr /* sourceImageBufferAttributes */,
+ nullptr /* compressedDataAllocator */,
+ CompressionCallback,
+ reinterpret_cast<void*>(this),
+ &session);
+ if (status != noErr) {
+ DLOG(ERROR) << __func__ << " VTCompressionSessionCreate failed: "
+ << GetVTErrorString(status) << " (" << status << ")";
+ return;
+ }
+ compression_session_.reset(session);
+
+#if defined(OS_IOS)
+ using_hardware_ = true;
+#else
+ CFBooleanRef using_hardware_cf = nullptr;
+ status = VTSessionCopyProperty(
+ session,
+ kVTCompressionPropertyKey_UsingHardwareAcceleratedVideoEncoder,
+ kCFAllocatorDefault,
+ &using_hardware_cf);
+ if (status == noErr) {
+ using_hardware_ = CFBooleanGetValue(using_hardware_cf);
+ CFRelease(using_hardware_cf);
+ }
+ DVLOG(3) << __func__ << " using hardware: " << using_hardware_;
+#endif
+
+ ConfigureSession();
+}
+
+static void SetConfigurationApplier(CFStringRef key,
+ CFTypeRef value,
+ VTCompressionSessionRef session) {
+ SetSessionProperty(session, key, CFTypeEmittable(value), value);
+}
+
+void H264VideoToolboxEncoder::ConfigureSession() {
+ SetSessionProperty(compression_session_,
+ kVTCompressionPropertyKey_ProfileLevel,
+ kVTProfileLevel_H264_Main_AutoLevel);
+
+ SetSessionProperty(
+ compression_session_, kVTCompressionPropertyKey_RealTime, true);
+ SetSessionProperty(compression_session_,
+ kVTCompressionPropertyKey_AllowFrameReordering,
+ false);
+ SetSessionProperty(compression_session_,
+ kVTCompressionPropertyKey_MaxKeyFrameInterval,
+ 240u);
+ SetSessionProperty(compression_session_,
+ kVTCompressionPropertyKey_MaxKeyFrameIntervalDuration,
+ 240u);
+
+ SetSessionProperty(compression_session_,
+ kVTCompressionPropertyKey_AverageBitRate,
+ static_cast<uint32_t>(cast_config_.start_bitrate));
+
+ SetSessionProperty(compression_session_,
+ kVTCompressionPropertyKey_ExpectedFrameRate,
+ static_cast<uint32_t>(cast_config_.max_frame_rate));
+
+ SetSessionProperty(compression_session_,
+ kVTCompressionPropertyKey_ColorPrimaries,
+ kCVImageBufferColorPrimaries_ITU_R_709_2);
+ SetSessionProperty(compression_session_,
+ kVTCompressionPropertyKey_TransferFunction,
+ kCVImageBufferTransferFunction_ITU_R_709_2);
+ SetSessionProperty(compression_session_,
+ kVTCompressionPropertyKey_YCbCrMatrix,
+ kCVImageBufferYCbCrMatrix_ITU_R_709_2);
+
+ if (compression_properties_) {
+ CFDictionaryApplyFunction(
+ compression_properties_,
+ reinterpret_cast<CFDictionaryApplierFunction>(SetConfigurationApplier),
+ compression_session_.get());
+ }
+}
+
+void H264VideoToolboxEncoder::Teardown() {
+ DCHECK(thread_checker_.CalledOnValidThread());
+
+ // If the compression session exists, invalidate it. This blocks until all
+ // pending output callbacks have returned and any internal threads have
+ // joined, ensuring no output callback ever sees a dangling encoder pointer.
+ if (compression_session_) {
+ VTCompressionSessionInvalidate(compression_session_);
+ compression_session_.reset();
+ }
+}
+
+#pragma mark -
+
+bool H264VideoToolboxEncoder::EncodeVideoFrame(
+ const scoped_refptr<media::VideoFrame>& video_frame,
+ const base::TimeTicks& capture_time,
+ const FrameEncodedCallback& frame_encoded_callback) {
+ DCHECK(thread_checker_.CalledOnValidThread());
+
+ if (!compression_session_) {
+ DLOG(ERROR) << __func__ << " compression session is null";
+ return false;
+ }
+
+ PixelBufferPtr pixel_buffer(video_frame->cv_pixel_buffer(),
+ base::scoped_policy::RETAIN);
+ if (!pixel_buffer) {
+ pixel_buffer = WrapVideoFrame(*video_frame);
+ if (!pixel_buffer) {
+ return false;
+ }
+ }
+
+ CMTime timestamp_cm;
+ if (capture_time.is_null()) {
+ timestamp_cm = kCMTimeInvalid;
+ } else {
+ timestamp_cm = CMTimeMake(capture_time.ToInternalValue(), USEC_PER_SEC);
+ }
+
+ FrameContext* fc = new FrameContext();
+ fc->capture_time = capture_time;
+ fc->frame_encoded_callback = frame_encoded_callback;
+
+ DVLOG(3) << __func__ << " pts: " << timestamp_cm;
+
+ DictionaryPtr frame_props(nullptr);
+ if (encode_next_frame_as_keyframe_) {
+ frame_props = DictionaryWithKeyValue(kVTEncodeFrameOptionKey_ForceKeyFrame,
+ kCFBooleanTrue);
+ encode_next_frame_as_keyframe_ = false;
+ }
+
+ VTEncodeInfoFlags info;
+ OSStatus status = VTCompressionSessionEncodeFrame(compression_session_,
+ pixel_buffer,
+ timestamp_cm,
+ kCMTimeInvalid,
+ frame_props,
+ reinterpret_cast<void*>(fc),
+ &info);
+ if (status != noErr) {
+ DLOG(ERROR) << __func__ << " VTCompressionSessionEncodeFrame failed: "
+ << GetVTErrorString(status) << " (" << status << ")";
+ return false;
+ }
+ if ((info & kVTEncodeInfo_FrameDropped)) {
+ DLOG(ERROR) << __func__ << " frame dropped";
+ return false;
+ }
+
+ return true;
+}
+
+void H264VideoToolboxEncoder::SetBitRate(int new_bit_rate) {
+ DCHECK(thread_checker_.CalledOnValidThread());
+ // NOTE: VideoToolbox does not seem to support bitrate reconfiguration.
+}
+
+void H264VideoToolboxEncoder::GenerateKeyFrame() {
+ DCHECK(thread_checker_.CalledOnValidThread());
+ DCHECK(compression_session_);
+
+ encode_next_frame_as_keyframe_ = true;
+}
+
+void H264VideoToolboxEncoder::LatestFrameIdToReference(uint32 /*frame_id*/) {
+}
+
+#pragma mark -
+
+static void VideoFramePixelBufferReleaseCallback(void* frame_ref,
+ const void* data,
+ size_t size,
+ size_t num_planes,
+ const void* planes[]) {
+ free(const_cast<void*>(data));
+ reinterpret_cast<media::VideoFrame*>(frame_ref)->Release();
+}
+
+H264VideoToolboxEncoder::PixelBufferPtr H264VideoToolboxEncoder::WrapVideoFrame(
+ const scoped_refptr<media::VideoFrame>& frame) {
+ static const size_t MAX_PLANES = 3;
+
+ media::VideoFrame::Format format = frame->format();
+ size_t num_planes = media::VideoFrame::NumPlanes(format);
+ gfx::Size coded_size = frame->coded_size();
+
+ // media::VideoFrame only supports YUV formats, so there is no way to
+ // leverage VideoToolbox's ability to convert RGBA formats automatically. In
+ // addition, most of the media::VideoFrame formats are YVU, which VT does not
+ // support. Finally, media::VideoFrame formats do not carry any information
+ // about the color space, transform or any other colorimetric information
+ // that is generally needed to fully specify the input data. So essentially
+ // require that the input be YCbCr 4:2:0 (either planar or biplanar) and
+ // assume the standard video dynamic range for samples (although most modern
+ // HDTVs support full-range video these days).
+ OSType pixel_format;
+ if (format == media::VideoFrame::Format::I420) {
+ pixel_format = kCVPixelFormatType_420YpCbCr8Planar;
+ } else if (format == media::VideoFrame::Format::NV12) {
+ pixel_format = kCVPixelFormatType_420YpCbCr8BiPlanarVideoRange;
+ } else {
+ DLOG(ERROR) << __func__ << " unsupported frame format: " << format;
+ return PixelBufferPtr(nullptr);
+ }
+
+ // TODO(jfroy): Support extended pixels (i.e. padding).
+ if (frame->coded_size() != frame->visible_rect().size()) {
+ DLOG(ERROR) << __func__ << " frame with extended pixels not supported: "
+ << " coded_size: " << coded_size.ToString()
+ << ", visible_rect: " << frame->visible_rect().ToString();
+ return PixelBufferPtr(nullptr);
+ }
+
+ DCHECK(media::VideoFrame::NumPlanes(format) <= MAX_PLANES);
+ void* plane_ptrs[MAX_PLANES];
+ size_t plane_widths[MAX_PLANES];
+ size_t plane_heights[MAX_PLANES];
+ size_t plane_bytes_per_row[MAX_PLANES];
+ for (size_t plane_i = 0; plane_i < num_planes; ++plane_i) {
+ plane_ptrs[plane_i] = frame->data(plane_i);
+ gfx::Size plane_size =
+ media::VideoFrame::PlaneSize(format, plane_i, coded_size);
+ plane_widths[plane_i] = plane_size.width();
+ plane_heights[plane_i] = plane_size.height();
+ plane_bytes_per_row[plane_i] = frame->stride(plane_i);
+ }
+
+ // CVPixelBufferCreateWithPlanarBytes needs a dummy plane descriptor or the
+ // release callback will not execute. The descriptor is freed in the callback.
+ void* descriptor =
+ calloc(1,
+ std::max(sizeof(CVPlanarPixelBufferInfo_YCbCrPlanar),
+ sizeof(CVPlanarPixelBufferInfo_YCbCrBiPlanar)));
+
+ // Wrap the frame's data in a CVPixelBuffer. Because this is a C API, we can't
+ // give it a smart pointer to the frame, so instead pass a raw pointer and
+ // increment the frame's reference count manually.
+ CVPixelBufferRef pixel_buffer;
+ CVReturn result =
+ CVPixelBufferCreateWithPlanarBytes(kCFAllocatorDefault,
+ coded_size.width(),
+ coded_size.height(),
+ format,
+ &descriptor,
+ 0,
+ num_planes,
+ plane_ptrs,
+ plane_widths,
+ plane_heights,
+ plane_bytes_per_row,
+ VideoFramePixelBufferReleaseCallback,
+ frame.get(),
+ nullptr,
+ &pixel_buffer);
+ if (result != kCVReturnSuccess) {
+ DLOG(ERROR) << __func__ << " CVPixelBufferCreateWithPlanarBytes failed: "
+ << GetCVErrorString(result) << " (" << result << ")";
+ return PixelBufferPtr(nullptr);
+ }
+
+ // The CVPixelBuffer now references the data of the frame, so increment its
+ // reference count manually. The release callback set on the pixel buffer will
+ // release the frame.
+ frame.AddRef();
+
+ return PixelBufferPtr(pixel_buffer);
+}
+
+#pragma mark -
+
+void H264VideoToolboxEncoder::CompressionCallback(void* encoder_opaque,
+ void* frame_opaque,
+ OSStatus status,
+ VTEncodeInfoFlags info,
+ CMSampleBufferRef sbuf) {
+ H264VideoToolboxEncoder* encoder =
+ reinterpret_cast<H264VideoToolboxEncoder*>(encoder_opaque);
+ scoped_ptr<FrameContext> fc(reinterpret_cast<FrameContext*>(frame_opaque));
+
+ if (status != noErr) {
+ DLOG(ERROR) << __func__ << " encoding failed: " << GetVTErrorString(status)
+ << " (" << status << ")";
+ return;
+ }
+ if ((info & kVTEncodeInfo_FrameDropped)) {
+ DVLOG(2) << __func__ << " frame dropped";
+ return;
+ }
+ CMItemCount sample_count = CMSampleBufferGetNumSamples(sbuf);
+ if (sample_count > 1) {
+ DLOG(ERROR) << __func__
+ << " more than one sample in sample buffer: " << sample_count;
+ return;
+ }
+
+ CFDictionaryRef sample_attachments =
+ static_cast<CFDictionaryRef>(CFArrayGetValueAtIndex(
+ CMSampleBufferGetSampleAttachmentsArray(sbuf, true), 0));
+
+ // If the NotSync key is not present, it implies Sync, which indicates a
+ // keyframe (at least I think, VT documentation is, erm, sparse). Could
+ // alternatively use kCMSampleAttachmentKey_DependsOnOthers == false.
+ bool keyframe =
+ CFDictionaryContainsKey(sample_attachments,
+ kCMSampleAttachmentKey_NotSync) == false;
+
+ // Generate a frame id and update the last keyframe id if needed.
+ // NOTE: VideoToolbox calls the output callback serially, so this is safe.
+ uint32 frame_id = ++encoder->frame_id_;
+ if (keyframe) {
+ encoder->last_keyframe_id_ = frame_id;
+ }
+
+ CMSampleTimingInfo timing_info;
+ CMSampleBufferGetSampleTimingInfo(sbuf, 0, &timing_info);
+ DVLOG(3) << __func__ << ", timing info: " << timing_info
+ << ", keyframe: " << keyframe << ", frame id: " << frame_id;
+
+ scoped_ptr<EncodedFrame> encoded_frame(new EncodedFrame());
+ encoded_frame->frame_id = frame_id;
+ encoded_frame->reference_time = fc->capture_time;
+ encoded_frame->rtp_timestamp = GetVideoRtpTimestamp(fc->capture_time);
+ if (keyframe) {
+ encoded_frame->dependency = EncodedFrame::KEY;
+ encoded_frame->referenced_frame_id = frame_id;
+ } else {
+ encoded_frame->dependency = EncodedFrame::DEPENDENT;
+ // NOTE: Technically wrong, but without parsing the NALs our best guess is
+ // the last keyframe.
+ encoded_frame->referenced_frame_id = encoder->last_keyframe_id_;
+ }
+
+ CopySampleBufferToAnnexBBuffer(sbuf, &encoded_frame->data, keyframe);
+
+ encoder->cast_environment_->PostTask(
+ CastEnvironment::MAIN,
+ FROM_HERE,
+ base::Bind(fc->frame_encoded_callback, base::Passed(&encoded_frame)));
+}
+
+template <typename NalSizeType>
+static void CopyNalsToAnnexB(char* avcc_buffer,
+ const size_t avcc_size,
+ std::string* annexb_buffer) {
+ static_assert(sizeof(NalSizeType) == 1 || sizeof(NalSizeType) == 2 ||
+ sizeof(NalSizeType) == 4,
+ "NAL size type has unsupported size");
+ static const char startcode_3[3] = {0, 0, 1};
+ DCHECK(avcc_buffer);
+ DCHECK(annexb_buffer);
+ size_t bytes_left = avcc_size;
+ while (bytes_left > 0) {
+ DCHECK(bytes_left > sizeof(NalSizeType));
+ NalSizeType nal_size;
+ base::ReadBigEndian(avcc_buffer, &nal_size);
+ bytes_left -= sizeof(NalSizeType);
+ avcc_buffer += sizeof(NalSizeType);
+
+ DCHECK(bytes_left >= nal_size);
+ annexb_buffer->append(startcode_3, sizeof(startcode_3));
+ annexb_buffer->append(avcc_buffer, nal_size);
+ bytes_left -= nal_size;
+ avcc_buffer += nal_size;
+ }
+}
+
+void H264VideoToolboxEncoder::CopySampleBufferToAnnexBBuffer(
+ CMSampleBufferRef sbuf,
+ std::string* annexb_buffer,
+ bool keyframe) {
+ // Perform two pass, one to figure out the total output size, and another to
+ // copy the data after having performed a single output allocation. Note that
+ // we'll allocate a bit more because we'll count 4 bytes instead of 3 for
+ // video NALs.
+
+ // TODO(jfroy): There is a bug in
+ // CMVideoFormatDescriptionGetH264ParameterSetAtIndex, iterate until fail.
+
+ OSStatus status;
+
+ // Get the sample buffer's block buffer and format description.
+ CMBlockBufferRef bb = CMSampleBufferGetDataBuffer(sbuf);
+ DCHECK(bb);
+ CMFormatDescriptionRef fdesc = CMSampleBufferGetFormatDescription(sbuf);
+ DCHECK(fdesc);
+
+ size_t bb_size = CMBlockBufferGetDataLength(bb);
+ size_t total_bytes = bb_size;
+
+ size_t pset_count;
+ int nal_size_field_bytes;
+ status = CMVideoFormatDescriptionGetH264ParameterSetAtIndex(
+ fdesc, 0, nullptr, nullptr, &pset_count, &nal_size_field_bytes);
+ if (status == kCMFormatDescriptionBridgeError_InvalidParameter) {
+ DLOG(WARNING) << __func__ << " assuming 2 parameter sets and 4 bytes NAL "
+ "length header" pset_count = 2;
+ nal_size_field_bytes = 4;
+ } else if (status != noErr) {
+ DLOG(ERROR)
+ << __func__
+ << " CMVideoFormatDescriptionGetH264ParameterSetAtIndex failed: "
+ << status;
+ return;
+ }
+
+ if (keyframe) {
+ const uint8_t* pset;
+ size_t pset_size;
+ for (size_t pset_i = 0; pset_i < pset_count; ++pset_i) {
+ status = CMVideoFormatDescriptionGetH264ParameterSetAtIndex(
+ fdesc, pset_i, &pset, &pset_size, nullptr, nullptr);
+ if (status != noErr) {
+ DLOG(ERROR)
+ << __func__
+ << " CMVideoFormatDescriptionGetH264ParameterSetAtIndex failed: "
+ << status;
+ return;
+ }
+ total_bytes += pset_size + nal_size_field_bytes;
+ }
+ }
+
+ annexb_buffer->reserve(total_bytes);
+
+ // Copy all parameter sets before keyframes.
+ if (keyframe) {
+ const uint8_t* pset;
+ size_t pset_size;
+ for (size_t pset_i = 0; pset_i < pset_count; ++pset_i) {
+ status = CMVideoFormatDescriptionGetH264ParameterSetAtIndex(
+ fdesc, pset_i, &pset, &pset_size, nullptr, nullptr);
+ if (status != noErr) {
+ DLOG(ERROR)
+ << __func__
+ << " CMVideoFormatDescriptionGetH264ParameterSetAtIndex failed: "
+ << status;
+ return;
+ }
+ static const char startcode_4[4] = {0, 0, 0, 1};
+ annexb_buffer->append(startcode_4, sizeof(startcode_4));
+ annexb_buffer->append(reinterpret_cast<const char*>(pset), pset_size);
+ }
+ }
+
+ // Block buffers can be composed of non-contiguous chunks. For the sake of
+ // keeping this code simple, flatten non-contiguous block buffers.
+ base::ScopedCFTypeRef<CMBlockBufferRef> contiguous_bb(
+ bb, base::scoped_policy::RETAIN);
+ if (!CMBlockBufferIsRangeContiguous(bb, 0, 0)) {
+ DVLOG(3) << __func__ << " copying block buffer to contiguous buffer";
+ contiguous_bb.reset();
+ status = CMBlockBufferCreateContiguous(kCFAllocatorDefault,
+ bb,
+ kCFAllocatorDefault,
+ nullptr,
+ 0,
+ 0,
+ 0,
+ contiguous_bb.InitializeInto());
+ if (status != noErr) {
+ DLOG(ERROR) << __func__
+ << " CMBlockBufferCreateContiguous failed: " << status;
+ return;
+ }
+ }
+
+ // Copy all the NAL units. In the process convert them from AVCC format
+ // (length header) to AnnexB format (start code).
+ char* bb_data;
+ status =
+ CMBlockBufferGetDataPointer(contiguous_bb, 0, nullptr, nullptr, &bb_data);
+ if (status != noErr) {
+ DLOG(ERROR) << __func__
+ << " CMBlockBufferGetDataPointer failed: " << status;
+ return;
+ }
+
+ if (nal_size_field_bytes == 1) {
+ CopyNalsToAnnexB<uint8_t>(bb_data, bb_size, annexb_buffer);
+ } else if (nal_size_field_bytes == 2) {
+ CopyNalsToAnnexB<uint16_t>(bb_data, bb_size, annexb_buffer);
+ } else if (nal_size_field_bytes == 4) {
+ CopyNalsToAnnexB<uint32_t>(bb_data, bb_size, annexb_buffer);
+ }
+}
+
+} // namespace cast
+} // namespace media
« no previous file with comments | « media/cast/sender/h264_vt_encoder.h ('k') | no next file » | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698