Index: media/cast/sender/h264_vt_encoder.cc
diff --git a/media/cast/sender/h264_vt_encoder.cc b/media/cast/sender/h264_vt_encoder.cc
new file mode 100644
index 0000000000000000000000000000000000000000..190de2c6249db2b89b2a3264c9edf67ce091f0d5
--- /dev/null
+++ b/media/cast/sender/h264_vt_encoder.cc
@@ -0,0 +1,813 @@
+// Copyright 2014 The Chromium Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style license that can be
+// found in the LICENSE file.
+
+#include "media/cast/sender/h264_vt_encoder.h"
+
+#include <algorithm>
+#include <ostream>
+#include <string>
+#include <vector>
+
+#include "base/big_endian.h"
+#include "base/bind.h"
+#include "base/bind_helpers.h"
+#include "base/location.h"
+#include "base/logging.h"
+
+namespace media {
+namespace cast {
+
+static const char* GetCVErrorString(CVReturn error) {
+  switch (error) {
+    case kCVReturnSuccess:
+      return "success";
+    case kCVReturnError:
+      return "error";
+    case kCVReturnInvalidArgument:
+      return "invalid argument";
+    case kCVReturnAllocationFailed:
+      return "allocation failed";
+    case kCVReturnInvalidDisplay:
+      return "invalid display";
+    case kCVReturnDisplayLinkAlreadyRunning:
+      return "display link already running";
+    case kCVReturnDisplayLinkNotRunning:
+      return "display link not running";
+    case kCVReturnDisplayLinkCallbacksNotSet:
+      return "display link callback not set";
+    case kCVReturnInvalidPixelFormat:
+      return "invalid pixel format";
+    case kCVReturnInvalidSize:
+      return "invalid size";
+    case kCVReturnInvalidPixelBufferAttributes:
+      return "invalid pixel buffer attributes";
+    case kCVReturnPixelBufferNotOpenGLCompatible:
+      return "pixel buffer not OpenGL compatible";
+    case kCVReturnWouldExceedAllocationThreshold:
+      return "would exceed allocation threshold";
+    case kCVReturnPoolAllocationFailed:
+      return "pool allocation failed";
+    case kCVReturnInvalidPoolAttributes:
+      return "invalid pool attributes";
+    default:
+      return "unknown error";
+  }
+}
+
+static const char* GetVTErrorString(OSStatus error) {
+  switch (error) {
+    case kVTPropertyNotSupportedErr:
+      return "property not supported";
+    case kVTPropertyReadOnlyErr:
+      return "read only property";
+    case kVTParameterErr:
+      return "invalid parameter";
+    case kVTInvalidSessionErr:
+      return "invalid session";
+    case kVTAllocationFailedErr:
+      return "allocation failed";
+    case kVTPixelTransferNotSupportedErr:
+      return "pixel transfer not supported";
+    case kVTCouldNotFindVideoDecoderErr:
+      return "could not find video decoder";
+    case kVTCouldNotCreateInstanceErr:
+      return "could not create instance";
+    case kVTCouldNotFindVideoEncoderErr:
+      return "could not find video encoder";
+    case kVTVideoDecoderBadDataErr:
+      return "video decoder bad data";
+    case kVTVideoDecoderUnsupportedDataFormatErr:
+      return "video decoder unsupported data format";
+    case kVTVideoDecoderMalfunctionErr:
+      return "video decoder malfunction";
+    case kVTVideoEncoderMalfunctionErr:
+      return "video encoder malfunction";
+    case kVTVideoDecoderNotAvailableNowErr:
+      return "video decoder not available";
+    case kVTImageRotationNotSupportedErr:
+      return "image rotation not supported";
+    case kVTVideoEncoderNotAvailableNowErr:
+      return "video encoder not available now";
+    case kVTFormatDescriptionChangeNotSupportedErr:
+      return "format description change not supported";
+    case kVTInsufficientSourceColorDataErr:
+      return "insufficient source color data";
+    case kVTCouldNotCreateColorCorrectionDataErr:
+      return "could not create color correction data";
+    case kVTColorSyncTransformConvertFailedErr:
+      return "ColorSync transform convert failed";
+    case kVTVideoDecoderAuthorizationErr:
+      return "video decoder authorization error";
+    case kVTVideoEncoderAuthorizationErr:
+      return "video encoder authorization error";
+    case kVTColorCorrectionPixelTransferFailedErr:
+      return "color correction pixel transfer failed";
+    case kVTMultiPassStorageIdentifierMismatchErr:
+      return "multi-pass storage identifier mismatch";
+    case kVTMultiPassStorageInvalidErr:
+      return "invalid multi-pass storage";
+    case kVTFrameSiloInvalidTimeStampErr:
+      return "invalid frame silo timestamp";
+    case kVTFrameSiloInvalidTimeRangeErr:
+      return "invalid frame silo time range";
+    case kVTCouldNotFindTemporalFilterErr:
+      return "could not find temporal filter";
+    case kVTPixelTransferNotPermittedErr:
+      return "pixel transfer not permitted";
+    default:
+      return "unknown error";
+  }
+}
+
+#pragma mark -
Robert Sesek
2014/08/07 22:49:23
Chrome doesn't typically do this.
jfroy
2014/08/07 23:06:11
Acknowledged.
+
+// Utility functions to log CFTypes.
+
+std::ostream& operator<<(std::ostream& out, const CFStringRef& cfstring) {
Robert Sesek
2014/08/07 22:49:22
All these ostream functions are just to support DLOG/DVLOG?
jfroy
2014/08/07 23:06:11
Acknowledged.
+  if (!cfstring) {
+    return out << "null";
+  }
+
+  const char* c_str;
+  c_str = CFStringGetCStringPtr(cfstring, kCFStringEncodingASCII);
+  if (c_str) {
+    return out << c_str;
+  }
+  c_str = CFStringGetCStringPtr(cfstring, kCFStringEncodingUTF8);
+  if (c_str) {
+    return out << c_str;
+  }
+
+  CFIndex length = CFStringGetLength(cfstring);
+  size_t size =
+      CFStringGetMaximumSizeForEncoding(length, kCFStringEncodingUTF8) + 1;
+  // Size the buffer up front: CFStringGetCString writes up to |size| bytes,
+  // so reserve() alone would be undefined behavior.
+  std::vector<char> c_str_buf(size);
+  CFStringGetCString(cfstring, c_str_buf.data(), size, kCFStringEncodingUTF8);
+  return out << c_str_buf.data();
+}
+
+std::ostream& operator<<(std::ostream& out, const CFNumberRef& cfnumber) {
+  if (!cfnumber) {
+    return out << "null";
+  }
+
+  base::ScopedCFTypeRef<CFNumberFormatterRef> formatter(CFNumberFormatterCreate(
+      kCFAllocatorDefault, CFLocaleGetSystem(), kCFNumberFormatterNoStyle));
+  base::ScopedCFTypeRef<CFStringRef> as_str(
+      CFNumberFormatterCreateStringWithNumber(
+          kCFAllocatorDefault, formatter, cfnumber));
+  return out << as_str;
+}
+
+std::ostream& operator<<(std::ostream& out, const CFBooleanRef& cfboolean) {
+  if (!cfboolean) {
+    return out << "null";
+  }
+
+  base::ScopedCFTypeRef<CFStringRef> as_str(
+      CFBooleanGetValue(cfboolean) ? CFSTR("true") : CFSTR("false"));
+  return out << as_str;
+}
+
+struct CFTypeEmittable {
+  explicit CFTypeEmittable(CFTypeRef cfobject) : cfobject_(cfobject) {}
+  explicit operator bool() const { return cfobject_ != nullptr; }
+  operator CFTypeRef() const { return cfobject_; }
+  CFTypeRef get() const { return cfobject_; }
+  friend std::ostream& operator<<(std::ostream&, const CFTypeEmittable&);
+  CFTypeRef cfobject_;
+};
+
+std::ostream& operator<<(std::ostream& out, const CFTypeEmittable& emittable) {
+  if (!emittable) {
+    return out << "null";
+  }
+
+  if (CFGetTypeID(emittable) == CFStringGetTypeID()) {
+    return out << static_cast<CFStringRef>(emittable.get());
+  } else if (CFGetTypeID(emittable) == CFNumberGetTypeID()) {
+    return out << static_cast<CFNumberRef>(emittable.get());
+  } else if (CFGetTypeID(emittable) == CFBooleanGetTypeID()) {
+    return out << static_cast<CFBooleanRef>(emittable.get());
+  }
+  base::ScopedCFTypeRef<CFStringRef> as_str(CFCopyDescription(emittable));
+  return out << as_str;
+}
+
+std::ostream& operator<<(std::ostream& out, const CMTime& time) {
+  return out << "{value=" << time.value << ", timescale=" << time.timescale
+             << ", flags=" << time.flags << ", epoch=" << time.epoch << "}";
+}
+
+std::ostream& operator<<(std::ostream& out,
+                         const CMSampleTimingInfo& timing_info) {
+  return out << "{duration=" << timing_info.duration
+             << ", pts=" << timing_info.presentationTimeStamp
+             << ", dts=" << timing_info.decodeTimeStamp << "}";
+}
+
+#pragma mark -
+
+template <typename T>
+bool SetSessionProperty(VTSessionRef session,
Robert Sesek
2014/08/07 22:49:22
Is this really templatized for just logging purposes?
jfroy
2014/08/07 23:06:11
Mostly yes, but it's also nice to have setters with typed values.
+                        CFStringRef key,
+                        T value,
+                        CFTypeRef cfvalue) {
+  DVLOG(3) << __func__ << ": " << key << "=" << value;
+  OSStatus status = VTSessionSetProperty(session, key, cfvalue);
+  if (status != noErr) {
+    DLOG(ERROR) << __func__
+                << " VTSessionSetProperty failed: " << GetVTErrorString(status)
+                << " (" << status << ") " << key << "=" << value;
+  }
+  return status == noErr;
+}
+
+static bool SetSessionProperty(VTSessionRef session,
+                               CFStringRef key,
+                               uint32_t value) {
+  base::ScopedCFTypeRef<CFNumberRef> cfvalue(
+      CFNumberCreate(nullptr, kCFNumberSInt32Type, &value));
+  return SetSessionProperty(session, key, value, cfvalue);
+}
+
+static bool SetSessionProperty(VTSessionRef session,
+                               CFStringRef key,
+                               bool value) {
+  CFBooleanRef cfvalue = (value) ? kCFBooleanTrue : kCFBooleanFalse;
+  return SetSessionProperty(session, key, value, cfvalue);
+}
+
+static bool SetSessionProperty(VTSessionRef session,
+                               CFStringRef key,
+                               CFStringRef value) {
+  return SetSessionProperty(session, key, value, value);
+}
+
+static base::ScopedCFTypeRef<CFDictionaryRef> DictionaryWithKeyValue(
+    CFTypeRef key,
+    CFTypeRef value) {
+  CFTypeRef keys[1] = {key};
+  CFTypeRef values[1] = {value};
+  return base::ScopedCFTypeRef<CFDictionaryRef>(
+      CFDictionaryCreate(kCFAllocatorDefault,
+                         keys,
+                         values,
+                         1,
+                         &kCFTypeDictionaryKeyCallBacks,
+                         &kCFTypeDictionaryValueCallBacks));
+}
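
DictionaryWithKeyValue relies on the standard kCFType callbacks, so the
dictionary retains its key and value and releases them when it is destroyed.
A minimal standalone sketch of the same pattern (CoreFoundation only; main()
and the literal key and value are illustrative, not part of this patch):

    #include <CoreFoundation/CoreFoundation.h>
    #include <cassert>

    int main() {
      CFTypeRef keys[1] = {CFSTR("AverageBitRate")};
      int bitrate = 2000000;
      CFNumberRef value =
          CFNumberCreate(kCFAllocatorDefault, kCFNumberIntType, &bitrate);
      CFTypeRef values[1] = {value};
      CFDictionaryRef dict =
          CFDictionaryCreate(kCFAllocatorDefault, keys, values, 1,
                             &kCFTypeDictionaryKeyCallBacks,
                             &kCFTypeDictionaryValueCallBacks);
      // The kCFType callbacks retained |value|, so the dictionary keeps its
      // own reference and ours can be dropped.
      CFRelease(value);
      int out = 0;
      CFNumberGetValue(static_cast<CFNumberRef>(CFDictionaryGetValue(
                           dict, CFSTR("AverageBitRate"))),
                       kCFNumberIntType, &out);
      assert(out == 2000000);
      CFRelease(dict);
      return 0;
    }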
+
+#pragma mark -
+
+struct H264VideoToolboxEncoder::FrameContext {
+  base::TimeTicks capture_time;
+  FrameEncodedCallback frame_encoded_callback;
+};
+
+H264VideoToolboxEncoder::H264VideoToolboxEncoder(
+    scoped_refptr<CastEnvironment> cast_environment,
+    const VideoSenderConfig& video_config)
+    : cast_environment_(cast_environment),
+      cast_config_(video_config),
+      frame_id_(kStartFrameId),
+      last_keyframe_id_(kStartFrameId),
+      encode_next_frame_as_keyframe_(false) {
+  Initialize();
Robert Sesek
2014/08/07 22:49:23
You only call this here, so why is it a separate method?
jfroy
2014/08/07 23:06:11
The current code doesn't do it, but I have a suspicion it will need to be called from elsewhere eventually.
+}
+
+H264VideoToolboxEncoder::~H264VideoToolboxEncoder() {
+  Teardown();
Robert Sesek
2014/08/07 22:49:22
Same.
jfroy
2014/08/07 23:06:11
See my reply above.
+}
+
+CVPixelBufferPoolRef H264VideoToolboxEncoder::cv_pixel_buffer_pool() const {
+  DCHECK(thread_checker_.CalledOnValidThread());
+  DCHECK(compression_session_);
+  return VTCompressionSessionGetPixelBufferPool(compression_session_);
+}
+
+void H264VideoToolboxEncoder::Initialize() {
+  DCHECK(thread_checker_.CalledOnValidThread());
+  DCHECK(!compression_session_);
+
+  DVLOG(3) << __func__ << " width: " << cast_config_.width
+           << ", height: " << cast_config_.height
+           << ", start_bitrate: " << cast_config_.start_bitrate
+           << ", max_frame_rate: " << cast_config_.max_frame_rate;
+
+  // Note that the encoder object is given to the compression session as the
+  // callback context using a raw pointer. The C API does not allow us to use
+  // a smart pointer, nor is this encoder ref counted. However, this is still
+  // safe because 1) we own the compression session and 2) we tear it down
+  // safely. When destructing the encoder, the compression session is flushed
+  // and invalidated. Internally, VideoToolbox will join all of its threads
+  // before returning to the client. Therefore, when control returns to us, we
+  // are guaranteed that the output callback will not execute again.
+
+  // On OS X, allow the hardware encoder, but don't require it: it does not
+  // support all configurations (some of which are used for testing).
+  DictionaryPtr encoder_spec(nullptr);
+#if !defined(OS_IOS)
+  encoder_spec = DictionaryWithKeyValue(
+      kVTVideoEncoderSpecification_EnableHardwareAcceleratedVideoEncoder,
+      kCFBooleanTrue);
+#endif
+
+  VTCompressionSessionRef session;
+  OSStatus status =
+      VTCompressionSessionCreate(kCFAllocatorDefault,
+                                 cast_config_.width,
+                                 cast_config_.height,
+                                 kCMVideoCodecType_H264,
+                                 encoder_spec,
+                                 nullptr /* sourceImageBufferAttributes */,
+                                 nullptr /* compressedDataAllocator */,
+                                 CompressionCallback,
+                                 reinterpret_cast<void*>(this),
+                                 &session);
+  if (status != noErr) {
+    DLOG(ERROR) << __func__ << " VTCompressionSessionCreate failed: "
+                << GetVTErrorString(status) << " (" << status << ")";
+    return;
+  }
+  compression_session_.reset(session);
+
+#if defined(OS_IOS)
+  using_hardware_ = true;
+#else
+  CFBooleanRef using_hardware_cf = nullptr;
+  status = VTSessionCopyProperty(
+      session,
+      kVTCompressionPropertyKey_UsingHardwareAcceleratedVideoEncoder,
+      kCFAllocatorDefault,
+      &using_hardware_cf);
+  if (status == noErr) {
+    using_hardware_ = CFBooleanGetValue(using_hardware_cf);
+    CFRelease(using_hardware_cf);
+  }
+  DVLOG(3) << __func__ << " using hardware: " << using_hardware_;
+#endif
+
+  ConfigureSession();
+}
+
+static void SetConfigurationApplier(CFStringRef key,
+                                    CFTypeRef value,
+                                    VTCompressionSessionRef session) {
+  SetSessionProperty(session, key, CFTypeEmittable(value), value);
+}
+
+void H264VideoToolboxEncoder::ConfigureSession() {
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_ProfileLevel,
+                     kVTProfileLevel_H264_Main_AutoLevel);
+
+  SetSessionProperty(
+      compression_session_, kVTCompressionPropertyKey_RealTime, true);
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_AllowFrameReordering,
+                     false);
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_MaxKeyFrameInterval,
+                     240u);
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_MaxKeyFrameIntervalDuration,
+                     240u);
+
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_AverageBitRate,
+                     static_cast<uint32_t>(cast_config_.start_bitrate));
+
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_ExpectedFrameRate,
+                     static_cast<uint32_t>(cast_config_.max_frame_rate));
+
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_ColorPrimaries,
+                     kCVImageBufferColorPrimaries_ITU_R_709_2);
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_TransferFunction,
+                     kCVImageBufferTransferFunction_ITU_R_709_2);
+  SetSessionProperty(compression_session_,
+                     kVTCompressionPropertyKey_YCbCrMatrix,
+                     kCVImageBufferYCbCrMatrix_ITU_R_709_2);
+
+  if (compression_properties_) {
+    CFDictionaryApplyFunction(
+        compression_properties_,
+        reinterpret_cast<CFDictionaryApplierFunction>(SetConfigurationApplier),
+        compression_session_.get());
+  }
+}
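
SetSessionProperty only logs failures, so nothing above confirms that a
property actually took effect. Where that matters, the value can be read back
with VTSessionCopyProperty. A hedged sketch (the helper name
VerifyUint32Property is illustrative, not part of this patch):

    static bool VerifyUint32Property(VTSessionRef session,
                                     CFStringRef key,
                                     uint32_t expected) {
      CFNumberRef cfvalue = nullptr;
      OSStatus status =
          VTSessionCopyProperty(session, key, kCFAllocatorDefault, &cfvalue);
      if (status != noErr || !cfvalue)
        return false;
      uint32_t actual = 0;
      CFNumberGetValue(cfvalue, kCFNumberSInt32Type, &actual);
      CFRelease(cfvalue);
      return actual == expected;
    }

For example, calling it with kVTCompressionPropertyKey_AverageBitRate after
ConfigureSession() would confirm whether the bitrate request was accepted.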
+
+void H264VideoToolboxEncoder::Teardown() {
+  DCHECK(thread_checker_.CalledOnValidThread());
+
+  // If the compression session exists, invalidate it. This blocks until all
+  // pending output callbacks have returned and any internal threads have
+  // joined, ensuring no output callback ever sees a dangling encoder pointer.
+  if (compression_session_) {
+    VTCompressionSessionInvalidate(compression_session_);
+    compression_session_.reset();
+  }
+}
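
The raw-pointer callback context set up in Initialize() is only safe because
this invalidate-before-destroy ordering blocks until every pending callback
has returned. A self-contained analog of that contract, with a toy session
standing in for VideoToolbox (all names here are illustrative):

    #include <thread>

    // Toy stand-in for a C API that invokes a callback on its own thread.
    struct ToySession {
      void (*callback)(void* ctx);
      void* ctx;
      std::thread worker;
      void Start() { worker = std::thread([this] { callback(ctx); }); }
      // Like VTCompressionSessionInvalidate: joins the worker thread, so no
      // callback can run after this returns.
      void Invalidate() {
        if (worker.joinable())
          worker.join();
      }
    };

    struct Encoder {
      ToySession session;
      Encoder() {
        session.callback = [](void* ctx) {
          static_cast<Encoder*>(ctx)->OnOutput();
        };
        session.ctx = this;  // Raw pointer, exactly as in Initialize().
        session.Start();
      }
      // Invalidate() runs before members are destroyed, so |this| outlives
      // every callback.
      ~Encoder() { session.Invalidate(); }
      void OnOutput() {}
    };

    int main() {
      Encoder encoder;
      return 0;
    }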
+
+#pragma mark -
+
+bool H264VideoToolboxEncoder::EncodeVideoFrame(
+    const scoped_refptr<media::VideoFrame>& video_frame,
+    const base::TimeTicks& capture_time,
+    const FrameEncodedCallback& frame_encoded_callback) {
+  DCHECK(thread_checker_.CalledOnValidThread());
+
+  if (!compression_session_) {
+    DLOG(ERROR) << __func__ << " compression session is null";
+    return false;
+  }
+
+  PixelBufferPtr pixel_buffer(video_frame->cv_pixel_buffer(),
+                              base::scoped_policy::RETAIN);
+  if (!pixel_buffer) {
+    pixel_buffer = WrapVideoFrame(video_frame);
+    if (!pixel_buffer) {
+      return false;
+    }
+  }
+
+  CMTime timestamp_cm;
+  if (capture_time.is_null()) {
+    timestamp_cm = kCMTimeInvalid;
+  } else {
+    timestamp_cm = CMTimeMake(capture_time.ToInternalValue(), USEC_PER_SEC);
+  }
+
+  FrameContext* fc = new FrameContext();
+  fc->capture_time = capture_time;
+  fc->frame_encoded_callback = frame_encoded_callback;
+
+  DVLOG(3) << __func__ << " pts: " << timestamp_cm;
+
+  DictionaryPtr frame_props(nullptr);
+  if (encode_next_frame_as_keyframe_) {
+    frame_props = DictionaryWithKeyValue(kVTEncodeFrameOptionKey_ForceKeyFrame,
+                                         kCFBooleanTrue);
+    encode_next_frame_as_keyframe_ = false;
+  }
+
+  VTEncodeInfoFlags info;
+  OSStatus status = VTCompressionSessionEncodeFrame(compression_session_,
+                                                    pixel_buffer,
+                                                    timestamp_cm,
+                                                    kCMTimeInvalid,
+                                                    frame_props,
+                                                    reinterpret_cast<void*>(fc),
+                                                    &info);
+  if (status != noErr) {
+    DLOG(ERROR) << __func__ << " VTCompressionSessionEncodeFrame failed: "
+                << GetVTErrorString(status) << " (" << status << ")";
+    // The output callback will never run for this frame, so free the context
+    // here to avoid leaking it.
+    delete fc;
+    return false;
+  }
+  if ((info & kVTEncodeInfo_FrameDropped)) {
+    DLOG(ERROR) << __func__ << " frame dropped";
+    return false;
+  }
+
+  return true;
+}
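
The CMTimeMake call above maps base::TimeTicks' internal microsecond count
onto a CMTime with a microseconds-per-second timescale. A standalone check of
that mapping (CoreMedia only; the sample value and the local kUsecPerSec
constant, equal to USEC_PER_SEC, are illustrative):

    #include <CoreMedia/CoreMedia.h>
    #include <cassert>
    #include <cstdint>

    int main() {
      const int32_t kUsecPerSec = 1000000;  // Same value as USEC_PER_SEC.
      // 2.5 seconds expressed in microseconds, as TimeTicks stores it.
      const int64_t ticks_us = 2500000;
      CMTime t = CMTimeMake(ticks_us, kUsecPerSec);
      // CMTimeGetSeconds recovers the original duration exactly here.
      assert(CMTimeGetSeconds(t) == 2.5);
      return 0;
    }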
+
+void H264VideoToolboxEncoder::SetBitRate(int new_bit_rate) {
+  DCHECK(thread_checker_.CalledOnValidThread());
+  // NOTE: VideoToolbox does not seem to support bitrate reconfiguration.
+}
+
+void H264VideoToolboxEncoder::GenerateKeyFrame() {
+  DCHECK(thread_checker_.CalledOnValidThread());
+  DCHECK(compression_session_);
+
+  encode_next_frame_as_keyframe_ = true;
+}
+
+void H264VideoToolboxEncoder::LatestFrameIdToReference(uint32 /*frame_id*/) {
+}
+
+#pragma mark -
+
+static void VideoFramePixelBufferReleaseCallback(void* frame_ref,
+                                                 const void* data,
+                                                 size_t size,
+                                                 size_t num_planes,
+                                                 const void* planes[]) {
+  free(const_cast<void*>(data));
+  reinterpret_cast<media::VideoFrame*>(frame_ref)->Release();
+}
+
+H264VideoToolboxEncoder::PixelBufferPtr H264VideoToolboxEncoder::WrapVideoFrame(
+    const scoped_refptr<media::VideoFrame>& frame) {
+  static const size_t MAX_PLANES = 3;
+
+  media::VideoFrame::Format format = frame->format();
+  size_t num_planes = media::VideoFrame::NumPlanes(format);
+  gfx::Size coded_size = frame->coded_size();
+
+  // media::VideoFrame only supports YUV formats, so there is no way to
+  // leverage VideoToolbox's ability to convert RGBA formats automatically. In
+  // addition, most of the media::VideoFrame formats are YVU, which VT does not
+  // support. Finally, media::VideoFrame formats do not carry any information
+  // about the color space, transform or any other colorimetric information
+  // that is generally needed to fully specify the input data. So essentially
+  // require that the input be YCbCr 4:2:0 (either planar or biplanar) and
+  // assume the standard video dynamic range for samples (although most modern
+  // HDTVs support full-range video these days).
+  OSType pixel_format;
+  if (format == media::VideoFrame::Format::I420) {
+    pixel_format = kCVPixelFormatType_420YpCbCr8Planar;
+  } else if (format == media::VideoFrame::Format::NV12) {
+    pixel_format = kCVPixelFormatType_420YpCbCr8BiPlanarVideoRange;
+  } else {
+    DLOG(ERROR) << __func__ << " unsupported frame format: " << format;
+    return PixelBufferPtr(nullptr);
+  }
+
+  // TODO(jfroy): Support extended pixels (i.e. padding).
+  if (frame->coded_size() != frame->visible_rect().size()) {
+    DLOG(ERROR) << __func__ << " frame with extended pixels not supported:"
+                << " coded_size: " << coded_size.ToString()
+                << ", visible_rect: " << frame->visible_rect().ToString();
+    return PixelBufferPtr(nullptr);
+  }
+
+  DCHECK_LE(num_planes, MAX_PLANES);
+  void* plane_ptrs[MAX_PLANES];
+  size_t plane_widths[MAX_PLANES];
+  size_t plane_heights[MAX_PLANES];
+  size_t plane_bytes_per_row[MAX_PLANES];
+  for (size_t plane_i = 0; plane_i < num_planes; ++plane_i) {
+    plane_ptrs[plane_i] = frame->data(plane_i);
+    gfx::Size plane_size =
+        media::VideoFrame::PlaneSize(format, plane_i, coded_size);
+    plane_widths[plane_i] = plane_size.width();
+    plane_heights[plane_i] = plane_size.height();
+    plane_bytes_per_row[plane_i] = frame->stride(plane_i);
+  }
+
+  // CVPixelBufferCreateWithPlanarBytes needs a dummy plane descriptor or the
+  // release callback will not execute. The descriptor is freed in the callback.
+  void* descriptor =
+      calloc(1,
+             std::max(sizeof(CVPlanarPixelBufferInfo_YCbCrPlanar),
+                      sizeof(CVPlanarPixelBufferInfo_YCbCrBiPlanar)));
+
+  // Wrap the frame's data in a CVPixelBuffer. Because this is a C API, we can't
+  // give it a smart pointer to the frame, so instead pass a raw pointer and
+  // increment the frame's reference count manually.
+  CVPixelBufferRef pixel_buffer;
+  CVReturn result =
+      CVPixelBufferCreateWithPlanarBytes(kCFAllocatorDefault,
+                                         coded_size.width(),
+                                         coded_size.height(),
+                                         pixel_format,
+                                         descriptor,
+                                         0,
+                                         num_planes,
+                                         plane_ptrs,
+                                         plane_widths,
+                                         plane_heights,
+                                         plane_bytes_per_row,
+                                         VideoFramePixelBufferReleaseCallback,
+                                         frame.get(),
+                                         nullptr,
+                                         &pixel_buffer);
+  if (result != kCVReturnSuccess) {
+    DLOG(ERROR) << __func__ << " CVPixelBufferCreateWithPlanarBytes failed: "
+                << GetCVErrorString(result) << " (" << result << ")";
+    return PixelBufferPtr(nullptr);
+  }
+
+  // The CVPixelBuffer now references the data of the frame, so increment its
+  // reference count manually. The release callback set on the pixel buffer will
+  // release the frame.
+  frame->AddRef();
+
+  return PixelBufferPtr(pixel_buffer);
+}
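
WrapVideoFrame relies on media::VideoFrame::PlaneSize reporting half-size
chroma planes for 4:2:0 input. A standalone sketch of that geometry (plain
arithmetic, no media:: dependencies; the 1280x720 figures are just an
example):

    #include <cassert>
    #include <cstddef>

    int main() {
      const size_t width = 1280, height = 720;
      // I420: a full-resolution Y plane, then Cb and Cr at half resolution
      // in both dimensions.
      const size_t plane_widths[3] = {width, width / 2, width / 2};
      const size_t plane_heights[3] = {height, height / 2, height / 2};
      size_t total = 0;
      for (int i = 0; i < 3; ++i)
        total += plane_widths[i] * plane_heights[i];
      // 4:2:0 sampling at 8 bits per sample averages 1.5 bytes per pixel.
      assert(total == width * height * 3 / 2);
      return 0;
    }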
+
+#pragma mark -
+
+void H264VideoToolboxEncoder::CompressionCallback(void* encoder_opaque,
+                                                  void* frame_opaque,
+                                                  OSStatus status,
+                                                  VTEncodeInfoFlags info,
+                                                  CMSampleBufferRef sbuf) {
+  H264VideoToolboxEncoder* encoder =
+      reinterpret_cast<H264VideoToolboxEncoder*>(encoder_opaque);
+  scoped_ptr<FrameContext> fc(reinterpret_cast<FrameContext*>(frame_opaque));
+
+  if (status != noErr) {
+    DLOG(ERROR) << __func__ << " encoding failed: " << GetVTErrorString(status)
+                << " (" << status << ")";
+    return;
+  }
+  if ((info & kVTEncodeInfo_FrameDropped)) {
+    DVLOG(2) << __func__ << " frame dropped";
+    return;
+  }
+  CMItemCount sample_count = CMSampleBufferGetNumSamples(sbuf);
+  if (sample_count != 1) {
+    DLOG(ERROR) << __func__
+                << " expected exactly one sample in sample buffer, got: "
+                << sample_count;
+    return;
+  }
+
+  CFDictionaryRef sample_attachments =
+      static_cast<CFDictionaryRef>(CFArrayGetValueAtIndex(
+          CMSampleBufferGetSampleAttachmentsArray(sbuf, true), 0));
+
+  // If the NotSync key is not present, it implies Sync, which indicates a
+  // keyframe (the VT documentation is sparse on this point). Could
+  // alternatively use kCMSampleAttachmentKey_DependsOnOthers == false, as
+  // sketched after this function.
+  bool keyframe =
+      CFDictionaryContainsKey(sample_attachments,
+                              kCMSampleAttachmentKey_NotSync) == false;
+
+  // Generate a frame id and update the last keyframe id if needed.
+  // NOTE: VideoToolbox calls the output callback serially, so this is safe.
+  uint32 frame_id = ++encoder->frame_id_;
+  if (keyframe) {
+    encoder->last_keyframe_id_ = frame_id;
+  }
+
+  CMSampleTimingInfo timing_info;
+  CMSampleBufferGetSampleTimingInfo(sbuf, 0, &timing_info);
+  DVLOG(3) << __func__ << ", timing info: " << timing_info
+           << ", keyframe: " << keyframe << ", frame id: " << frame_id;
+
+  scoped_ptr<EncodedFrame> encoded_frame(new EncodedFrame());
+  encoded_frame->frame_id = frame_id;
+  encoded_frame->reference_time = fc->capture_time;
+  encoded_frame->rtp_timestamp = GetVideoRtpTimestamp(fc->capture_time);
+  if (keyframe) {
+    encoded_frame->dependency = EncodedFrame::KEY;
+    encoded_frame->referenced_frame_id = frame_id;
+  } else {
+    encoded_frame->dependency = EncodedFrame::DEPENDENT;
+    // NOTE: Technically wrong, but without parsing the NALs our best guess is
+    // the last keyframe.
+    encoded_frame->referenced_frame_id = encoder->last_keyframe_id_;
+  }
+
+  CopySampleBufferToAnnexBBuffer(sbuf, &encoded_frame->data, keyframe);
+
+  encoder->cast_environment_->PostTask(
+      CastEnvironment::MAIN,
+      FROM_HERE,
+      base::Bind(fc->frame_encoded_callback, base::Passed(&encoded_frame)));
+}
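
The alternative keyframe test mentioned above, using
kCMSampleAttachmentKey_DependsOnOthers, would look roughly like this (a
sketch; the helper name is illustrative, not part of this patch):

    static bool IsKeyFrameByDependency(CFDictionaryRef sample_attachments) {
      // A sample that depends on no other samples is decodable on its own,
      // which is what a keyframe means here. A missing key is treated the
      // same as kCFBooleanFalse.
      CFBooleanRef depends = static_cast<CFBooleanRef>(CFDictionaryGetValue(
          sample_attachments, kCMSampleAttachmentKey_DependsOnOthers));
      return !depends || !CFBooleanGetValue(depends);
    }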
+
+template <typename NalSizeType>
+static void CopyNalsToAnnexB(char* avcc_buffer,
+                             const size_t avcc_size,
+                             std::string* annexb_buffer) {
+  static_assert(sizeof(NalSizeType) == 1 || sizeof(NalSizeType) == 2 ||
+                sizeof(NalSizeType) == 4,
+                "NAL size type has unsupported size");
+  static const char startcode_3[3] = {0, 0, 1};
+  DCHECK(avcc_buffer);
+  DCHECK(annexb_buffer);
+  size_t bytes_left = avcc_size;
+  while (bytes_left > 0) {
+    DCHECK_GT(bytes_left, sizeof(NalSizeType));
+    NalSizeType nal_size;
+    base::ReadBigEndian(avcc_buffer, &nal_size);
+    bytes_left -= sizeof(NalSizeType);
+    avcc_buffer += sizeof(NalSizeType);
+
+    DCHECK_GE(bytes_left, nal_size);
+    annexb_buffer->append(startcode_3, sizeof(startcode_3));
+    annexb_buffer->append(avcc_buffer, nal_size);
+    bytes_left -= nal_size;
+    avcc_buffer += nal_size;
+  }
+}
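
To make the AVCC-to-Annex-B rewrite concrete, here is a standalone round-trip
over a two-NAL buffer with 4-byte length headers (the big-endian read is
hand-rolled in place of base::ReadBigEndian, and all byte values are made
up):

    #include <cassert>
    #include <cstdint>
    #include <string>

    int main() {
      // Two NALs in AVCC form: a 2-byte NAL {0x65, 0xAA} and a 1-byte NAL
      // {0x41}, each preceded by a 4-byte big-endian length field.
      const char avcc[] = {0, 0, 0, 2, 0x65, '\xAA', 0, 0, 0, 1, 0x41};
      std::string annexb;
      size_t i = 0;
      while (i < sizeof(avcc)) {
        // Hand-rolled stand-in for base::ReadBigEndian<uint32_t>.
        uint32_t nal_size = 0;
        for (int b = 0; b < 4; ++b)
          nal_size = (nal_size << 8) | static_cast<uint8_t>(avcc[i++]);
        annexb.append("\x00\x00\x01", 3);  // 3-byte Annex B start code.
        annexb.append(&avcc[i], nal_size);
        i += nal_size;
      }
      // Expected output: 00 00 01 65 AA 00 00 01 41.
      assert(annexb.size() == 9);
      assert(static_cast<uint8_t>(annexb[3]) == 0x65);
      assert(static_cast<uint8_t>(annexb[8]) == 0x41);
      return 0;
    }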
+
+void H264VideoToolboxEncoder::CopySampleBufferToAnnexBBuffer(
+    CMSampleBufferRef sbuf,
+    std::string* annexb_buffer,
+    bool keyframe) {
+  // Perform two passes: one to figure out the total output size, and another
+  // to copy the data after having performed a single output allocation. Note
+  // that we'll allocate a bit more because we'll count 4 bytes instead of 3
+  // for video NALs.
+
+  // TODO(jfroy): There is a bug in
+  // CMVideoFormatDescriptionGetH264ParameterSetAtIndex; iterate until it
+  // fails instead of relying on the reported parameter set count.
+
+  OSStatus status;
+
+  // Get the sample buffer's block buffer and format description.
+  CMBlockBufferRef bb = CMSampleBufferGetDataBuffer(sbuf);
+  DCHECK(bb);
+  CMFormatDescriptionRef fdesc = CMSampleBufferGetFormatDescription(sbuf);
+  DCHECK(fdesc);
+
+  size_t bb_size = CMBlockBufferGetDataLength(bb);
+  size_t total_bytes = bb_size;
+
+  size_t pset_count;
+  int nal_size_field_bytes;
+  status = CMVideoFormatDescriptionGetH264ParameterSetAtIndex(
+      fdesc, 0, nullptr, nullptr, &pset_count, &nal_size_field_bytes);
+  if (status == kCMFormatDescriptionBridgeError_InvalidParameter) {
+    DLOG(WARNING) << __func__ << " assuming 2 parameter sets and 4 bytes NAL "
+                                 "length header";
+    pset_count = 2;
+    nal_size_field_bytes = 4;
+  } else if (status != noErr) {
+    DLOG(ERROR)
+        << __func__
+        << " CMVideoFormatDescriptionGetH264ParameterSetAtIndex failed: "
+        << status;
+    return;
+  }
+
+  if (keyframe) {
+    const uint8_t* pset;
+    size_t pset_size;
+    for (size_t pset_i = 0; pset_i < pset_count; ++pset_i) {
+      status = CMVideoFormatDescriptionGetH264ParameterSetAtIndex(
+          fdesc, pset_i, &pset, &pset_size, nullptr, nullptr);
+      if (status != noErr) {
+        DLOG(ERROR)
+            << __func__
+            << " CMVideoFormatDescriptionGetH264ParameterSetAtIndex failed: "
+            << status;
+        return;
+      }
+      total_bytes += pset_size + nal_size_field_bytes;
+    }
+  }
+
+  annexb_buffer->reserve(total_bytes);
+
+  // Copy all parameter sets before keyframes.
+  if (keyframe) {
+    const uint8_t* pset;
+    size_t pset_size;
+    for (size_t pset_i = 0; pset_i < pset_count; ++pset_i) {
+      status = CMVideoFormatDescriptionGetH264ParameterSetAtIndex(
+          fdesc, pset_i, &pset, &pset_size, nullptr, nullptr);
+      if (status != noErr) {
+        DLOG(ERROR)
+            << __func__
+            << " CMVideoFormatDescriptionGetH264ParameterSetAtIndex failed: "
+            << status;
+        return;
+      }
+      static const char startcode_4[4] = {0, 0, 0, 1};
+      annexb_buffer->append(startcode_4, sizeof(startcode_4));
+      annexb_buffer->append(reinterpret_cast<const char*>(pset), pset_size);
+    }
+  }
+
+  // Block buffers can be composed of non-contiguous chunks. For the sake of
+  // keeping this code simple, flatten non-contiguous block buffers.
+  base::ScopedCFTypeRef<CMBlockBufferRef> contiguous_bb(
+      bb, base::scoped_policy::RETAIN);
+  if (!CMBlockBufferIsRangeContiguous(bb, 0, 0)) {
+    DVLOG(3) << __func__ << " copying block buffer to contiguous buffer";
+    contiguous_bb.reset();
+    status = CMBlockBufferCreateContiguous(kCFAllocatorDefault,
+                                           bb,
+                                           kCFAllocatorDefault,
+                                           nullptr,
+                                           0,
+                                           0,
+                                           0,
+                                           contiguous_bb.InitializeInto());
+    if (status != noErr) {
+      DLOG(ERROR) << __func__
+                  << " CMBlockBufferCreateContiguous failed: " << status;
+      return;
+    }
+  }
+
+  // Copy all the NAL units. In the process convert them from AVCC format
+  // (length header) to AnnexB format (start code).
+  char* bb_data;
+  status =
+      CMBlockBufferGetDataPointer(contiguous_bb, 0, nullptr, nullptr, &bb_data);
+  if (status != noErr) {
+    DLOG(ERROR) << __func__
+                << " CMBlockBufferGetDataPointer failed: " << status;
+    return;
+  }
+
+  if (nal_size_field_bytes == 1) {
+    CopyNalsToAnnexB<uint8_t>(bb_data, bb_size, annexb_buffer);
+  } else if (nal_size_field_bytes == 2) {
+    CopyNalsToAnnexB<uint16_t>(bb_data, bb_size, annexb_buffer);
+  } else if (nal_size_field_bytes == 4) {
+    CopyNalsToAnnexB<uint32_t>(bb_data, bb_size, annexb_buffer);
+  }
+}
+
+}  // namespace cast
+}  // namespace media