content/renderer/media_recorder/vpx_encoder.cc - Issue 2793303003: Refactor VideoTrackRecorder into smaller classes

Unified Diff: content/renderer/media_recorder/vpx_encoder.cc

Issue 2793303003: Refactor VideoTrackRecorder into smaller classes (Closed)

Patch Set: Created 3 years, 8 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Index: content/renderer/media_recorder/vpx_encoder.cc

diff --git a/content/renderer/media_recorder/vpx_encoder.cc b/content/renderer/media_recorder/vpx_encoder.cc

new file mode 100644

index 0000000000000000000000000000000000000000..65cb7403f9c51292ff7f796df57cdbc015048755

--- /dev/null

+++ b/content/renderer/media_recorder/vpx_encoder.cc

@@ -0,0 +1,308 @@

+// Use of this source code is governed by a BSD-style license that can be

+// found in the LICENSE file.

+#include "content/renderer/media_recorder/vpx_encoder.h"

+#include <algorithm>

+#include <string>

+#include "base/bind.h"

+#include "base/sys_info.h"

+#include "base/threading/thread.h"

+#include "base/trace_event/trace_event.h"

+#include "media/base/video_frame.h"

+#include "ui/gfx/geometry/size.h"

+using media::VideoFrame;

+using media::VideoFrameMetadata;

+namespace content {

+// Deleter functor for heap-allocated libvpx codec contexts (presumably the
+// deleter behind ScopedVpxCodecCtxPtr -- confirm in the header). Destroys the
+// codec with vpx_codec_destroy() and then frees the struct itself. A null
+// |codec| is a no-op.
+void VpxEncoder::VpxCodecDeleter::operator()(vpx_codec_ctx_t* codec) {
+  if (!codec)
+    return;
+  // CHECK (not DCHECK): a failed destroy is fatal in every build type.
+  const vpx_codec_err_t ret = vpx_codec_destroy(codec);
+  CHECK_EQ(ret, VPX_CODEC_OK);
+  delete codec;
+}

+// Returns the number of threads to hand to libvpx: half of the processors
+// reported by base::SysInfo (rounded up), capped at 8.
+static int GetNumberOfThreadsForEncoding() {
+  // Do not saturate CPU utilization just for encoding. On a lower-end system
+  // with only 1 or 2 cores, use only one thread for encoding. On systems with
+  // more cores, allow half of the cores to be used for encoding.
+  return std::min(8, (base::SysInfo::NumberOfProcessors() + 1) / 2);
+}

+// static
+// Stops |encoding_thread| and then releases it together with |encoder|. Both
+// are taken by value so that ownership is transferred into this call.
+void VpxEncoder::ShutdownEncoder(std::unique_ptr<base::Thread> encoding_thread,
+                                 ScopedVpxCodecCtxPtr encoder) {
+  DCHECK(encoding_thread->IsRunning());
+  encoding_thread->Stop();
+  // Both |encoding_thread| and |encoder| will be destroyed at end-of-scope.
+}

+// Builds an encoder for VP9 when |use_vp9| is true, VP8 otherwise. The callback
+// and |bits_per_second| are forwarded to the VideoTrackRecorder::Encoder base.
+// No libvpx encoder is created here; that happens in
+// ConfigureEncoderOnEncodingTaskRunner().
+VpxEncoder::VpxEncoder(
+    bool use_vp9,
+    const VideoTrackRecorder::OnEncodedVideoCB& on_encoded_video_callback,
+    int32_t bits_per_second)
+    : VideoTrackRecorder::Encoder(on_encoded_video_callback, bits_per_second),
+      use_vp9_(use_vp9) {
+  // A zero timebase denominator is the "not configured yet" sentinel that
+  // IsInitialized() tests for.
+  codec_config_.g_timebase.den = 0;        // Not initialized.
+  alpha_codec_config_.g_timebase.den = 0;  // Not initialized.
+  DCHECK(encoding_thread_->IsRunning());
+}

+// Hands ownership of the encoding thread and the main encoder to
+// ShutdownEncoder(), posted to |main_task_runner_|, so that the thread is
+// stopped there rather than inline in this destructor.
+// NOTE(review): |alpha_encoder_| is not handed over; presumably it is released
+// by ordinary member destruction -- confirm that is intended.
+VpxEncoder::~VpxEncoder() {
+  main_task_runner_->PostTask(
+      FROM_HERE,
+      base::Bind(&VpxEncoder::ShutdownEncoder, base::Passed(&encoding_thread_),
+                 base::Passed(&encoder_)));
+}

+// Always true: this encoder handles frames that carry an alpha plane (see the
+// alpha path in EncodeOnEncodingTaskRunner()).
+bool VpxEncoder::CanEncodeAlphaChannel() {
+  return true;
+}

+// Encodes |frame| on the encoding task runner and posts the encoded payload(s)
+// to |origin_task_runner_| via OnFrameEncodeCompleted.
+//
+// The main encoder is (re)configured whenever it is not yet initialized or the
+// visible frame size differs from the configured one. For PIXEL_FORMAT_YV12A
+// frames the same is done for a second, alpha encoder: the alpha plane is fed
+// to it as the Y plane, with constant 0x80 buffers standing in for U and V.
+// |capture_timestamp| is forwarded untouched to the completion callback.
+void VpxEncoder::EncodeOnEncodingTaskRunner(scoped_refptr<VideoFrame> frame,
+                                            base::TimeTicks capture_timestamp) {
+  TRACE_EVENT0("video", "VpxEncoder::EncodeOnEncodingTaskRunner");
+  DCHECK(encoding_task_runner_->BelongsToCurrentThread());
+  const gfx::Size frame_size = frame->visible_rect().size();
+  // Note: EstimateFrameDuration() also updates |last_frame_timestamp_|.
+  const base::TimeDelta duration = EstimateFrameDuration(frame);
+  // Captured now because |frame| is released before the reply is posted.
+  const media::WebmMuxer::VideoParameters video_params(frame);
+  if (!IsInitialized(codec_config_) ||
+      gfx::Size(codec_config_.g_w, codec_config_.g_h) != frame_size) {
+    ConfigureEncoderOnEncodingTaskRunner(frame_size, &codec_config_, &encoder_);
+  }
+  const bool frame_has_alpha = frame->format() == media::PIXEL_FORMAT_YV12A;
+  if (frame_has_alpha && (!IsInitialized(alpha_codec_config_) ||
+                          gfx::Size(alpha_codec_config_.g_w,
+                                    alpha_codec_config_.g_h) != frame_size)) {
+    ConfigureEncoderOnEncodingTaskRunner(frame_size, &alpha_codec_config_,
+                                         &alpha_encoder_);
+    // Rebuild the dummy chroma buffer for the new size: the U plane sits at
+    // offset 0 and the V plane right after it, at |v_plane_offset_|.
+    u_plane_stride_ = media::VideoFrame::RowBytes(
+        VideoFrame::kUPlane, frame->format(), frame_size.width());
+    v_plane_stride_ = media::VideoFrame::RowBytes(
+        VideoFrame::kVPlane, frame->format(), frame_size.width());
+    v_plane_offset_ = media::VideoFrame::PlaneSize(
+                          frame->format(), VideoFrame::kUPlane, frame_size)
+                          .GetArea();
+    alpha_dummy_planes_.resize(
+        v_plane_offset_ + media::VideoFrame::PlaneSize(
+                              frame->format(), VideoFrame::kVPlane, frame_size)
+                              .GetArea());
+    // It is more expensive to encode 0x00, so use 0x80 instead.
+    std::fill(alpha_dummy_planes_.begin(), alpha_dummy_planes_.end(), 0x80);
+  }
+  // If we introduced a new alpha frame, force keyframe.
+  const bool force_keyframe = frame_has_alpha && !last_frame_had_alpha_;
+  last_frame_had_alpha_ = frame_has_alpha;
+  std::unique_ptr<std::string> data(new std::string);
+  bool keyframe = false;
+  DoEncode(encoder_.get(), frame_size, frame->data(VideoFrame::kYPlane),
+           frame->visible_data(VideoFrame::kYPlane),
+           frame->stride(VideoFrame::kYPlane),
+           frame->visible_data(VideoFrame::kUPlane),
+           frame->stride(VideoFrame::kUPlane),
+           frame->visible_data(VideoFrame::kVPlane),
+           frame->stride(VideoFrame::kVPlane), duration, force_keyframe,
+           data.get(), &keyframe);
+  // Stays empty for frames without alpha.
+  std::unique_ptr<std::string> alpha_data(new std::string);
+  if (frame_has_alpha) {
+    bool alpha_keyframe = false;
+    // The alpha stream is forced to a keyframe whenever the main stream
+    // produced one, which is what the DCHECK below relies on.
+    DoEncode(alpha_encoder_.get(), frame_size, frame->data(VideoFrame::kAPlane),
+             frame->visible_data(VideoFrame::kAPlane),
+             frame->stride(VideoFrame::kAPlane), alpha_dummy_planes_.data(),
+             u_plane_stride_, alpha_dummy_planes_.data() + v_plane_offset_,
+             v_plane_stride_, duration, keyframe, alpha_data.get(),
+             &alpha_keyframe);
+    DCHECK_EQ(keyframe, alpha_keyframe);
+  }
+  // Drop our reference to the frame before posting the reply.
+  frame = nullptr;
+  origin_task_runner_->PostTask(
+      FROM_HERE,
+      base::Bind(OnFrameEncodeCompleted, on_encoded_video_callback_,
+                 video_params, base::Passed(&data), base::Passed(&alpha_data),
+                 capture_timestamp, keyframe));
+}

+// Encodes one I420 image with |encoder| and copies the first frame packet it
+// produces, if any, into |*output_data|.
+//
+// |data| is the buffer passed to vpx_img_wrap(); the wrapped image's plane
+// pointers and strides are then overwritten with |y_plane|/|u_plane|/|v_plane|
+// and |y_stride|/|u_stride|/|v_stride|. |duration| is handed to libvpx in
+// microseconds. |force_keyframe| requests VPX_EFLAG_FORCE_KF. On return,
+// |*keyframe| tells whether the copied packet is a key frame; it is false (and
+// |*output_data| is left untouched) when no frame packet was produced.
+void VpxEncoder::DoEncode(vpx_codec_ctx_t* const encoder,
+                          const gfx::Size& frame_size,
+                          uint8_t* const data,
+                          uint8_t* const y_plane,
+                          int y_stride,
+                          uint8_t* const u_plane,
+                          int u_stride,
+                          uint8_t* const v_plane,
+                          int v_stride,
+                          const base::TimeDelta& duration,
+                          bool force_keyframe,
+                          std::string* const output_data,
+                          bool* const keyframe) {
+  DCHECK(encoding_task_runner_->BelongsToCurrentThread());
+  vpx_image_t vpx_image;
+  vpx_image_t* const result =
+      vpx_img_wrap(&vpx_image, VPX_IMG_FMT_I420, frame_size.width(),
+                   frame_size.height(), 1 /* align */, data);
+  DCHECK_EQ(result, &vpx_image);
+  vpx_image.planes[VPX_PLANE_Y] = y_plane;
+  vpx_image.planes[VPX_PLANE_U] = u_plane;
+  vpx_image.planes[VPX_PLANE_V] = v_plane;
+  vpx_image.stride[VPX_PLANE_Y] = y_stride;
+  vpx_image.stride[VPX_PLANE_U] = u_stride;
+  vpx_image.stride[VPX_PLANE_V] = v_stride;
+  const vpx_codec_flags_t flags = force_keyframe ? VPX_EFLAG_FORCE_KF : 0;
+  // Encode the frame.  The presentation time stamp argument here is fixed to
+  // zero to force the encoder to base its single-frame bandwidth calculations
+  // entirely on |duration|.
+  const vpx_codec_err_t ret =
+      vpx_codec_encode(encoder, &vpx_image, 0 /* pts */,
+                       duration.InMicroseconds(), flags, VPX_DL_REALTIME);
+  DCHECK_EQ(ret, VPX_CODEC_OK)
+      << vpx_codec_err_to_string(ret) << ", #" << vpx_codec_error(encoder)
+      << " -" << vpx_codec_error_detail(encoder);
+  *keyframe = false;
+  vpx_codec_iter_t iter = nullptr;
+  const vpx_codec_cx_pkt_t* pkt = nullptr;
+  // Only the first compressed-frame packet is consumed; other packet kinds
+  // are skipped.
+  while ((pkt = vpx_codec_get_cx_data(encoder, &iter)) != nullptr) {
+    if (pkt->kind != VPX_CODEC_CX_FRAME_PKT)
+      continue;
+    output_data->assign(static_cast<char*>(pkt->data.frame.buf),
+                        pkt->data.frame.sz);
+    *keyframe = (pkt->data.frame.flags & VPX_FRAME_IS_KEY) != 0;
+    break;
+  }
+}

+// (Re)creates |*encoder| for frames of |size|. |*codec_config| is reset to the
+// libvpx defaults for the selected codec (VP8 or VP9) and then adjusted:
+// target bitrate, frame size, one-pass mode, microsecond timebase, automatic
+// keyframe placement, thread count and zero lag. If |*codec_config| was
+// already initialized, the previous encoder instance is destroyed first.
+void VpxEncoder::ConfigureEncoderOnEncodingTaskRunner(
+    const gfx::Size& size,
+    vpx_codec_enc_cfg_t* codec_config,
+    ScopedVpxCodecCtxPtr* encoder) {
+  DCHECK(encoding_task_runner_->BelongsToCurrentThread());
+  if (IsInitialized(*codec_config)) {
+    // TODO(mcasas) VP8 quirk/optimisation: If the new |size| is less than or
+    // equal to the old size, in terms of area, the existing encoder instance
+    // could be reused after changing |codec_config->{g_w,g_h}|.
+    DVLOG(1) << "Destroying/Re-Creating encoder for new frame size: "
+             << gfx::Size(codec_config->g_w, codec_config->g_h).ToString()
+             << " --> " << size.ToString() << (use_vp9_ ? " vp9" : " vp8");
+    encoder->reset();
+  }
+  const vpx_codec_iface_t* codec_interface =
+      use_vp9_ ? vpx_codec_vp9_cx() : vpx_codec_vp8_cx();
+  vpx_codec_err_t result = vpx_codec_enc_config_default(
+      codec_interface, codec_config, 0 /* reserved */);
+  DCHECK_EQ(VPX_CODEC_OK, result);
+  // The scaling below assumes these library defaults.
+  DCHECK_EQ(320u, codec_config->g_w);
+  DCHECK_EQ(240u, codec_config->g_h);
+  DCHECK_EQ(256u, codec_config->rc_target_bitrate);
+  // Use the selected bitrate or adjust default bit rate to account for the
+  // actual size.  Note: |rc_target_bitrate| units are kbit per second.
+  if (bits_per_second_ > 0) {
+    codec_config->rc_target_bitrate = bits_per_second_ / 1000;
+  } else {
+    // Scale in 64 bits: with the default of 256, area * bitrate no longer
+    // fits in 32 bits once a frame exceeds ~16.7 million pixels.
+    const uint64_t scaled_bitrate = static_cast<uint64_t>(size.GetArea()) *
+                                    codec_config->rc_target_bitrate /
+                                    codec_config->g_w / codec_config->g_h;
+    codec_config->rc_target_bitrate =
+        static_cast<unsigned int>(scaled_bitrate);
+  }
+  // Both VP8/VP9 configuration should be Variable BitRate by default.
+  DCHECK_EQ(VPX_VBR, codec_config->rc_end_usage);
+  if (use_vp9_) {
+    // DCHECK that the profile selected by default is I420 (magic number 0).
+    DCHECK_EQ(0u, codec_config->g_profile);
+  } else {
+    // VP8 always produces frames instantaneously.
+    DCHECK_EQ(0u, codec_config->g_lag_in_frames);
+  }
+  DCHECK(size.width());
+  DCHECK(size.height());
+  codec_config->g_w = size.width();
+  codec_config->g_h = size.height();
+  codec_config->g_pass = VPX_RC_ONE_PASS;
+  // Timebase is the smallest interval used by the stream, can be set to the
+  // frame rate or to e.g. microseconds.
+  codec_config->g_timebase.num = 1;
+  codec_config->g_timebase.den = base::Time::kMicrosecondsPerSecond;
+  // Let the encoder decide where to place the Keyframes, between min and max.
+  // In VPX_KF_AUTO mode libvpx will sometimes emit keyframes regardless of min/
+  // max distance out of necessity.
+  // Note that due to http://crbug.com/440223, it might be necessary to force a
+  // key frame after 10,000 frames since decoding fails after 30,000 non-key
+  // frames.
+  // Forcing a keyframe in regular intervals also allows seeking in the
+  // resulting recording with decent performance.
+  codec_config->kf_mode = VPX_KF_AUTO;
+  codec_config->kf_min_dist = 0;
+  codec_config->kf_max_dist = 100;
+  codec_config->g_threads = GetNumberOfThreadsForEncoding();
+  // Number of frames to consume before producing output. Set for both codecs:
+  // it overrides the VP9 default and is already 0 for VP8 (DCHECKed above).
+  codec_config->g_lag_in_frames = 0;
+  encoder->reset(new vpx_codec_ctx_t);
+  const vpx_codec_err_t ret = vpx_codec_enc_init(
+      encoder->get(), codec_interface, codec_config, 0 /* flags */);
+  DCHECK_EQ(VPX_CODEC_OK, ret);
+  if (use_vp9_) {
+    // Values of VP8E_SET_CPUUSED greater than 0 will increase encoder speed at
+    // the expense of quality up to a maximum value of 8 for VP9, by tuning the
+    // target time spent encoding the frame. Go from 8 to 5 (values for real
+    // time encoding) depending on the amount of cores available in the system.
+    const int cpu_used =
+        std::max(5, 8 - base::SysInfo::NumberOfProcessors() / 2);
+    result = vpx_codec_control(encoder->get(), VP8E_SET_CPUUSED, cpu_used);
+    DLOG_IF(WARNING, VPX_CODEC_OK != result) << "VP8E_SET_CPUUSED failed";
+  }
+}

+// Returns whether |codec_config| has been through
+// ConfigureEncoderOnEncodingTaskRunner(). The constructor zeroes the timebase
+// denominator and configuration sets it to a non-zero value, so a non-zero
+// denominator means "configured".
+bool VpxEncoder::IsInitialized(const vpx_codec_enc_cfg_t& codec_config) const {
+  DCHECK(encoding_task_runner_->BelongsToCurrentThread());
+  return codec_config.g_timebase.den != 0;
+}

+// Returns the duration to assume for |frame|, clamped to [1 ms, 1/8 s].
+//
+// The FRAME_DURATION metadata entry is used when present and positive.
+// Otherwise the gap between this frame's timestamp and the previous one is
+// used. Always records |frame|'s timestamp in |last_frame_timestamp_| as a
+// side effect.
+base::TimeDelta VpxEncoder::EstimateFrameDuration(
+    const scoped_refptr<VideoFrame>& frame) {
+  DCHECK(encoding_task_runner_->BelongsToCurrentThread());
+  using base::TimeDelta;
+  TimeDelta predicted_frame_duration;
+  if (!frame->metadata()->GetTimeDelta(VideoFrameMetadata::FRAME_DURATION,
+                                       &predicted_frame_duration) ||
+      predicted_frame_duration <= TimeDelta()) {
+    // The source of the video frame did not provide the frame duration.  Use
+    // the actual amount of time between the current and previous frame as a
+    // prediction for the next frame's duration.
+    // TODO(mcasas): This duration estimation could lead to artifacts if the
+    // cadence of the received stream is compromised (e.g. camera freeze, pause,
+    // remote packet loss).  Investigate using GetFrameRate() in this case.
+    predicted_frame_duration = frame->timestamp() - last_frame_timestamp_;
+  }
+  last_frame_timestamp_ = frame->timestamp();
+  // Make sure |predicted_frame_duration| is in a safe range of values.
+  const TimeDelta kMaxFrameDuration = TimeDelta::FromSecondsD(1.0 / 8);
+  const TimeDelta kMinFrameDuration = TimeDelta::FromMilliseconds(1);
+  return std::min(kMaxFrameDuration,
+                  std::max(predicted_frame_duration, kMinFrameDuration));
+}

+} // namespace content

« content/renderer/media_recorder/video_track_recorder.h ('K') | « content/renderer/media_recorder/vpx_encoder.h ('k') | no next file » | no next file with comments »