| Index: media/video/half_float_maker.cc
|
| diff --git a/media/video/half_float_maker.cc b/media/video/half_float_maker.cc
|
| new file mode 100644
|
| index 0000000000000000000000000000000000000000..49c56883d368ac9e1d24f699db8adc1dc99f884f
|
| --- /dev/null
|
| +++ b/media/video/half_float_maker.cc
|
| @@ -0,0 +1,91 @@
|
| +// Copyright (c) 2017 The Chromium Authors. All rights reserved.
|
| +// Use of this source code is governed by a BSD-style license that can be
|
| +// found in the LICENSE file.
|
| +
|
| +#include "media/video/half_float_maker.h"
|
| +#include "third_party/libyuv/include/libyuv.h"
|
| +
|
| +namespace media {
|
| +
|
| +// By OR-ing with 0x3800, 10-bit numbers become half-floats in the
|
| +// range [0.5..1) and 9-bit numbers get the range [0.5..0.75).
|
| +//
|
| +// Half-floats are evaluated as:
|
| +// float value = pow(2.0, exponent - 25) * (0x400 + fraction);
|
| +//
|
| +// In our case the exponent is 14 (since we or with 0x3800) and
|
| +// pow(2.0, 14-25) * 0x400 evaluates to 0.5 (our offset) and
|
| +// pow(2.0, 14-25) * fraction is [0..0.49951171875] for 10-bit and
|
| +// [0..0.24951171875] for 9-bit.
|
| +//
|
| +// https://en.wikipedia.org/wiki/Half-precision_floating-point_format
|
| +class HalfFloatMaker_xor : public HalfFloatMaker {
|
| + public:
|
| + explicit HalfFloatMaker_xor(int bits_per_channel)
|
| + : bits_per_channel_(bits_per_channel) {}
|
| + float Offset() const override { return 0.5; }
|
| + float Multiplier() const override {
|
| + int max_input_value = (1 << bits_per_channel_) - 1;
|
| + // 2 << 11 = 2048 would be 1.0 with our exponent.
|
| + return 2048.0 / max_input_value;
|
| + }
|
| + void MakeHalfFloats(const uint16_t* src, size_t num, uint16_t* dst) override {
|
| + // Micro-benchmarking indicates that the compiler does
|
| + // a good enough job of optimizing this loop that trying
|
| + // to manually operate on one uint64 at a time is not
|
| + // actually helpful.
|
| + // Note to future optimizers: Benchmark your optimizations!
|
| + for (size_t i = 0; i < num; i++)
|
| + dst[i] = src[i] | 0x3800;
|
| + }
|
| +
|
| + private:
|
| + int bits_per_channel_;
|
| +};
|
| +
|
| +// Convert plane of 16 bit shorts to half floats using libyuv.
|
| +class HalfFloatMaker_libyuv : public HalfFloatMaker {
|
| + public:
|
| + explicit HalfFloatMaker_libyuv(int bits_per_channel) {
|
| + int max_value = (1 << bits_per_channel) - 1;
|
| + // For less than 15 bits, we can give libyuv a multiplier of
|
| + // 1.0, which is faster on some platforms. If bits is 16 or larger,
|
| + // a multiplier of 1.0 would cause overflows. However, a multiplier
|
| + // of 1/max_value would cause subnormal floats, which perform
|
| + // very poorly on some platforms.
|
| + if (bits_per_channel <= 15) {
|
| + libyuv_multiplier_ = 1.0f;
|
| + } else {
|
| + // This multiplier makes sure that we avoid subnormal values.
|
| + libyuv_multiplier_ = 1.0f / 4096.0f;
|
| + }
|
| + resource_multiplier_ = 1.0f / libyuv_multiplier_ / max_value;
|
| + }
|
| + float Offset() const override { return 0.0f; }
|
| + float Multiplier() const override { return resource_multiplier_; }
|
| + void MakeHalfFloats(const uint16_t* src, size_t num, uint16_t* dst) override {
|
| + // Source and dest stride can be zero since we're only copying
|
| + // one row at a time.
|
| + int stride = 0;
|
| + int rows = 1;
|
| + libyuv::HalfFloatPlane(src, stride, dst, stride, libyuv_multiplier_, num,
|
| + rows);
|
| + }
|
| +
|
| + private:
|
| + float libyuv_multiplier_;
|
| + float resource_multiplier_;
|
| +};
|
| +
|
| +std::unique_ptr<HalfFloatMaker> HalfFloatMaker::NewHalfFloatMaker(
|
| + int bits_per_channel) {
|
| + if (bits_per_channel < 11) {
|
| + return std::unique_ptr<HalfFloatMaker>(
|
| + new HalfFloatMaker_xor(bits_per_channel));
|
| + } else {
|
| + return std::unique_ptr<HalfFloatMaker>(
|
| + new HalfFloatMaker_libyuv(bits_per_channel));
|
| + }
|
| +}
|
| +
|
| +} // namespace media
|
|
|