Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(228)

Unified Diff: media/filters/vp9_parser.h

Issue 2133993002: Parse VP9 compressed header (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master
Patch Set: reset curr_frame_info_ when Reset Created 4 years, 4 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View side-by-side diff with in-line comments
Download patch
« no previous file with comments | « media/filters/vp9_compressed_header_parser.cc ('k') | media/filters/vp9_parser.cc » ('j') | no next file with comments »
Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
Index: media/filters/vp9_parser.h
diff --git a/media/filters/vp9_parser.h b/media/filters/vp9_parser.h
index 4d430494170f48dae739febfd283fee09750f50b..acb88d7e76a443cfc12ac6ff20238ecc1699fd53 100644
--- a/media/filters/vp9_parser.h
+++ b/media/filters/vp9_parser.h
@@ -18,9 +18,10 @@
#include <deque>
+#include "base/callback.h"
#include "base/macros.h"
+#include "base/memory/weak_ptr.h"
#include "media/base/media_export.h"
-#include "media/filters/vp9_raw_bits_reader.h"
namespace media {
@@ -29,6 +30,9 @@ const int kVp9NumRefFramesLog2 = 3;
const size_t kVp9NumRefFrames = 1 << kVp9NumRefFramesLog2;
const uint8_t kVp9MaxProb = 255;
const size_t kVp9NumRefsPerFrame = 3;
+const size_t kVp9NumFrameContexts = 4;
+
+using Vp9Prob = uint8_t;
enum class Vp9ColorSpace {
UNKNOWN = 0,
@@ -41,15 +45,29 @@ enum class Vp9ColorSpace {
SRGB = 7,
};
-enum Vp9InterpFilter {
+enum Vp9InterpolationFilter {
EIGHTTAP = 0,
EIGHTTAP_SMOOTH = 1,
EIGHTTAP_SHARP = 2,
BILINEAR = 3,
- SWICHABLE = 4,
+ SWITCHABLE = 4,
+};
+
+enum Vp9RefType {
+ VP9_FRAME_INTRA = 0,
+ VP9_FRAME_LAST = 1,
+ VP9_FRAME_GOLDEN = 2,
+ VP9_FRAME_ALTREF = 3,
+ VP9_FRAME_MAX = 4,
+};
+
+enum Vp9ReferenceMode {
+ SINGLE_REFERENCE = 0,
+ COMPOUND_REFERENCE = 1,
+ REFERENCE_MODE_SELECT = 2,
};
-struct MEDIA_EXPORT Vp9Segmentation {
+struct MEDIA_EXPORT Vp9SegmentationParams {
static const size_t kNumSegments = 8;
static const size_t kNumTreeProbs = kNumSegments - 1;
static const size_t kNumPredictionProbs = 3;
@@ -69,7 +87,7 @@ struct MEDIA_EXPORT Vp9Segmentation {
uint8_t pred_probs[kNumPredictionProbs];
bool update_data;
- bool abs_delta;
+ bool abs_or_delta_update;
bool feature_enabled[kNumSegments][SEG_LVL_MAX];
int16_t feature_data[kNumSegments][SEG_LVL_MAX];
@@ -85,41 +103,80 @@ struct MEDIA_EXPORT Vp9Segmentation {
}
};
-struct MEDIA_EXPORT Vp9LoopFilter {
- enum Vp9FrameType {
- VP9_FRAME_INTRA = 0,
- VP9_FRAME_LAST = 1,
- VP9_FRAME_GOLDEN = 2,
- VP9_FRAME_ALTREF = 3,
- VP9_FRAME_MAX = 4,
- };
-
+struct MEDIA_EXPORT Vp9LoopFilterParams {
static const size_t kNumModeDeltas = 2;
- uint8_t filter_level;
- uint8_t sharpness_level;
+ uint8_t level;
+ uint8_t sharpness;
- bool mode_ref_delta_enabled;
- bool mode_ref_delta_update;
+ bool delta_enabled;
+ bool delta_update;
bool update_ref_deltas[VP9_FRAME_MAX];
int8_t ref_deltas[VP9_FRAME_MAX];
bool update_mode_deltas[kNumModeDeltas];
int8_t mode_deltas[kNumModeDeltas];
- uint8_t lvl[Vp9Segmentation::kNumSegments][VP9_FRAME_MAX][kNumModeDeltas];
+ // Calculated from above fields.
+ uint8_t lvl[Vp9SegmentationParams::kNumSegments][VP9_FRAME_MAX]
+ [kNumModeDeltas];
};
// Members of Vp9FrameHeader will be 0-initialized by Vp9Parser::ParseNextFrame.
struct MEDIA_EXPORT Vp9QuantizationParams {
bool IsLossless() const {
- return base_qindex == 0 && y_dc_delta == 0 && uv_dc_delta == 0 &&
- uv_ac_delta == 0;
+ return base_q_idx == 0 && delta_q_y_dc == 0 && delta_q_uv_dc == 0 &&
+ delta_q_uv_ac == 0;
}
- uint8_t base_qindex;
- int8_t y_dc_delta;
- int8_t uv_dc_delta;
- int8_t uv_ac_delta;
+ uint8_t base_q_idx;
+ int8_t delta_q_y_dc;
+ int8_t delta_q_uv_dc;
+ int8_t delta_q_uv_ac;
+};
+
+// Entropy context for frame parsing
+struct MEDIA_EXPORT Vp9FrameContext {
+ Vp9Prob tx_probs_8x8[2][1];
+ Vp9Prob tx_probs_16x16[2][2];
+ Vp9Prob tx_probs_32x32[2][3];
+
+ Vp9Prob coef_probs[4][2][2][6][6][3];
+ Vp9Prob skip_prob[3];
+ Vp9Prob inter_mode_probs[7][3];
+ Vp9Prob interp_filter_probs[4][2];
+ Vp9Prob is_inter_prob[4];
+
+ Vp9Prob comp_mode_prob[5];
+ Vp9Prob single_ref_prob[5][2];
+ Vp9Prob comp_ref_prob[5];
+
+ Vp9Prob y_mode_probs[4][9];
+ Vp9Prob uv_mode_probs[10][9];
+ Vp9Prob partition_probs[16][3];
+
+ Vp9Prob mv_joint_probs[3];
+ Vp9Prob mv_sign_prob[2];
+ Vp9Prob mv_class_probs[2][10];
+ Vp9Prob mv_class0_bit_prob[2];
+ Vp9Prob mv_bits_prob[2][10];
+ Vp9Prob mv_class0_fr_probs[2][2][3];
+ Vp9Prob mv_fr_probs[2][3];
+ Vp9Prob mv_class0_hp_prob[2];
+ Vp9Prob mv_hp_prob[2];
+};
+
+struct MEDIA_EXPORT Vp9CompressedHeader {
+ enum Vp9TxMode {
+ ONLY_4X4 = 0,
+ ALLOW_8X8 = 1,
+ ALLOW_16X16 = 2,
+ ALLOW_32X32 = 3,
+ TX_MODE_SELECT = 4,
+ TX_MODES = 5,
+ };
+
+ Vp9TxMode tx_mode;
+ Vp9ReferenceMode reference_mode;
};
// VP9 frame header.
@@ -130,12 +187,15 @@ struct MEDIA_EXPORT Vp9FrameHeader {
};
bool IsKeyframe() const;
- bool RefreshFlag(size_t i) const { return !!(refresh_flags & (1u << i)); }
+ bool IsIntra() const;
+ bool RefreshFlag(size_t i) const {
+ return !!(refresh_frame_flags & (1u << i));
+ }
uint8_t profile;
bool show_existing_frame;
- uint8_t frame_to_show;
+ uint8_t frame_to_show_map_idx;
FrameType frame_type;
@@ -144,32 +204,35 @@ struct MEDIA_EXPORT Vp9FrameHeader {
uint8_t bit_depth;
Vp9ColorSpace color_space;
- bool yuv_range;
+ bool color_range;
uint8_t subsampling_x;
uint8_t subsampling_y;
- // The range of width and height is 1..2^16.
- uint32_t width;
- uint32_t height;
- uint32_t display_width;
- uint32_t display_height;
+ // The range of frame_width and frame_height is 1..2^16.
+ uint32_t frame_width;
+ uint32_t frame_height;
+ uint32_t render_width;
+ uint32_t render_height;
bool intra_only;
- uint8_t reset_context;
- uint8_t refresh_flags;
- uint8_t frame_refs[kVp9NumRefsPerFrame];
- bool ref_sign_biases[kVp9NumRefsPerFrame];
+ uint8_t reset_frame_context;
+ uint8_t refresh_frame_flags;
+ uint8_t ref_frame_idx[kVp9NumRefsPerFrame];
+ bool ref_frame_sign_bias[Vp9RefType::VP9_FRAME_MAX];
bool allow_high_precision_mv;
- Vp9InterpFilter interp_filter;
+ Vp9InterpolationFilter interpolation_filter;
bool refresh_frame_context;
bool frame_parallel_decoding_mode;
uint8_t frame_context_idx;
+ // |frame_context_idx_to_save_probs| is to be used by save_probs() only, and
+ // |frame_context_idx| otherwise.
+ uint8_t frame_context_idx_to_save_probs;
Vp9QuantizationParams quant_params;
- uint8_t log2_tile_cols;
- uint8_t log2_tile_rows;
+ uint8_t tile_cols_log2;
+ uint8_t tile_rows_log2;
// Pointer to the beginning of frame data. It is a responsibility of the
// client of the Vp9Parser to maintain validity of this data while it is
@@ -180,10 +243,51 @@ struct MEDIA_EXPORT Vp9FrameHeader {
size_t frame_size;
// Size of compressed header in bytes.
- size_t first_partition_size;
+ size_t header_size_in_bytes;
// Size of uncompressed header in bytes.
size_t uncompressed_header_size;
+
+ Vp9CompressedHeader compressed_header;
+ // Initial frame entropy context after load_probs2(frame_context_idx).
+ Vp9FrameContext initial_frame_context;
+ // Current frame entropy context after header parsing.
+ Vp9FrameContext frame_context;
+};
+
+class Vp9FrameContextManager {
+ public:
+ // If context update is needed after decoding a frame, the client must
+ // execute this callback, passing the updated context state.
+ using ContextRefreshCallback = base::Callback<void(const Vp9FrameContext&)>;
+
+ static bool IsValidFrameContext(const Vp9FrameContext& context);
+
+ Vp9FrameContextManager();
+ ~Vp9FrameContextManager();
+ bool initialized() const { return initialized_; }
+ bool needs_client_update() const { return needs_client_update_; }
+ const Vp9FrameContext& frame_context() const;
+
+ // Resets to uninitialized state.
+ void Reset();
+
+ // Sets this context need update from parser's client. Returns a callback for
+ // update.
+ ContextRefreshCallback SetNeedsClientUpdate();
+
+ // Updates frame context.
+ void Update(const Vp9FrameContext& frame_context);
+
+ private:
+ // Updates frame context from parser's client.
+ void UpdateFromClient(const Vp9FrameContext& frame_context);
+
+ bool initialized_ = false;
+ bool needs_client_update_ = false;
+ Vp9FrameContext frame_context_;
+
+ base::WeakPtrFactory<Vp9FrameContextManager> weak_ptr_factory_;
};
// A parser for VP9 bitstream.
@@ -194,9 +298,40 @@ class MEDIA_EXPORT Vp9Parser {
kOk,
kInvalidStream,
kEOStream,
+ kAwaitingRefresh,
+ };
+
+ // The parsing context to keep track of references.
+ struct ReferenceSlot {
+ bool initialized;
+ uint32_t frame_width;
+ uint32_t frame_height;
+ uint8_t subsampling_x;
+ uint8_t subsampling_y;
+ uint8_t bit_depth;
+
+ // More fields for consistency checking.
+ uint8_t profile;
+ Vp9ColorSpace color_space;
+ };
+
+ // The parsing context that persists across frames.
+ struct Context {
+ void Reset();
+
+ // Segmentation and loop filter state.
+ Vp9SegmentationParams segmentation;
+ Vp9LoopFilterParams loop_filter;
+
+ // Frame references.
+ ReferenceSlot ref_slots[kVp9NumRefFrames];
+
+ Vp9FrameContextManager frame_context_managers[kVp9NumFrameContexts];
};
- Vp9Parser();
+ // The constructor. See ParseNextFrame() for comments for
+ // |parsing_compressed_header|.
+ explicit Vp9Parser(bool parsing_compressed_header);
~Vp9Parser();
// Set a new stream buffer to read from, starting at |stream| and of size
@@ -207,51 +342,54 @@ class MEDIA_EXPORT Vp9Parser {
// Parse the next frame in the current stream buffer, filling |fhdr| with
// the parsed frame header and updating current segmentation and loop filter
- // state. Return kOk if a frame has successfully been parsed, kEOStream if
- // there is no more data in the current stream buffer, or kInvalidStream
- // on error.
- Result ParseNextFrame(Vp9FrameHeader* fhdr);
+ // state. If |parsing_compressed_header_|, this function also fills
+ // |context_refresh_cb|, which is used to update frame context. If
+ // |*context_refresh_cb| is null, no callback is necessary.
+ // Return kOk if a frame has successfully been parsed,
+ // kEOStream if there is no more data in the current stream buffer,
+ // kAwaitingRefresh if this frame awaiting frame context update, or
+ // kInvalidStream on error.
+ Result ParseNextFrame(
+ Vp9FrameHeader* fhdr,
+ Vp9FrameContextManager::ContextRefreshCallback* context_refresh_cb);
// Return current segmentation state.
- const Vp9Segmentation& GetSegmentation() const { return segmentation_; }
+ const Vp9SegmentationParams& GetSegmentation() const {
+ return context_.segmentation;
+ }
// Return current loop filter state.
- const Vp9LoopFilter& GetLoopFilter() const { return loop_filter_; }
+ const Vp9LoopFilterParams& GetLoopFilter() const {
+ return context_.loop_filter;
+ }
// Clear parser state and return to an initialized state.
void Reset();
private:
- // The parsing context to keep track of references.
- struct ReferenceSlot {
- uint32_t width;
- uint32_t height;
+ class UncompressedHeaderParser;
+ class CompressedHeaderParser;
+
+ // Stores start pointer and size of each frame within the current superframe.
+ struct FrameInfo {
+ FrameInfo() = default;
+ FrameInfo(const uint8_t* ptr, off_t size);
+ bool IsValid() const { return ptr != nullptr; }
+ void Reset() { ptr = nullptr; }
+
+ // Starting address of the frame.
+ const uint8_t* ptr = nullptr;
+
+ // Size of the frame in bytes.
+ off_t size = 0;
};
- bool ParseSuperframe();
- uint8_t ReadProfile();
- bool VerifySyncCode();
- bool ReadBitDepthColorSpaceSampling(Vp9FrameHeader* fhdr);
- void ReadFrameSize(Vp9FrameHeader* fhdr);
- bool ReadFrameSizeFromRefs(Vp9FrameHeader* fhdr);
- void ReadDisplayFrameSize(Vp9FrameHeader* fhdr);
- Vp9InterpFilter ReadInterpFilter();
- void ReadLoopFilter();
- void ReadQuantization(Vp9QuantizationParams* quants);
- void ReadSegmentationMap();
- void ReadSegmentationData();
- void ReadSegmentation();
- void ReadTiles(Vp9FrameHeader* fhdr);
- bool ParseUncompressedHeader(const uint8_t* stream,
- off_t frame_size,
- Vp9FrameHeader* fhdr);
- void UpdateSlots(const Vp9FrameHeader* fhdr);
-
- void ResetLoopfilter();
- void SetupPastIndependence();
+ std::deque<FrameInfo> ParseSuperframe();
+
size_t GetQIndex(const Vp9QuantizationParams& quant, size_t segid) const;
- void SetupSegmentationDequant(const Vp9QuantizationParams& quant);
+ void SetupSegmentationDequant();
void SetupLoopFilter();
+ void UpdateSlots();
// Current address in the bitstream buffer.
const uint8_t* stream_;
@@ -259,29 +397,15 @@ class MEDIA_EXPORT Vp9Parser {
// Remaining bytes in stream_.
off_t bytes_left_;
- // Stores start pointer and size of each frame within the current superframe.
- struct FrameInfo {
- FrameInfo(const uint8_t* ptr, off_t size);
-
- // Starting address of the frame.
- const uint8_t* ptr;
-
- // Size of the frame in bytes.
- off_t size;
- };
+ bool parsing_compressed_header_;
// FrameInfo for the remaining frames in the current superframe to be parsed.
std::deque<FrameInfo> frames_;
- // Raw bits decoder for uncompressed frame header.
- Vp9RawBitsReader reader_;
-
- // Segmentation and loop filter state that persists across frames.
- Vp9Segmentation segmentation_;
- Vp9LoopFilter loop_filter_;
+ Context context_;
- // The parsing context to keep track of references.
- ReferenceSlot ref_slots_[kVp9NumRefFrames];
+ FrameInfo curr_frame_info_;
+ Vp9FrameHeader curr_frame_header_;
DISALLOW_COPY_AND_ASSIGN(Vp9Parser);
};
« no previous file with comments | « media/filters/vp9_compressed_header_parser.cc ('k') | media/filters/vp9_parser.cc » ('j') | no next file with comments »

Powered by Google App Engine
This is Rietveld 408576698