Index: source/libvpx/vp9/encoder/vp9_pickmode.c |
=================================================================== |
--- source/libvpx/vp9/encoder/vp9_pickmode.c (revision 293081) |
+++ source/libvpx/vp9/encoder/vp9_pickmode.c (working copy) |
@@ -65,7 +65,8 @@ |
different_ref_found = 1; |
if (candidate->ref_frame[0] == ref_frame) |
- ADD_MV_REF_LIST(get_sub_block_mv(candidate_mi, 0, mv_ref->col, -1)); |
+ ADD_MV_REF_LIST(get_sub_block_mv(candidate_mi, 0, mv_ref->col, -1), |
+ refmv_count, mv_ref_list, Done); |
} |
} |
@@ -82,7 +83,7 @@ |
different_ref_found = 1; |
if (candidate->ref_frame[0] == ref_frame) |
- ADD_MV_REF_LIST(candidate->mv[0]); |
+ ADD_MV_REF_LIST(candidate->mv[0], refmv_count, mv_ref_list, Done); |
} |
} |
@@ -97,7 +98,8 @@ |
* xd->mi_stride].src_mi->mbmi; |
// If the candidate is INTRA we don't want to consider its mv. |
- IF_DIFF_REF_FRAME_ADD_MV(candidate); |
+ IF_DIFF_REF_FRAME_ADD_MV(candidate, ref_frame, ref_sign_bias, |
+ refmv_count, mv_ref_list, Done); |
} |
} |
} |
@@ -439,7 +441,8 @@ |
vp9_predict_intra_block(xd, block >> (2 * tx_size), |
b_width_log2_lookup[plane_bsize], |
tx_size, args->mode, |
- p->src.buf, src_stride, |
+ x->skip_encode ? p->src.buf : pd->dst.buf, |
+ x->skip_encode ? src_stride : dst_stride, |
pd->dst.buf, dst_stride, |
i, j, 0); |
// This procedure assumes zero offset from p->src.buf and pd->dst.buf. |
@@ -450,22 +453,25 @@ |
args->dist += dist; |
} |
-static const THR_MODES mode_idx[MAX_REF_FRAMES - 1][INTER_MODES] = { |
+static const THR_MODES mode_idx[MAX_REF_FRAMES][4] = { |
+ {THR_DC, THR_H_PRED, THR_V_PRED, THR_TM}, |
{THR_NEARESTMV, THR_NEARMV, THR_ZEROMV, THR_NEWMV}, |
{THR_NEARESTG, THR_NEARG, THR_ZEROG, THR_NEWG}, |
{THR_NEARESTA, THR_NEARA, THR_ZEROA, THR_NEWA}, |
}; |
+static const PREDICTION_MODE intra_mode_list[] = { |
+ DC_PRED, V_PRED, H_PRED, TM_PRED |
+}; |
+ |
// TODO(jingning) placeholder for inter-frame non-RD mode decision. |
// this needs various further optimizations. to be continued.. |
void vp9_pick_inter_mode(VP9_COMP *cpi, MACROBLOCK *x, |
- const TileInfo *const tile, |
- int mi_row, int mi_col, |
- int *returnrate, |
- int64_t *returndistortion, |
- BLOCK_SIZE bsize, |
- PICK_MODE_CONTEXT *ctx) { |
+ TileDataEnc *tile_data, |
+ int mi_row, int mi_col, RD_COST *rd_cost, |
+ BLOCK_SIZE bsize, PICK_MODE_CONTEXT *ctx) { |
VP9_COMMON *const cm = &cpi->common; |
+ TileInfo *const tile_info = &tile_data->tile_info; |
MACROBLOCKD *const xd = &x->e_mbd; |
MB_MODE_INFO *const mbmi = &xd->mi[0].src_mi->mbmi; |
struct macroblockd_plane *const pd = &xd->plane[0]; |
@@ -478,11 +484,8 @@ |
struct buf_2d yv12_mb[4][MAX_MB_PLANE]; |
static const int flag_list[4] = { 0, VP9_LAST_FLAG, VP9_GOLD_FLAG, |
VP9_ALT_FLAG }; |
- int64_t best_rd = INT64_MAX; |
- int64_t this_rd = INT64_MAX; |
+ RD_COST this_rdc, best_rdc; |
uint8_t skip_txfm = 0; |
- int rate = INT_MAX; |
- int64_t dist = INT64_MAX; |
// var_y and sse_y are saved to be used in skipping checking |
unsigned int var_y = UINT_MAX; |
unsigned int sse_y = UINT_MAX; |
@@ -498,8 +501,8 @@ |
const int8_t segment_id = mbmi->segment_id; |
const int *const rd_threshes = cpi->rd.threshes[segment_id][bsize]; |
- const int *const rd_thresh_freq_fact = cpi->rd.thresh_freq_fact[bsize]; |
- INTERP_FILTER filter_ref = cm->interp_filter; |
+ const int *const rd_thresh_freq_fact = tile_data->thresh_freq_fact[bsize]; |
+ INTERP_FILTER filter_ref; |
const int bsl = mi_width_log2_lookup[bsize]; |
const int pred_filter_search = cm->interp_filter == SWITCHABLE ? |
(((mi_row + mi_col) >> bsl) + |
@@ -519,8 +522,10 @@ |
PRED_BUFFER *best_pred = NULL; |
PRED_BUFFER *this_mode_pred = NULL; |
const int pixels_in_block = bh * bw; |
+ int reuse_inter_pred = cpi->sf.reuse_inter_pred_sby && ctx->pred_pixel_ready; |
+ int ref_frame_skip_mask = 0; |
- if (cpi->sf.reuse_inter_pred_sby) { |
+ if (reuse_inter_pred) { |
int i; |
for (i = 0; i < 3; i++) { |
#if CONFIG_VP9_HIGHBITDEPTH |
@@ -542,9 +547,17 @@ |
x->skip_encode = cpi->sf.skip_encode_frame && x->q_index < QIDX_SKIP_THRESH; |
x->skip = 0; |
+ if (xd->up_available) |
+ filter_ref = xd->mi[-xd->mi_stride].src_mi->mbmi.interp_filter; |
+ else if (xd->left_available) |
+ filter_ref = xd->mi[-1].src_mi->mbmi.interp_filter; |
+ else |
+ filter_ref = cm->interp_filter; |
+ |
// initialize mode decisions |
- *returnrate = INT_MAX; |
- *returndistortion = INT64_MAX; |
+ vp9_rd_cost_reset(&best_rdc); |
+ vp9_rd_cost_reset(&this_rdc); |
+ vp9_rd_cost_reset(rd_cost); |
vpx_memset(mbmi, 0, sizeof(MB_MODE_INFO)); |
mbmi->sb_type = bsize; |
mbmi->ref_frame[0] = NONE; |
@@ -555,29 +568,25 @@ |
EIGHTTAP : cm->interp_filter; |
mbmi->segment_id = segment_id; |
- for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) { |
- PREDICTION_MODE this_mode; |
+ for (ref_frame = LAST_FRAME; ref_frame <= GOLDEN_FRAME; ++ref_frame) { |
x->pred_mv_sad[ref_frame] = INT_MAX; |
frame_mv[NEWMV][ref_frame].as_int = INVALID_MV; |
frame_mv[ZEROMV][ref_frame].as_int = 0; |
- if (xd->up_available) |
- filter_ref = xd->mi[-xd->mi_stride].src_mi->mbmi.interp_filter; |
- else if (xd->left_available) |
- filter_ref = xd->mi[-1].src_mi->mbmi.interp_filter; |
- |
if (cpi->ref_frame_flags & flag_list[ref_frame]) { |
const YV12_BUFFER_CONFIG *yv12 = get_ref_frame_buffer(cpi, ref_frame); |
int_mv *const candidates = mbmi->ref_mvs[ref_frame]; |
const struct scale_factors *const sf = &cm->frame_refs[ref_frame - 1].sf; |
+ |
vp9_setup_pred_block(xd, yv12_mb[ref_frame], yv12, mi_row, mi_col, |
sf, sf); |
if (!cm->error_resilient_mode) |
- vp9_find_mv_refs(cm, xd, tile, xd->mi[0].src_mi, ref_frame, |
+ vp9_find_mv_refs(cm, xd, tile_info, xd->mi[0].src_mi, ref_frame, |
candidates, mi_row, mi_col); |
else |
- const_motion[ref_frame] = mv_refs_rt(cm, xd, tile, xd->mi[0].src_mi, |
+ const_motion[ref_frame] = mv_refs_rt(cm, xd, tile_info, |
+ xd->mi[0].src_mi, |
ref_frame, candidates, |
mi_row, mi_col); |
@@ -589,9 +598,24 @@ |
vp9_mv_pred(cpi, x, yv12_mb[ref_frame][0].buf, yv12->y_stride, |
ref_frame, bsize); |
} else { |
- continue; |
+ ref_frame_skip_mask |= (1 << ref_frame); |
} |
+ } |
+ for (ref_frame = LAST_FRAME; ref_frame <= GOLDEN_FRAME; ++ref_frame) { |
+ PREDICTION_MODE this_mode; |
+ int i = (ref_frame == LAST_FRAME) ? GOLDEN_FRAME : LAST_FRAME; |
+ |
+ if (!(cpi->ref_frame_flags & flag_list[ref_frame])) |
+ continue; |
+ |
+ if (cpi->ref_frame_flags & flag_list[i]) |
+ if (x->pred_mv_sad[ref_frame] > (x->pred_mv_sad[i] << 1)) |
+ ref_frame_skip_mask |= (1 << ref_frame); |
+ |
+ if (ref_frame_skip_mask & (1 << ref_frame)) |
+ continue; |
+ |
// Select prediction reference frames. |
xd->plane[0].pre[0] = yv12_mb[ref_frame][0]; |
@@ -603,28 +627,28 @@ |
for (this_mode = NEARESTMV; this_mode <= NEWMV; ++this_mode) { |
int rate_mv = 0; |
int mode_rd_thresh; |
+ int mode_index = mode_idx[ref_frame][INTER_OFFSET(this_mode)]; |
- if (const_motion[ref_frame] && |
- (this_mode == NEARMV || this_mode == ZEROMV)) |
+ if (const_motion[ref_frame] && this_mode == NEARMV) |
continue; |
if (!(cpi->sf.inter_mode_mask[bsize] & (1 << this_mode))) |
continue; |
- mode_rd_thresh = |
- rd_threshes[mode_idx[ref_frame - |
- LAST_FRAME][INTER_OFFSET(this_mode)]]; |
- if (rd_less_than_thresh(best_rd, mode_rd_thresh, |
- rd_thresh_freq_fact[this_mode])) |
+ mode_rd_thresh = rd_threshes[mode_index]; |
+ if (rd_less_than_thresh(best_rdc.rdcost, mode_rd_thresh, |
+ rd_thresh_freq_fact[mode_index])) |
continue; |
if (this_mode == NEWMV) { |
+ if (ref_frame > LAST_FRAME) |
+ continue; |
if (cpi->sf.partition_search_type != VAR_BASED_PARTITION && |
- this_rd < (int64_t)(1 << num_pels_log2_lookup[bsize])) |
+ this_rdc.rdcost < (int64_t)(1 << num_pels_log2_lookup[bsize])) |
continue; |
if (!combined_motion_search(cpi, x, bsize, mi_row, mi_col, |
&frame_mv[NEWMV][ref_frame], |
- &rate_mv, best_rd)) |
+ &rate_mv, best_rdc.rdcost)) |
continue; |
} |
@@ -639,8 +663,8 @@ |
// Search for the best prediction filter type, when the resulting |
// motion vector is at sub-pixel accuracy level for luma component, i.e., |
// the last three bits are all zeros. |
- if (cpi->sf.reuse_inter_pred_sby) { |
- if (this_mode == NEARESTMV) { |
+ if (reuse_inter_pred) { |
+ if (!this_mode_pred) { |
this_mode_pred = &tmp[3]; |
} else { |
this_mode_pred = &tmp[get_pred_buffer(tmp, 3)]; |
@@ -677,7 +701,7 @@ |
best_cost = cost; |
skip_txfm = x->skip_txfm[0]; |
- if (cpi->sf.reuse_inter_pred_sby) { |
+ if (reuse_inter_pred) { |
if (this_mode_pred != current_pred) { |
free_pred_buffer(this_mode_pred); |
this_mode_pred = current_pred; |
@@ -692,13 +716,13 @@ |
} |
} |
- if (cpi->sf.reuse_inter_pred_sby && this_mode_pred != current_pred) |
+ if (reuse_inter_pred && this_mode_pred != current_pred) |
free_pred_buffer(current_pred); |
mbmi->interp_filter = best_filter; |
mbmi->tx_size = pf_tx_size[mbmi->interp_filter]; |
- rate = pf_rate[mbmi->interp_filter]; |
- dist = pf_dist[mbmi->interp_filter]; |
+ this_rdc.rate = pf_rate[mbmi->interp_filter]; |
+ this_rdc.dist = pf_dist[mbmi->interp_filter]; |
var_y = pf_var[mbmi->interp_filter]; |
sse_y = pf_sse[mbmi->interp_filter]; |
x->skip_txfm[0] = skip_txfm; |
@@ -705,22 +729,26 @@ |
} else { |
mbmi->interp_filter = (filter_ref == SWITCHABLE) ? EIGHTTAP: filter_ref; |
vp9_build_inter_predictors_sby(xd, mi_row, mi_col, bsize); |
- model_rd_for_sb_y(cpi, bsize, x, xd, &rate, &dist, &var_y, &sse_y); |
+ model_rd_for_sb_y(cpi, bsize, x, xd, &this_rdc.rate, &this_rdc.dist, |
+ &var_y, &sse_y); |
} |
- rate += rate_mv; |
- rate += cpi->inter_mode_cost[mbmi->mode_context[ref_frame]] |
+ this_rdc.rate += rate_mv; |
+ this_rdc.rate += cpi->inter_mode_cost[mbmi->mode_context[ref_frame]] |
[INTER_OFFSET(this_mode)]; |
- this_rd = RDCOST(x->rdmult, x->rddiv, rate, dist); |
+ this_rdc.rdcost = RDCOST(x->rdmult, x->rddiv, |
+ this_rdc.rate, this_rdc.dist); |
// Skipping checking: test to see if this block can be reconstructed by |
// prediction only. |
if (cpi->allow_encode_breakout) { |
encode_breakout_test(cpi, x, bsize, mi_row, mi_col, ref_frame, |
- this_mode, var_y, sse_y, yv12_mb, &rate, &dist); |
+ this_mode, var_y, sse_y, yv12_mb, |
+ &this_rdc.rate, &this_rdc.dist); |
if (x->skip) { |
- rate += rate_mv; |
- this_rd = RDCOST(x->rdmult, x->rddiv, rate, dist); |
+ this_rdc.rate += rate_mv; |
+ this_rdc.rdcost = RDCOST(x->rdmult, x->rddiv, |
+ this_rdc.rate, this_rdc.dist); |
} |
} |
@@ -732,10 +760,8 @@ |
(void)ctx; |
#endif |
- if (this_rd < best_rd || x->skip) { |
- best_rd = this_rd; |
- *returnrate = rate; |
- *returndistortion = dist; |
+ if (this_rdc.rdcost < best_rdc.rdcost || x->skip) { |
+ best_rdc = this_rdc; |
best_mode = this_mode; |
best_pred_filter = mbmi->interp_filter; |
best_tx_size = mbmi->tx_size; |
@@ -742,13 +768,12 @@ |
best_ref_frame = ref_frame; |
skip_txfm = x->skip_txfm[0]; |
- if (cpi->sf.reuse_inter_pred_sby) { |
+ if (reuse_inter_pred) { |
free_pred_buffer(best_pred); |
- |
best_pred = this_mode_pred; |
} |
} else { |
- if (cpi->sf.reuse_inter_pred_sby) |
+ if (reuse_inter_pred) |
free_pred_buffer(this_mode_pred); |
} |
@@ -755,31 +780,14 @@ |
if (x->skip) |
break; |
} |
- // If the current reference frame is valid and we found a usable mode, |
- // we are done. |
- if (best_rd < INT64_MAX) |
+ |
+ // Check that a prediction mode has been selected. |
+ assert(best_rdc.rdcost < INT64_MAX); |
+ |
+ if (x->skip) |
break; |
} |
- // If best prediction is not in dst buf, then copy the prediction block from |
- // temp buf to dst buf. |
- if (best_pred != NULL && cpi->sf.reuse_inter_pred_sby && |
- best_pred->data != orig_dst.buf) { |
- pd->dst = orig_dst; |
-#if CONFIG_VP9_HIGHBITDEPTH |
- if (cm->use_highbitdepth) { |
- vp9_highbd_convolve_copy(best_pred->data, bw, pd->dst.buf, pd->dst.stride, |
- NULL, 0, NULL, 0, bw, bh, xd->bd); |
- } else { |
- vp9_convolve_copy(best_pred->data, bw, pd->dst.buf, pd->dst.stride, |
- NULL, 0, NULL, 0, bw, bh); |
- } |
-#else |
- vp9_convolve_copy(best_pred->data, bw, pd->dst.buf, pd->dst.stride, NULL, 0, |
- NULL, 0, bw, bh); |
-#endif // CONFIG_VP9_HIGHBITDEPTH |
- } |
- |
mbmi->mode = best_mode; |
mbmi->interp_filter = best_pred_filter; |
mbmi->tx_size = best_tx_size; |
@@ -790,21 +798,31 @@ |
// Perform intra prediction search, if the best SAD is above a certain |
// threshold. |
- if (!x->skip && best_rd > inter_mode_thresh && |
+ if (!x->skip && best_rdc.rdcost > inter_mode_thresh && |
bsize <= cpi->sf.max_intra_bsize) { |
- PREDICTION_MODE this_mode; |
struct estimate_block_intra_args args = { cpi, x, DC_PRED, 0, 0 }; |
const TX_SIZE intra_tx_size = |
MIN(max_txsize_lookup[bsize], |
tx_mode_to_biggest_tx_size[cpi->common.tx_mode]); |
+ int i; |
- if (cpi->sf.reuse_inter_pred_sby) { |
- pd->dst.buf = tmp[0].data; |
- pd->dst.stride = bw; |
+ if (reuse_inter_pred && best_pred != NULL) { |
+ if (best_pred->data == orig_dst.buf) { |
+ this_mode_pred = &tmp[get_pred_buffer(tmp, 3)]; |
+ vp9_convolve_copy(best_pred->data, best_pred->stride, |
+ this_mode_pred->data, this_mode_pred->stride, |
+ NULL, 0, NULL, 0, bw, bh); |
+ best_pred = this_mode_pred; |
+ } |
} |
+ pd->dst = orig_dst; |
- for (this_mode = DC_PRED; this_mode <= DC_PRED; ++this_mode) { |
+ for (i = 0; i < 4; ++i) { |
const TX_SIZE saved_tx_size = mbmi->tx_size; |
+ const PREDICTION_MODE this_mode = intra_mode_list[i]; |
+ if (!((1 << this_mode) & cpi->sf.intra_y_mode_mask[intra_tx_size])) |
+ continue; |
+ skip_txfm = x->skip_txfm[0]; |
args.mode = this_mode; |
args.rate = 0; |
args.dist = 0; |
@@ -811,17 +829,15 @@ |
mbmi->tx_size = intra_tx_size; |
vp9_foreach_transformed_block_in_plane(xd, bsize, 0, |
estimate_block_intra, &args); |
- mbmi->tx_size = saved_tx_size; |
- rate = args.rate; |
- dist = args.dist; |
- rate += cpi->mbmode_cost[this_mode]; |
- rate += intra_cost_penalty; |
- this_rd = RDCOST(x->rdmult, x->rddiv, rate, dist); |
+ this_rdc.rate = args.rate; |
+ this_rdc.dist = args.dist; |
+ this_rdc.rate += cpi->mbmode_cost[this_mode]; |
+ this_rdc.rate += intra_cost_penalty; |
+ this_rdc.rdcost = RDCOST(x->rdmult, x->rddiv, |
+ this_rdc.rate, this_rdc.dist); |
- if (this_rd + intra_mode_cost < best_rd) { |
- best_rd = this_rd; |
- *returnrate = rate; |
- *returndistortion = dist; |
+ if (this_rdc.rdcost + intra_mode_cost < best_rdc.rdcost) { |
+ best_rdc = this_rdc; |
mbmi->mode = this_mode; |
mbmi->tx_size = intra_tx_size; |
mbmi->ref_frame[0] = INTRA_FRAME; |
@@ -829,9 +845,40 @@ |
mbmi->mv[0].as_int = INVALID_MV; |
} else { |
x->skip_txfm[0] = skip_txfm; |
+ mbmi->tx_size = saved_tx_size; |
} |
} |
- if (cpi->sf.reuse_inter_pred_sby) |
- pd->dst = orig_dst; |
} |
+ |
+ pd->dst = orig_dst; |
+ |
+ if (reuse_inter_pred && best_pred != NULL) { |
+ if (best_pred->data != orig_dst.buf && is_inter_mode(mbmi->mode)) { |
+#if CONFIG_VP9_HIGHBITDEPTH |
+ if (cm->use_highbitdepth) |
+ vp9_highbd_convolve_copy(best_pred->data, best_pred->stride, |
+ pd->dst.buf, pd->dst.stride, NULL, 0, |
+ NULL, 0, bw, bh, xd->bd); |
+ else |
+ vp9_convolve_copy(best_pred->data, best_pred->stride, |
+ pd->dst.buf, pd->dst.stride, NULL, 0, |
+ NULL, 0, bw, bh); |
+#else |
+ vp9_convolve_copy(best_pred->data, best_pred->stride, |
+ pd->dst.buf, pd->dst.stride, NULL, 0, |
+ NULL, 0, bw, bh); |
+#endif |
+ } |
+ } |
+ |
+ if (is_inter_block(mbmi)) |
+ vp9_update_rd_thresh_fact(tile_data->thresh_freq_fact, |
+ cpi->sf.adaptive_rd_thresh, bsize, |
+ mode_idx[best_ref_frame][INTER_OFFSET(mbmi->mode)]); |
+ else |
+ vp9_update_rd_thresh_fact(tile_data->thresh_freq_fact, |
+ cpi->sf.adaptive_rd_thresh, bsize, |
+ mode_idx[INTRA_FRAME][mbmi->mode]); |
+ |
+ *rd_cost = best_rdc; |
} |