| Index: source/libvpx/vp9/encoder/vp9_quantize.c
 | 
| ===================================================================
 | 
| --- source/libvpx/vp9/encoder/vp9_quantize.c	(revision 240950)
 | 
| +++ source/libvpx/vp9/encoder/vp9_quantize.c	(working copy)
 | 
| @@ -22,7 +22,7 @@
 | 
|  extern int enc_debug;
 | 
|  #endif
 | 
|  
 | 
| -void vp9_quantize_b_c(const int16_t *coeff_ptr, intptr_t n_coeffs,
 | 
| +void vp9_quantize_b_c(const int16_t *coeff_ptr, intptr_t count,
 | 
|                        int skip_block,
 | 
|                        const int16_t *zbin_ptr, const int16_t *round_ptr,
 | 
|                        const int16_t *quant_ptr, const int16_t *quant_shift_ptr,
 | 
| @@ -30,58 +30,44 @@
 | 
|                        const int16_t *dequant_ptr,
 | 
|                        int zbin_oq_value, uint16_t *eob_ptr,
 | 
|                        const int16_t *scan, const int16_t *iscan) {
 | 
| -  int i, rc, eob;
 | 
| -  int zbins[2], nzbins[2], zbin;
 | 
| -  int x, y, z, sz;
 | 
| -  int zero_flag = n_coeffs;
 | 
| +  int i, non_zero_count = count, eob = -1;
 | 
| +  const int zbins[2] = { zbin_ptr[0] + zbin_oq_value,
 | 
| +                         zbin_ptr[1] + zbin_oq_value };
 | 
| +  const int nzbins[2] = { zbins[0] * -1,
 | 
| +                          zbins[1] * -1 };
 | 
|  
 | 
| -  vpx_memset(qcoeff_ptr, 0, n_coeffs*sizeof(int16_t));
 | 
| -  vpx_memset(dqcoeff_ptr, 0, n_coeffs*sizeof(int16_t));
 | 
| +  vpx_memset(qcoeff_ptr, 0, count * sizeof(int16_t));
 | 
| +  vpx_memset(dqcoeff_ptr, 0, count * sizeof(int16_t));
 | 
|  
 | 
| -  eob = -1;
 | 
| -
 | 
| -  // Base ZBIN
 | 
| -  zbins[0] = zbin_ptr[0] + zbin_oq_value;
 | 
| -  zbins[1] = zbin_ptr[1] + zbin_oq_value;
 | 
| -  nzbins[0] = zbins[0] * -1;
 | 
| -  nzbins[1] = zbins[1] * -1;
 | 
| -
 | 
|    if (!skip_block) {
 | 
|      // Pre-scan pass
 | 
| -    for (i = n_coeffs - 1; i >= 0; i--) {
 | 
| -      rc = scan[i];
 | 
| -      z = coeff_ptr[rc];
 | 
| +    for (i = count - 1; i >= 0; i--) {
 | 
| +      const int rc = scan[i];
 | 
| +      const int coeff = coeff_ptr[rc];
 | 
|  
 | 
| -      if (z < zbins[rc != 0] && z > nzbins[rc != 0]) {
 | 
| -        zero_flag--;
 | 
| -      } else {
 | 
| +      if (coeff < zbins[rc != 0] && coeff > nzbins[rc != 0])
 | 
| +        non_zero_count--;
 | 
| +      else
 | 
|          break;
 | 
| -      }
 | 
|      }
 | 
|  
 | 
|      // Quantization pass: All coefficients with index >= zero_flag are
 | 
|      // skippable. Note: zero_flag can be zero.
 | 
| -    for (i = 0; i < zero_flag; i++) {
 | 
| -      rc = scan[i];
 | 
| -      z  = coeff_ptr[rc];
 | 
| +    for (i = 0; i < non_zero_count; i++) {
 | 
| +      const int rc = scan[i];
 | 
| +      const int coeff = coeff_ptr[rc];
 | 
| +      const int coeff_sign = (coeff >> 31);
 | 
| +      const int abs_coeff = (coeff ^ coeff_sign) - coeff_sign;
 | 
|  
 | 
| -      zbin = (zbins[rc != 0]);
 | 
| +      if (abs_coeff >= zbins[rc != 0]) {
 | 
| +        int tmp = clamp(abs_coeff + round_ptr[rc != 0], INT16_MIN, INT16_MAX);
 | 
| +        tmp = ((((tmp * quant_ptr[rc != 0]) >> 16) + tmp) *
 | 
| +                  quant_shift_ptr[rc != 0]) >> 16;  // quantization
 | 
| +        qcoeff_ptr[rc]  = (tmp ^ coeff_sign) - coeff_sign;
 | 
| +        dqcoeff_ptr[rc] = qcoeff_ptr[rc] * dequant_ptr[rc != 0];
 | 
|  
 | 
| -      sz = (z >> 31);                               // sign of z
 | 
| -      x  = (z ^ sz) - sz;
 | 
| -
 | 
| -      if (x >= zbin) {
 | 
| -        x += (round_ptr[rc != 0]);
 | 
| -        x  = clamp(x, INT16_MIN, INT16_MAX);
 | 
| -        y  = (((int)(((int)(x * quant_ptr[rc != 0]) >> 16) + x)) *
 | 
| -              quant_shift_ptr[rc != 0]) >> 16;      // quantize (x)
 | 
| -        x  = (y ^ sz) - sz;                         // get the sign back
 | 
| -        qcoeff_ptr[rc]  = x;                        // write to destination
 | 
| -        dqcoeff_ptr[rc] = x * dequant_ptr[rc != 0];  // dequantized value
 | 
| -
 | 
| -        if (y) {
 | 
| -          eob = i;                                  // last nonzero coeffs
 | 
| -        }
 | 
| +        if (tmp)
 | 
| +          eob = i;
 | 
|        }
 | 
|      }
 | 
|    }
 | 
| @@ -151,45 +137,18 @@
 | 
|    *eob_ptr = eob + 1;
 | 
|  }
 | 
|  
 | 
| -struct plane_block_idx {
 | 
| -  int plane;
 | 
| -  int block;
 | 
| -};
 | 
| -
 | 
| -// TODO(jkoleszar): returning a struct so it can be used in a const context,
 | 
| -// expect to refactor this further later.
 | 
| -static INLINE struct plane_block_idx plane_block_idx(int y_blocks,
 | 
| -                                                     int b_idx) {
 | 
| -  const int v_offset = y_blocks * 5 / 4;
 | 
| -  struct plane_block_idx res;
 | 
| -
 | 
| -  if (b_idx < y_blocks) {
 | 
| -    res.plane = 0;
 | 
| -    res.block = b_idx;
 | 
| -  } else if (b_idx < v_offset) {
 | 
| -    res.plane = 1;
 | 
| -    res.block = b_idx - y_blocks;
 | 
| -  } else {
 | 
| -    assert(b_idx < y_blocks * 3 / 2);
 | 
| -    res.plane = 2;
 | 
| -    res.block = b_idx - v_offset;
 | 
| -  }
 | 
| -  return res;
 | 
| -}
 | 
| -
 | 
| -void vp9_regular_quantize_b_4x4(MACROBLOCK *x, int y_blocks, int b_idx,
 | 
| +void vp9_regular_quantize_b_4x4(MACROBLOCK *x, int plane, int block,
 | 
|                                  const int16_t *scan, const int16_t *iscan) {
 | 
|    MACROBLOCKD *const xd = &x->e_mbd;
 | 
| -  const struct plane_block_idx pb_idx = plane_block_idx(y_blocks, b_idx);
 | 
| -  struct macroblock_plane* p = &x->plane[pb_idx.plane];
 | 
| -  struct macroblockd_plane* pd = &xd->plane[pb_idx.plane];
 | 
| +  struct macroblock_plane* p = &x->plane[plane];
 | 
| +  struct macroblockd_plane* pd = &xd->plane[plane];
 | 
|  
 | 
| -  vp9_quantize_b(BLOCK_OFFSET(p->coeff, pb_idx.block),
 | 
| +  vp9_quantize_b(BLOCK_OFFSET(p->coeff, block),
 | 
|             16, x->skip_block,
 | 
|             p->zbin, p->round, p->quant, p->quant_shift,
 | 
| -           BLOCK_OFFSET(pd->qcoeff, pb_idx.block),
 | 
| -           BLOCK_OFFSET(pd->dqcoeff, pb_idx.block),
 | 
| -           pd->dequant, p->zbin_extra, &pd->eobs[pb_idx.block], scan, iscan);
 | 
| +           BLOCK_OFFSET(p->qcoeff, block),
 | 
| +           BLOCK_OFFSET(pd->dqcoeff, block),
 | 
| +           pd->dequant, p->zbin_extra, &p->eobs[block], scan, iscan);
 | 
|  }
 | 
|  
 | 
|  static void invert_quant(int16_t *quant, int16_t *shift, int d) {
 | 
| @@ -315,17 +274,17 @@
 | 
|                                          SEG_LVL_SKIP);
 | 
|  
 | 
|    /* save this macroblock QIndex for vp9_update_zbin_extra() */
 | 
| -  x->e_mbd.q_index = qindex;
 | 
| +  x->q_index = qindex;
 | 
|  
 | 
|    /* R/D setup */
 | 
|    cpi->mb.errorperbit = rdmult >> 6;
 | 
|    cpi->mb.errorperbit += (cpi->mb.errorperbit == 0);
 | 
|  
 | 
| -  vp9_initialize_me_consts(cpi, xd->q_index);
 | 
| +  vp9_initialize_me_consts(cpi, x->q_index);
 | 
|  }
 | 
|  
 | 
|  void vp9_update_zbin_extra(VP9_COMP *cpi, MACROBLOCK *x) {
 | 
| -  const int qindex = x->e_mbd.q_index;
 | 
| +  const int qindex = x->q_index;
 | 
|    const int y_zbin_extra = (cpi->common.y_dequant[qindex][1] *
 | 
|                  (cpi->zbin_mode_boost + x->act_zbin_adj)) >> 7;
 | 
|    const int uv_zbin_extra = (cpi->common.uv_dequant[qindex][1] *
 | 
| 
 |