OLD | NEW |
1 /* | 1 /* |
2 * Copyright (c) 2010 The WebM project authors. All Rights Reserved. | 2 * Copyright (c) 2010 The WebM project authors. All Rights Reserved. |
3 * | 3 * |
4 * Use of this source code is governed by a BSD-style license | 4 * Use of this source code is governed by a BSD-style license |
5 * that can be found in the LICENSE file in the root of the source | 5 * that can be found in the LICENSE file in the root of the source |
6 * tree. An additional intellectual property rights grant can be found | 6 * tree. An additional intellectual property rights grant can be found |
7 * in the file PATENTS. All contributing project authors may | 7 * in the file PATENTS. All contributing project authors may |
8 * be found in the AUTHORS file in the root of the source tree. | 8 * be found in the AUTHORS file in the root of the source tree. |
9 */ | 9 */ |
10 | 10 |
11 #include <assert.h> | 11 #include <assert.h> |
12 | 12 |
| 13 #include "./vpx_scale_rtcd.h" |
13 #include "./vpx_config.h" | 14 #include "./vpx_config.h" |
| 15 |
14 #include "vpx/vpx_integer.h" | 16 #include "vpx/vpx_integer.h" |
| 17 |
15 #include "vp9/common/vp9_blockd.h" | 18 #include "vp9/common/vp9_blockd.h" |
16 #include "vp9/common/vp9_filter.h" | 19 #include "vp9/common/vp9_filter.h" |
17 #include "vp9/common/vp9_reconinter.h" | 20 #include "vp9/common/vp9_reconinter.h" |
18 #include "vp9/common/vp9_reconintra.h" | 21 #include "vp9/common/vp9_reconintra.h" |
19 #include "./vpx_scale_rtcd.h" | |
20 | 22 |
21 static int scale_value_x_with_scaling(int val, | |
22 const struct scale_factors *scale) { | |
23 return (val * scale->x_scale_fp >> VP9_REF_SCALE_SHIFT); | |
24 } | |
25 | |
26 static int scale_value_y_with_scaling(int val, | |
27 const struct scale_factors *scale) { | |
28 return (val * scale->y_scale_fp >> VP9_REF_SCALE_SHIFT); | |
29 } | |
30 | |
31 static int unscaled_value(int val, const struct scale_factors *scale) { | |
32 (void) scale; | |
33 return val; | |
34 } | |
35 | |
36 static MV32 mv_q3_to_q4_with_scaling(const MV *mv, | |
37 const struct scale_factors *scale) { | |
38 const MV32 res = { | |
39 ((mv->row << 1) * scale->y_scale_fp >> VP9_REF_SCALE_SHIFT) | |
40 + scale->y_offset_q4, | |
41 ((mv->col << 1) * scale->x_scale_fp >> VP9_REF_SCALE_SHIFT) | |
42 + scale->x_offset_q4 | |
43 }; | |
44 return res; | |
45 } | |
46 | |
47 static MV32 mv_q3_to_q4_without_scaling(const MV *mv, | |
48 const struct scale_factors *scale) { | |
49 const MV32 res = { | |
50 mv->row << 1, | |
51 mv->col << 1 | |
52 }; | |
53 return res; | |
54 } | |
55 | |
56 static MV32 mv_q4_with_scaling(const MV *mv, | |
57 const struct scale_factors *scale) { | |
58 const MV32 res = { | |
59 (mv->row * scale->y_scale_fp >> VP9_REF_SCALE_SHIFT) + scale->y_offset_q4, | |
60 (mv->col * scale->x_scale_fp >> VP9_REF_SCALE_SHIFT) + scale->x_offset_q4 | |
61 }; | |
62 return res; | |
63 } | |
64 | |
65 static MV32 mv_q4_without_scaling(const MV *mv, | |
66 const struct scale_factors *scale) { | |
67 const MV32 res = { | |
68 mv->row, | |
69 mv->col | |
70 }; | |
71 return res; | |
72 } | |
73 | |
74 static void set_offsets_with_scaling(struct scale_factors *scale, | |
75 int row, int col) { | |
76 const int x_q4 = 16 * col; | |
77 const int y_q4 = 16 * row; | |
78 | |
79 scale->x_offset_q4 = (x_q4 * scale->x_scale_fp >> VP9_REF_SCALE_SHIFT) & 0xf; | |
80 scale->y_offset_q4 = (y_q4 * scale->y_scale_fp >> VP9_REF_SCALE_SHIFT) & 0xf; | |
81 } | |
82 | |
83 static void set_offsets_without_scaling(struct scale_factors *scale, | |
84 int row, int col) { | |
85 scale->x_offset_q4 = 0; | |
86 scale->y_offset_q4 = 0; | |
87 } | |
88 | |
89 static int get_fixed_point_scale_factor(int other_size, int this_size) { | |
90 // Calculate scaling factor once for each reference frame | |
91 // and use fixed point scaling factors in decoding and encoding routines. | |
92 // Hardware implementations can calculate scale factor in device driver | |
93 // and use multiplication and shifting on hardware instead of division. | |
94 return (other_size << VP9_REF_SCALE_SHIFT) / this_size; | |
95 } | |
96 | |
97 void vp9_setup_scale_factors_for_frame(struct scale_factors *scale, | |
98 int other_w, int other_h, | |
99 int this_w, int this_h) { | |
100 scale->x_scale_fp = get_fixed_point_scale_factor(other_w, this_w); | |
101 scale->x_offset_q4 = 0; // calculated per-mb | |
102 scale->x_step_q4 = (16 * scale->x_scale_fp >> VP9_REF_SCALE_SHIFT); | |
103 | |
104 scale->y_scale_fp = get_fixed_point_scale_factor(other_h, this_h); | |
105 scale->y_offset_q4 = 0; // calculated per-mb | |
106 scale->y_step_q4 = (16 * scale->y_scale_fp >> VP9_REF_SCALE_SHIFT); | |
107 | |
108 if ((other_w == this_w) && (other_h == this_h)) { | |
109 scale->scale_value_x = unscaled_value; | |
110 scale->scale_value_y = unscaled_value; | |
111 scale->set_scaled_offsets = set_offsets_without_scaling; | |
112 scale->scale_mv_q3_to_q4 = mv_q3_to_q4_without_scaling; | |
113 scale->scale_mv_q4 = mv_q4_without_scaling; | |
114 } else { | |
115 scale->scale_value_x = scale_value_x_with_scaling; | |
116 scale->scale_value_y = scale_value_y_with_scaling; | |
117 scale->set_scaled_offsets = set_offsets_with_scaling; | |
118 scale->scale_mv_q3_to_q4 = mv_q3_to_q4_with_scaling; | |
119 scale->scale_mv_q4 = mv_q4_with_scaling; | |
120 } | |
121 | |
122 // TODO(agrange): Investigate the best choice of functions to use here | |
123 // for EIGHTTAP_SMOOTH. Since it is not interpolating, need to choose what | |
124 // to do at full-pel offsets. The current selection, where the filter is | |
125 // applied in one direction only, and not at all for 0,0, seems to give the | |
126 // best quality, but it may be worth trying an additional mode that does | |
127 // do the filtering on full-pel. | |
128 if (scale->x_step_q4 == 16) { | |
129 if (scale->y_step_q4 == 16) { | |
130 // No scaling in either direction. | |
131 scale->predict[0][0][0] = vp9_convolve_copy; | |
132 scale->predict[0][0][1] = vp9_convolve_avg; | |
133 scale->predict[0][1][0] = vp9_convolve8_vert; | |
134 scale->predict[0][1][1] = vp9_convolve8_avg_vert; | |
135 scale->predict[1][0][0] = vp9_convolve8_horiz; | |
136 scale->predict[1][0][1] = vp9_convolve8_avg_horiz; | |
137 } else { | |
138 // No scaling in x direction. Must always scale in the y direction. | |
139 scale->predict[0][0][0] = vp9_convolve8_vert; | |
140 scale->predict[0][0][1] = vp9_convolve8_avg_vert; | |
141 scale->predict[0][1][0] = vp9_convolve8_vert; | |
142 scale->predict[0][1][1] = vp9_convolve8_avg_vert; | |
143 scale->predict[1][0][0] = vp9_convolve8; | |
144 scale->predict[1][0][1] = vp9_convolve8_avg; | |
145 } | |
146 } else { | |
147 if (scale->y_step_q4 == 16) { | |
148 // No scaling in the y direction. Must always scale in the x direction. | |
149 scale->predict[0][0][0] = vp9_convolve8_horiz; | |
150 scale->predict[0][0][1] = vp9_convolve8_avg_horiz; | |
151 scale->predict[0][1][0] = vp9_convolve8; | |
152 scale->predict[0][1][1] = vp9_convolve8_avg; | |
153 scale->predict[1][0][0] = vp9_convolve8_horiz; | |
154 scale->predict[1][0][1] = vp9_convolve8_avg_horiz; | |
155 } else { | |
156 // Must always scale in both directions. | |
157 scale->predict[0][0][0] = vp9_convolve8; | |
158 scale->predict[0][0][1] = vp9_convolve8_avg; | |
159 scale->predict[0][1][0] = vp9_convolve8; | |
160 scale->predict[0][1][1] = vp9_convolve8_avg; | |
161 scale->predict[1][0][0] = vp9_convolve8; | |
162 scale->predict[1][0][1] = vp9_convolve8_avg; | |
163 } | |
164 } | |
165 // 2D subpel motion always gets filtered in both directions | |
166 scale->predict[1][1][0] = vp9_convolve8; | |
167 scale->predict[1][1][1] = vp9_convolve8_avg; | |
168 } | |
169 | 23 |
170 void vp9_setup_interp_filters(MACROBLOCKD *xd, | 24 void vp9_setup_interp_filters(MACROBLOCKD *xd, |
171 INTERPOLATIONFILTERTYPE mcomp_filter_type, | 25 INTERPOLATIONFILTERTYPE mcomp_filter_type, |
172 VP9_COMMON *cm) { | 26 VP9_COMMON *cm) { |
173 if (xd->mode_info_context) { | 27 if (xd->mode_info_context) { |
174 MB_MODE_INFO *mbmi = &xd->mode_info_context->mbmi; | 28 MB_MODE_INFO *mbmi = &xd->mode_info_context->mbmi; |
175 | 29 |
176 set_scale_factors(xd, mbmi->ref_frame[0] - 1, mbmi->ref_frame[1] - 1, | 30 set_scale_factors(xd, mbmi->ref_frame[0] - 1, mbmi->ref_frame[1] - 1, |
177 cm->active_ref_scale); | 31 cm->active_ref_scale); |
178 } | 32 } |
(...skipping 11 matching lines...) |
190 break; | 44 break; |
191 case BILINEAR: | 45 case BILINEAR: |
192 xd->subpix.filter_x = xd->subpix.filter_y = vp9_bilinear_filters; | 46 xd->subpix.filter_x = xd->subpix.filter_y = vp9_bilinear_filters; |
193 break; | 47 break; |
194 } | 48 } |
195 assert(((intptr_t)xd->subpix.filter_x & 0xff) == 0); | 49 assert(((intptr_t)xd->subpix.filter_x & 0xff) == 0); |
196 } | 50 } |
197 | 51 |
198 void vp9_build_inter_predictor(const uint8_t *src, int src_stride, | 52 void vp9_build_inter_predictor(const uint8_t *src, int src_stride, |
199 uint8_t *dst, int dst_stride, | 53 uint8_t *dst, int dst_stride, |
200 const int_mv *src_mv, | 54 const MV *src_mv, |
201 const struct scale_factors *scale, | 55 const struct scale_factors *scale, |
202 int w, int h, int weight, | 56 int w, int h, int ref, |
203 const struct subpix_fn_table *subpix, | 57 const struct subpix_fn_table *subpix, |
204 enum mv_precision precision) { | 58 enum mv_precision precision) { |
205 const MV32 mv = precision == MV_PRECISION_Q4 | 59 const int is_q4 = precision == MV_PRECISION_Q4; |
206 ? scale->scale_mv_q4(&src_mv->as_mv, scale) | 60 const MV mv_q4 = { is_q4 ? src_mv->row : src_mv->row << 1, |
207 : scale->scale_mv_q3_to_q4(&src_mv->as_mv, scale); | 61 is_q4 ? src_mv->col : src_mv->col << 1 }; |
208 const int subpel_x = mv.col & 15; | 62 const MV32 mv = scale->scale_mv(&mv_q4, scale); |
209 const int subpel_y = mv.row & 15; | 63 const int subpel_x = mv.col & SUBPEL_MASK; |
| 64 const int subpel_y = mv.row & SUBPEL_MASK; |
210 | 65 |
211 src += (mv.row >> 4) * src_stride + (mv.col >> 4); | 66 src += (mv.row >> SUBPEL_BITS) * src_stride + (mv.col >> SUBPEL_BITS); |
212 scale->predict[!!subpel_x][!!subpel_y][weight]( | 67 scale->predict[subpel_x != 0][subpel_y != 0][ref]( |
213 src, src_stride, dst, dst_stride, | 68 src, src_stride, dst, dst_stride, |
214 subpix->filter_x[subpel_x], scale->x_step_q4, | 69 subpix->filter_x[subpel_x], scale->x_step_q4, |
215 subpix->filter_y[subpel_y], scale->y_step_q4, | 70 subpix->filter_y[subpel_y], scale->y_step_q4, |
216 w, h); | 71 w, h); |
217 } | 72 } |
218 | 73 |
219 static INLINE int round_mv_comp_q4(int value) { | 74 static INLINE int round_mv_comp_q4(int value) { |
220 return (value < 0 ? value - 2 : value + 2) / 4; | 75 return (value < 0 ? value - 2 : value + 2) / 4; |
221 } | 76 } |
222 | 77 |
223 static int mi_mv_pred_row_q4(MACROBLOCKD *mb, int idx) { | 78 static MV mi_mv_pred_q4(const MODE_INFO *mi, int idx) { |
224 const int temp = mb->mode_info_context->bmi[0].as_mv[idx].as_mv.row + | 79 MV res = { round_mv_comp_q4(mi->bmi[0].as_mv[idx].as_mv.row + |
225 mb->mode_info_context->bmi[1].as_mv[idx].as_mv.row + | 80 mi->bmi[1].as_mv[idx].as_mv.row + |
226 mb->mode_info_context->bmi[2].as_mv[idx].as_mv.row + | 81 mi->bmi[2].as_mv[idx].as_mv.row + |
227 mb->mode_info_context->bmi[3].as_mv[idx].as_mv.row; | 82 mi->bmi[3].as_mv[idx].as_mv.row), |
228 return round_mv_comp_q4(temp); | 83 round_mv_comp_q4(mi->bmi[0].as_mv[idx].as_mv.col + |
229 } | 84 mi->bmi[1].as_mv[idx].as_mv.col + |
230 | 85 mi->bmi[2].as_mv[idx].as_mv.col + |
231 static int mi_mv_pred_col_q4(MACROBLOCKD *mb, int idx) { | 86 mi->bmi[3].as_mv[idx].as_mv.col) }; |
232 const int temp = mb->mode_info_context->bmi[0].as_mv[idx].as_mv.col + | 87 return res; |
233 mb->mode_info_context->bmi[1].as_mv[idx].as_mv.col + | |
234 mb->mode_info_context->bmi[2].as_mv[idx].as_mv.col + | |
235 mb->mode_info_context->bmi[3].as_mv[idx].as_mv.col; | |
236 return round_mv_comp_q4(temp); | |
237 } | 88 } |
238 | 89 |
239 // TODO(jkoleszar): yet another mv clamping function :-( | 90 // TODO(jkoleszar): yet another mv clamping function :-( |
240 MV clamp_mv_to_umv_border_sb(const MV *src_mv, | 91 MV clamp_mv_to_umv_border_sb(const MACROBLOCKD *xd, const MV *src_mv, |
241 int bwl, int bhl, int ss_x, int ss_y, | 92 int bw, int bh, int ss_x, int ss_y) { |
242 int mb_to_left_edge, int mb_to_top_edge, | 93 // If the MV points so far into the UMV border that no visible pixels |
243 int mb_to_right_edge, int mb_to_bottom_edge) { | 94 // are used for reconstruction, the subpel part of the MV can be |
244 /* If the MV points so far into the UMV border that no visible pixels | 95 // discarded and the MV limited to 16 pixels with equivalent results. |
245 * are used for reconstruction, the subpel part of the MV can be | 96 const int spel_left = (VP9_INTERP_EXTEND + bw) << SUBPEL_BITS; |
246 * discarded and the MV limited to 16 pixels with equivalent results. | 97 const int spel_right = spel_left - SUBPEL_SHIFTS; |
247 */ | 98 const int spel_top = (VP9_INTERP_EXTEND + bh) << SUBPEL_BITS; |
248 const int spel_left = (VP9_INTERP_EXTEND + (4 << bwl)) << 4; | 99 const int spel_bottom = spel_top - SUBPEL_SHIFTS; |
249 const int spel_right = spel_left - (1 << 4); | 100 MV clamped_mv = { |
250 const int spel_top = (VP9_INTERP_EXTEND + (4 << bhl)) << 4; | 101 src_mv->row << (1 - ss_y), |
251 const int spel_bottom = spel_top - (1 << 4); | 102 src_mv->col << (1 - ss_x) |
252 MV clamped_mv; | 103 }; |
253 | |
254 assert(ss_x <= 1); | 104 assert(ss_x <= 1); |
255 assert(ss_y <= 1); | 105 assert(ss_y <= 1); |
256 clamped_mv.col = clamp(src_mv->col << (1 - ss_x), | 106 |
257 (mb_to_left_edge << (1 - ss_x)) - spel_left, | 107 clamp_mv(&clamped_mv, (xd->mb_to_left_edge << (1 - ss_x)) - spel_left, |
258 (mb_to_right_edge << (1 - ss_x)) + spel_right); | 108 (xd->mb_to_right_edge << (1 - ss_x)) + spel_right, |
259 clamped_mv.row = clamp(src_mv->row << (1 - ss_y), | 109 (xd->mb_to_top_edge << (1 - ss_y)) - spel_top, |
260 (mb_to_top_edge << (1 - ss_y)) - spel_top, | 110 (xd->mb_to_bottom_edge << (1 - ss_y)) + spel_bottom); |
261 (mb_to_bottom_edge << (1 - ss_y)) + spel_bottom); | 111 |
262 return clamped_mv; | 112 return clamped_mv; |
263 } | 113 } |
264 | 114 |
265 struct build_inter_predictors_args { | 115 struct build_inter_predictors_args { |
266 MACROBLOCKD *xd; | 116 MACROBLOCKD *xd; |
267 int x; | 117 int x, y; |
268 int y; | |
269 uint8_t* dst[MAX_MB_PLANE]; | |
270 int dst_stride[MAX_MB_PLANE]; | |
271 uint8_t* pre[2][MAX_MB_PLANE]; | |
272 int pre_stride[2][MAX_MB_PLANE]; | |
273 }; | 118 }; |
274 static void build_inter_predictors(int plane, int block, | 119 |
275 BLOCK_SIZE_TYPE bsize, | 120 static void build_inter_predictors(int plane, int block, BLOCK_SIZE bsize, |
276 int pred_w, int pred_h, | 121 int pred_w, int pred_h, |
277 void *argv) { | 122 void *argv) { |
278 const struct build_inter_predictors_args* const arg = argv; | 123 const struct build_inter_predictors_args* const arg = argv; |
279 MACROBLOCKD * const xd = arg->xd; | 124 MACROBLOCKD *const xd = arg->xd; |
280 const int bwl = b_width_log2(bsize) - xd->plane[plane].subsampling_x; | 125 struct macroblockd_plane *const pd = &xd->plane[plane]; |
281 const int bhl = b_height_log2(bsize) - xd->plane[plane].subsampling_y; | 126 const int bwl = b_width_log2(bsize) - pd->subsampling_x; |
282 const int x = 4 * (block & ((1 << bwl) - 1)), y = 4 * (block >> bwl); | 127 const int bw = 4 << bwl; |
283 const int use_second_ref = xd->mode_info_context->mbmi.ref_frame[1] > 0; | 128 const int bh = plane_block_height(bsize, pd); |
284 int which_mv; | 129 const int x = 4 * (block & ((1 << bwl) - 1)); |
| 130 const int y = 4 * (block >> bwl); |
| 131 const MODE_INFO *const mi = xd->mode_info_context; |
| 132 const int use_second_ref = mi->mbmi.ref_frame[1] > 0; |
| 133 int ref; |
285 | 134 |
286 assert(x < (4 << bwl)); | 135 assert(x < bw); |
287 assert(y < (4 << bhl)); | 136 assert(y < bh); |
288 assert(xd->mode_info_context->mbmi.sb_type < BLOCK_SIZE_SB8X8 || | 137 assert(mi->mbmi.sb_type < BLOCK_8X8 || 4 << pred_w == bw); |
289 4 << pred_w == (4 << bwl)); | 138 assert(mi->mbmi.sb_type < BLOCK_8X8 || 4 << pred_h == bh); |
290 assert(xd->mode_info_context->mbmi.sb_type < BLOCK_SIZE_SB8X8 || | |
291 4 << pred_h == (4 << bhl)); | |
292 | 139 |
293 for (which_mv = 0; which_mv < 1 + use_second_ref; ++which_mv) { | 140 for (ref = 0; ref < 1 + use_second_ref; ++ref) { |
294 // source | 141 struct scale_factors *const scale = &xd->scale_factor[ref]; |
295 const uint8_t * const base_pre = arg->pre[which_mv][plane]; | 142 struct buf_2d *const pre_buf = &pd->pre[ref]; |
296 const int pre_stride = arg->pre_stride[which_mv][plane]; | 143 struct buf_2d *const dst_buf = &pd->dst; |
297 const uint8_t *const pre = base_pre + | |
298 scaled_buffer_offset(x, y, pre_stride, &xd->scale_factor[which_mv]); | |
299 struct scale_factors * const scale = &xd->scale_factor[which_mv]; | |
300 | 144 |
301 // dest | 145 const uint8_t *const pre = pre_buf->buf + scaled_buffer_offset(x, y, |
302 uint8_t *const dst = arg->dst[plane] + arg->dst_stride[plane] * y + x; | 146 pre_buf->stride, scale); |
303 | 147 |
304 // motion vector | 148 uint8_t *const dst = dst_buf->buf + dst_buf->stride * y + x; |
305 const MV *mv; | |
306 MV split_chroma_mv; | |
307 int_mv clamped_mv; | |
308 | 149 |
309 if (xd->mode_info_context->mbmi.sb_type < BLOCK_SIZE_SB8X8) { | 150 // TODO(jkoleszar): All chroma MVs in SPLITMV mode are taken as the |
310 if (plane == 0) { | 151 // same MV (the average of the 4 luma MVs) but we could do something |
311 mv = &xd->mode_info_context->bmi[block].as_mv[which_mv].as_mv; | 152 // smarter for non-4:2:0. Just punt for now, pending the changes to get |
312 } else { | 153 // rid of SPLITMV mode entirely. |
313 // TODO(jkoleszar): All chroma MVs in SPLITMV mode are taken as the | 154 const MV mv = mi->mbmi.sb_type < BLOCK_8X8 |
314 // same MV (the average of the 4 luma MVs) but we could do something | 155 ? (plane == 0 ? mi->bmi[block].as_mv[ref].as_mv |
315 // smarter for non-4:2:0. Just punt for now, pending the changes to get | 156 : mi_mv_pred_q4(mi, ref)) |
316 // rid of SPLITMV mode entirely. | 157 : mi->mbmi.mv[ref].as_mv; |
317 split_chroma_mv.row = mi_mv_pred_row_q4(xd, which_mv); | |
318 split_chroma_mv.col = mi_mv_pred_col_q4(xd, which_mv); | |
319 mv = &split_chroma_mv; | |
320 } | |
321 } else { | |
322 mv = &xd->mode_info_context->mbmi.mv[which_mv].as_mv; | |
323 } | |
324 | 158 |
325 /* TODO(jkoleszar): This clamping is done in the incorrect place for the | 159 // TODO(jkoleszar): This clamping is done in the incorrect place for the |
326 * scaling case. It needs to be done on the scaled MV, not the pre-scaling | 160 // scaling case. It needs to be done on the scaled MV, not the pre-scaling |
327 * MV. Note however that it performs the subsampling aware scaling so | 161 // MV. Note however that it performs the subsampling aware scaling so |
328 * that the result is always q4. | 162 // that the result is always q4. |
329 */ | 163 const MV res_mv = clamp_mv_to_umv_border_sb(xd, &mv, bw, bh, |
330 clamped_mv.as_mv = clamp_mv_to_umv_border_sb(mv, bwl, bhl, | 164 pd->subsampling_x, |
331 xd->plane[plane].subsampling_x, | 165 pd->subsampling_y); |
332 xd->plane[plane].subsampling_y, | 166 |
333 xd->mb_to_left_edge, | |
334 xd->mb_to_top_edge, | |
335 xd->mb_to_right_edge, | |
336 xd->mb_to_bottom_edge); | |
337 scale->set_scaled_offsets(scale, arg->y + y, arg->x + x); | 167 scale->set_scaled_offsets(scale, arg->y + y, arg->x + x); |
338 | 168 vp9_build_inter_predictor(pre, pre_buf->stride, dst, dst_buf->stride, |
339 vp9_build_inter_predictor(pre, pre_stride, | 169 &res_mv, scale, |
340 dst, arg->dst_stride[plane], | 170 4 << pred_w, 4 << pred_h, ref, |
341 &clamped_mv, &xd->scale_factor[which_mv], | |
342 4 << pred_w, 4 << pred_h, which_mv, | |
343 &xd->subpix, MV_PRECISION_Q4); | 171 &xd->subpix, MV_PRECISION_Q4); |
344 } | 172 } |
345 } | 173 } |
346 void vp9_build_inter_predictors_sby(MACROBLOCKD *xd, | |
347 int mi_row, | |
348 int mi_col, | |
349 BLOCK_SIZE_TYPE bsize) { | |
350 struct build_inter_predictors_args args = { | |
351 xd, mi_col * MI_SIZE, mi_row * MI_SIZE, | |
352 {xd->plane[0].dst.buf, NULL, NULL}, {xd->plane[0].dst.stride, 0, 0}, | |
353 {{xd->plane[0].pre[0].buf, NULL, NULL}, | |
354 {xd->plane[0].pre[1].buf, NULL, NULL}}, | |
355 {{xd->plane[0].pre[0].stride, 0, 0}, {xd->plane[0].pre[1].stride, 0, 0}}, | |
356 }; | |
357 | 174 |
358 foreach_predicted_block_in_plane(xd, bsize, 0, build_inter_predictors, &args); | 175 // TODO(jkoleszar): In principle, pred_w, pred_h are unnecessary, as we could |
| 176 // calculate the subsampled BLOCK_SIZE, but that type isn't defined for |
| 177 // sizes smaller than 16x16 yet. |
| 178 typedef void (*foreach_predicted_block_visitor)(int plane, int block, |
| 179 BLOCK_SIZE bsize, |
| 180 int pred_w, int pred_h, |
| 181 void *arg); |
| 182 static INLINE void foreach_predicted_block_in_plane( |
| 183 const MACROBLOCKD* const xd, BLOCK_SIZE bsize, int plane, |
| 184 foreach_predicted_block_visitor visit, void *arg) { |
| 185 int i, x, y; |
| 186 |
| 187 // block sizes in number of 4x4 blocks log 2 ("*_b") |
| 188 // 4x4=0, 8x8=2, 16x16=4, 32x32=6, 64x64=8 |
| 189 // subsampled size of the block |
| 190 const int bwl = b_width_log2(bsize) - xd->plane[plane].subsampling_x; |
| 191 const int bhl = b_height_log2(bsize) - xd->plane[plane].subsampling_y; |
| 192 |
| 193 // size of the predictor to use. |
| 194 int pred_w, pred_h; |
| 195 |
| 196 if (xd->mode_info_context->mbmi.sb_type < BLOCK_8X8) { |
| 197 assert(bsize == BLOCK_8X8); |
| 198 pred_w = 0; |
| 199 pred_h = 0; |
| 200 } else { |
| 201 pred_w = bwl; |
| 202 pred_h = bhl; |
| 203 } |
| 204 assert(pred_w <= bwl); |
| 205 assert(pred_h <= bhl); |
| 206 |
| 207 // visit each subblock in raster order |
| 208 i = 0; |
| 209 for (y = 0; y < 1 << bhl; y += 1 << pred_h) { |
| 210 for (x = 0; x < 1 << bwl; x += 1 << pred_w) { |
| 211 visit(plane, i, bsize, pred_w, pred_h, arg); |
| 212 i += 1 << pred_w; |
| 213 } |
| 214 i += (1 << (bwl + pred_h)) - (1 << bwl); |
| 215 } |
359 } | 216 } |
360 void vp9_build_inter_predictors_sbuv(MACROBLOCKD *xd, | 217 |
361 int mi_row, | 218 static void build_inter_predictors_for_planes(MACROBLOCKD *xd, BLOCK_SIZE bsize, |
362 int mi_col, | 219 int mi_row, int mi_col, |
363 BLOCK_SIZE_TYPE bsize) { | 220 int plane_from, int plane_to) { |
364 struct build_inter_predictors_args args = { | 221 int plane; |
365 xd, mi_col * MI_SIZE, mi_row * MI_SIZE, | 222 for (plane = plane_from; plane <= plane_to; ++plane) { |
366 #if CONFIG_ALPHA | 223 struct build_inter_predictors_args args = { |
367 {NULL, xd->plane[1].dst.buf, xd->plane[2].dst.buf, | 224 xd, mi_col * MI_SIZE, mi_row * MI_SIZE, |
368 xd->plane[3].dst.buf}, | 225 }; |
369 {0, xd->plane[1].dst.stride, xd->plane[1].dst.stride, | 226 foreach_predicted_block_in_plane(xd, bsize, plane, build_inter_predictors, |
370 xd->plane[3].dst.stride}, | 227 &args); |
371 {{NULL, xd->plane[1].pre[0].buf, xd->plane[2].pre[0].buf, | 228 } |
372 xd->plane[3].pre[0].buf}, | |
373 {NULL, xd->plane[1].pre[1].buf, xd->plane[2].pre[1].buf, | |
374 xd->plane[3].pre[1].buf}}, | |
375 {{0, xd->plane[1].pre[0].stride, xd->plane[1].pre[0].stride, | |
376 xd->plane[3].pre[0].stride}, | |
377 {0, xd->plane[1].pre[1].stride, xd->plane[1].pre[1].stride, | |
378 xd->plane[3].pre[1].stride}}, | |
379 #else | |
380 {NULL, xd->plane[1].dst.buf, xd->plane[2].dst.buf}, | |
381 {0, xd->plane[1].dst.stride, xd->plane[1].dst.stride}, | |
382 {{NULL, xd->plane[1].pre[0].buf, xd->plane[2].pre[0].buf}, | |
383 {NULL, xd->plane[1].pre[1].buf, xd->plane[2].pre[1].buf}}, | |
384 {{0, xd->plane[1].pre[0].stride, xd->plane[1].pre[0].stride}, | |
385 {0, xd->plane[1].pre[1].stride, xd->plane[1].pre[1].stride}}, | |
386 #endif | |
387 }; | |
388 foreach_predicted_block_uv(xd, bsize, build_inter_predictors, &args); | |
389 } | 229 } |
390 void vp9_build_inter_predictors_sb(MACROBLOCKD *xd, | |
391 int mi_row, int mi_col, | |
392 BLOCK_SIZE_TYPE bsize) { | |
393 | 230 |
394 vp9_build_inter_predictors_sby(xd, mi_row, mi_col, bsize); | 231 void vp9_build_inter_predictors_sby(MACROBLOCKD *xd, int mi_row, int mi_col, |
395 vp9_build_inter_predictors_sbuv(xd, mi_row, mi_col, bsize); | 232 BLOCK_SIZE bsize) { |
| 233 build_inter_predictors_for_planes(xd, bsize, mi_row, mi_col, 0, 0); |
| 234 } |
| 235 void vp9_build_inter_predictors_sbuv(MACROBLOCKD *xd, int mi_row, int mi_col, |
| 236 BLOCK_SIZE bsize) { |
| 237 build_inter_predictors_for_planes(xd, bsize, mi_row, mi_col, 1, |
| 238 MAX_MB_PLANE - 1); |
| 239 } |
| 240 void vp9_build_inter_predictors_sb(MACROBLOCKD *xd, int mi_row, int mi_col, |
| 241 BLOCK_SIZE bsize) { |
| 242 build_inter_predictors_for_planes(xd, bsize, mi_row, mi_col, 0, |
| 243 MAX_MB_PLANE - 1); |
396 } | 244 } |
397 | 245 |
398 // TODO(dkovalev: find better place for this function) | 246 // TODO(dkovalev: find better place for this function) |
399 void vp9_setup_scale_factors(VP9_COMMON *cm, int i) { | 247 void vp9_setup_scale_factors(VP9_COMMON *cm, int i) { |
400 const int ref = cm->active_ref_idx[i]; | 248 const int ref = cm->active_ref_idx[i]; |
401 struct scale_factors *const sf = &cm->active_ref_scale[i]; | 249 struct scale_factors *const sf = &cm->active_ref_scale[i]; |
402 if (ref >= NUM_YV12_BUFFERS) { | 250 if (ref >= NUM_YV12_BUFFERS) { |
403 memset(sf, 0, sizeof(*sf)); | 251 vp9_zero(*sf); |
404 } else { | 252 } else { |
405 YV12_BUFFER_CONFIG *const fb = &cm->yv12_fb[ref]; | 253 YV12_BUFFER_CONFIG *const fb = &cm->yv12_fb[ref]; |
406 vp9_setup_scale_factors_for_frame(sf, | 254 vp9_setup_scale_factors_for_frame(sf, |
407 fb->y_crop_width, fb->y_crop_height, | 255 fb->y_crop_width, fb->y_crop_height, |
408 cm->width, cm->height); | 256 cm->width, cm->height); |
409 | 257 |
410 if (sf->x_scale_fp != VP9_REF_NO_SCALE || | 258 if (vp9_is_scaled(sf)) |
411 sf->y_scale_fp != VP9_REF_NO_SCALE) | |
412 vp9_extend_frame_borders(fb, cm->subsampling_x, cm->subsampling_y); | 259 vp9_extend_frame_borders(fb, cm->subsampling_x, cm->subsampling_y); |
413 } | 260 } |
414 } | 261 } |
415 | 262 |