OLD | NEW |
1 /* | 1 /* |
2 * Copyright 2011 The LibYuv Project Authors. All rights reserved. | 2 * Copyright 2011 The LibYuv Project Authors. All rights reserved. |
3 * | 3 * |
4 * Use of this source code is governed by a BSD-style license | 4 * Use of this source code is governed by a BSD-style license |
5 * that can be found in the LICENSE file in the root of the source | 5 * that can be found in the LICENSE file in the root of the source |
6 * tree. An additional intellectual property rights grant can be found | 6 * tree. An additional intellectual property rights grant can be found |
7 * in the file PATENTS. All contributing project authors may | 7 * in the file PATENTS. All contributing project authors may |
8 * be found in the AUTHORS file in the root of the source tree. | 8 * be found in the AUTHORS file in the root of the source tree. |
9 */ | 9 */ |
10 | 10 |
(...skipping 1145 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
1156 EXPECT_LE(max_diff, 1); | 1156 EXPECT_LE(max_diff, 1); |
1157 } | 1157 } |
1158 | 1158 |
1159 TEST_F(LibYUVPlanarTest, ARGBBlend_Opt) { | 1159 TEST_F(LibYUVPlanarTest, ARGBBlend_Opt) { |
1160 int max_diff = TestBlend(benchmark_width_, benchmark_height_, | 1160 int max_diff = TestBlend(benchmark_width_, benchmark_height_, |
1161 benchmark_iterations_, | 1161 benchmark_iterations_, |
1162 disable_cpu_flags_, benchmark_cpu_info_, +1, 0); | 1162 disable_cpu_flags_, benchmark_cpu_info_, +1, 0); |
1163 EXPECT_LE(max_diff, 1); | 1163 EXPECT_LE(max_diff, 1); |
1164 } | 1164 } |
1165 | 1165 |
| 1166 #ifdef HAS_BLENDPLANEROW_SSSE3 |
| 1167 // TODO(fbarchard): Switch to I420Blend. |
| 1168 static void TestBlendPlane(int width, int height, int benchmark_iterations, |
| 1169 int invert, int off) { |
| 1170 int has_ssse3 = TestCpuFlag(kCpuHasSSSE3); |
| 1171 width = width * height; |
| 1172 height = 1; |
| 1173 if (width < 1) { |
| 1174 width = 1; |
| 1175 } |
| 1176 if (width < 256) { |
| 1177 width = 256; |
| 1178 } |
| 1179 const int kBpp = 1; |
| 1180 const int kStride = width * kBpp; |
| 1181 align_buffer_64(src_argb_a, kStride * height + off); |
| 1182 align_buffer_64(src_argb_b, kStride * height + off); |
| 1183 align_buffer_64(src_argb_alpha, kStride * height + off); |
| 1184 align_buffer_64(dst_argb_c, kStride * height); |
| 1185 align_buffer_64(dst_argb_opt, kStride * height); |
| 1186 |
| 1187 if (has_ssse3) { |
| 1188 for (int i = 0; i < 255; ++i) { |
| 1189 src_argb_a[i] = i; |
| 1190 src_argb_b[i] = 255 - i; |
| 1191 src_argb_alpha[i] = 255; |
| 1192 } |
| 1193 memset(dst_argb_opt, 0xfb, kStride * height); |
| 1194 BlendPlaneRow_SSSE3(src_argb_a + off, |
| 1195 src_argb_b + off, |
| 1196 src_argb_alpha + off, |
| 1197 dst_argb_opt, |
| 1198 width * height); |
| 1199 for (int i = 0; i < kStride * height; ++i) { |
| 1200 EXPECT_EQ(src_argb_a[i], dst_argb_opt[i]); |
| 1201 } |
| 1202 } |
| 1203 for (int i = 0; i < kStride * height; ++i) { |
| 1204 src_argb_a[i + off] = (fastrand() & 0xff); |
| 1205 src_argb_b[i + off] = (fastrand() & 0xff); |
| 1206 src_argb_alpha[i + off] = (fastrand() & 0xff); |
| 1207 } |
| 1208 memset(dst_argb_c, 255, kStride * height); |
| 1209 memset(dst_argb_opt, 255, kStride * height); |
| 1210 |
| 1211 BlendPlaneRow_C(src_argb_a + off, |
| 1212 src_argb_b + off, |
| 1213 src_argb_alpha + off, |
| 1214 dst_argb_c, |
| 1215 width * height); |
| 1216 for (int i = 0; i < benchmark_iterations; ++i) { |
| 1217 if (has_ssse3) { |
| 1218 BlendPlaneRow_SSSE3(src_argb_a + off, |
| 1219 src_argb_b + off, |
| 1220 src_argb_alpha + off, |
| 1221 dst_argb_opt, |
| 1222 width * height); |
| 1223 } else { |
| 1224 BlendPlaneRow_C(src_argb_a + off, |
| 1225 src_argb_b + off, |
| 1226 src_argb_alpha + off, |
| 1227 dst_argb_opt, |
| 1228 width * height); |
| 1229 } |
| 1230 } |
| 1231 for (int i = 0; i < kStride * height; ++i) { |
| 1232 EXPECT_EQ(dst_argb_c[i], dst_argb_opt[i]); |
| 1233 } |
| 1234 free_aligned_buffer_64(src_argb_a); |
| 1235 free_aligned_buffer_64(src_argb_b); |
| 1236 free_aligned_buffer_64(dst_argb_c); |
| 1237 free_aligned_buffer_64(dst_argb_opt); |
| 1238 return; |
| 1239 } |
| 1240 |
| 1241 TEST_F(LibYUVPlanarTest, BlendPlane_Opt) { |
| 1242 TestBlendPlane(benchmark_width_, benchmark_height_, benchmark_iterations_, |
| 1243 +1, 0); |
| 1244 } |
| 1245 #endif |
| 1246 |
1166 TEST_F(LibYUVPlanarTest, TestAffine) { | 1247 TEST_F(LibYUVPlanarTest, TestAffine) { |
1167 SIMD_ALIGNED(uint8 orig_pixels_0[1280][4]); | 1248 SIMD_ALIGNED(uint8 orig_pixels_0[1280][4]); |
1168 SIMD_ALIGNED(uint8 interpolate_pixels_C[1280][4]); | 1249 SIMD_ALIGNED(uint8 interpolate_pixels_C[1280][4]); |
1169 | 1250 |
1170 for (int i = 0; i < 1280; ++i) { | 1251 for (int i = 0; i < 1280; ++i) { |
1171 for (int j = 0; j < 4; ++j) { | 1252 for (int j = 0; j < 4; ++j) { |
1172 orig_pixels_0[i][j] = i; | 1253 orig_pixels_0[i][j] = i; |
1173 } | 1254 } |
1174 } | 1255 } |
1175 | 1256 |
(...skipping 1169 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
2345 | 2426 |
2346 TEST_F(LibYUVPlanarTest, SetPlane_Opt) { | 2427 TEST_F(LibYUVPlanarTest, SetPlane_Opt) { |
2347 int max_diff = TestARGBRect(benchmark_width_, benchmark_height_, | 2428 int max_diff = TestARGBRect(benchmark_width_, benchmark_height_, |
2348 benchmark_iterations_, | 2429 benchmark_iterations_, |
2349 disable_cpu_flags_, benchmark_cpu_info_, | 2430 disable_cpu_flags_, benchmark_cpu_info_, |
2350 +1, 0, 1); | 2431 +1, 0, 1); |
2351 EXPECT_EQ(0, max_diff); | 2432 EXPECT_EQ(0, max_diff); |
2352 } | 2433 } |
2353 | 2434 |
2354 } // namespace libyuv | 2435 } // namespace libyuv |
OLD | NEW |