Chromium Code Reviews
chromiumcodereview-hr@appspot.gserviceaccount.com (chromiumcodereview-hr) | Please choose your nickname with Settings | Help | Chromium Project | Gerrit Changes | Sign out
(365)

Side by Side Diff: src/core/SkOpts.cpp

Issue 1577703006: Optimized premultiplying swizzles for NEON (Closed) Base URL: https://skia.googlesource.com/skia.git@master
Patch Set: Response to comments Created 4 years, 11 months ago
Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.
Jump to:
View unified diff | Download patch
« no previous file with comments | « no previous file | src/opts/SkOpts_neon.cpp » ('j') | src/opts/SkSwizzler_opts.h » ('J')
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLDNEW
1 /* 1 /*
2 * Copyright 2015 Google Inc. 2 * Copyright 2015 Google Inc.
3 * 3 *
4 * Use of this source code is governed by a BSD-style license that can be 4 * Use of this source code is governed by a BSD-style license that can be
5 * found in the LICENSE file. 5 * found in the LICENSE file.
6 */ 6 */
7 7
8 #include "SkOnce.h" 8 #include "SkOnce.h"
9 #include "SkOpts.h" 9 #include "SkOpts.h"
10 10
11 #define SK_OPTS_NS sk_default 11 #define SK_OPTS_NS sk_default
12 #include "SkBlitMask_opts.h" 12 #include "SkBlitMask_opts.h"
13 #include "SkBlitRow_opts.h" 13 #include "SkBlitRow_opts.h"
14 #include "SkBlurImageFilter_opts.h" 14 #include "SkBlurImageFilter_opts.h"
15 #include "SkColorCubeFilter_opts.h" 15 #include "SkColorCubeFilter_opts.h"
16 #include "SkFloatingPoint_opts.h" 16 #include "SkFloatingPoint_opts.h"
17 #include "SkMatrix_opts.h" 17 #include "SkMatrix_opts.h"
18 #include "SkMorphologyImageFilter_opts.h" 18 #include "SkMorphologyImageFilter_opts.h"
19 #include "SkSwizzler_opts.h"
19 #include "SkTextureCompressor_opts.h" 20 #include "SkTextureCompressor_opts.h"
20 #include "SkUtils_opts.h" 21 #include "SkUtils_opts.h"
21 #include "SkXfermode_opts.h" 22 #include "SkXfermode_opts.h"
22 23
23 #if defined(SK_CPU_X86) && !defined(SK_BUILD_FOR_IOS) 24 #if defined(SK_CPU_X86) && !defined(SK_BUILD_FOR_IOS)
24 #if defined(SK_BUILD_FOR_WIN32) 25 #if defined(SK_BUILD_FOR_WIN32)
25 #include <intrin.h> 26 #include <intrin.h>
26 static void cpuid (uint32_t abcd[4]) { __cpuid ((int*)abcd, 1); } 27 static void cpuid (uint32_t abcd[4]) { __cpuid ((int*)abcd, 1); }
27 static void cpuid7(uint32_t abcd[4]) { __cpuidex((int*)abcd, 7, 0); } 28 static void cpuid7(uint32_t abcd[4]) { __cpuidex((int*)abcd, 7, 0); }
28 static uint64_t xgetbv(uint32_t xcr) { return _xgetbv(xcr); } 29 static uint64_t xgetbv(uint32_t xcr) { return _xgetbv(xcr); }
(...skipping 13 matching lines...) Expand all
42 return (uint64_t)(edx) << 32 | eax; 43 return (uint64_t)(edx) << 32 | eax;
43 } 44 }
44 #endif 45 #endif
45 #elif !defined(SK_ARM_HAS_NEON) && \ 46 #elif !defined(SK_ARM_HAS_NEON) && \
46 defined(SK_CPU_ARM32) && \ 47 defined(SK_CPU_ARM32) && \
47 defined(SK_BUILD_FOR_ANDROID) && \ 48 defined(SK_BUILD_FOR_ANDROID) && \
48 !defined(SK_BUILD_FOR_ANDROID_FRAMEWORK) 49 !defined(SK_BUILD_FOR_ANDROID_FRAMEWORK)
49 #include <cpu-features.h> 50 #include <cpu-features.h>
50 #endif 51 #endif
51 52
52 namespace sk_default {
53
54 // These variable names in these functions just pretend the input is BGRA.
55 // They work fine with both RGBA and BGRA.
56
57 static void premul_xxxa(uint32_t dst[], const uint32_t src[], int count) {
58 for (int i = 0; i < count; i++) {
59 uint8_t a = src[i] >> 24,
60 r = src[i] >> 16,
61 g = src[i] >> 8,
62 b = src[i] >> 0;
63 r = (r*a+127)/255;
64 g = (g*a+127)/255;
65 b = (b*a+127)/255;
66 dst[i] = (uint32_t)a << 24
67 | (uint32_t)r << 16
68 | (uint32_t)g << 8
69 | (uint32_t)b << 0;
70 }
71 }
72
73 static void swaprb_xxxa(uint32_t dst[], const uint32_t src[], int count) {
74 for (int i = 0; i < count; i++) {
75 uint8_t a = src[i] >> 24,
76 r = src[i] >> 16,
77 g = src[i] >> 8,
78 b = src[i] >> 0;
79 dst[i] = (uint32_t)a << 24
80 | (uint32_t)b << 16
81 | (uint32_t)g << 8
82 | (uint32_t)r << 0;
83 }
84 }
85
86 static void premul_swaprb_xxxa(uint32_t dst[], const uint32_t src[], int count) {
87 for (int i = 0; i < count; i++) {
88 uint8_t a = src[i] >> 24,
89 r = src[i] >> 16,
90 g = src[i] >> 8,
91 b = src[i] >> 0;
92 r = (r*a+127)/255;
93 g = (g*a+127)/255;
94 b = (b*a+127)/255;
95 dst[i] = (uint32_t)a << 24
96 | (uint32_t)b << 16
97 | (uint32_t)g << 8
98 | (uint32_t)r << 0;
99 }
100 }
101
102 } // namespace sk_default
103
104 namespace SkOpts { 53 namespace SkOpts {
105 // Define default function pointer values here... 54 // Define default function pointer values here...
106 // If our global compile options are set high enough, these defaults might e ven be 55 // If our global compile options are set high enough, these defaults might e ven be
107 // CPU-specialized, e.g. a typical x86-64 machine might start with SSE2 defa ults. 56 // CPU-specialized, e.g. a typical x86-64 machine might start with SSE2 defa ults.
108 // They'll still get a chance to be replaced with even better ones, e.g. usi ng SSE4.1. 57 // They'll still get a chance to be replaced with even better ones, e.g. usi ng SSE4.1.
109 decltype(rsqrt) rsqrt = sk_default::rsqrt; 58 decltype(rsqrt) rsqrt = sk_default::rsqrt;
110 decltype(memset16) memset16 = sk_default::memset16; 59 decltype(memset16) memset16 = sk_default::memset16;
111 decltype(memset32) memset32 = sk_default::memset32; 60 decltype(memset32) memset32 = sk_default::memset32;
112 decltype(create_xfermode) create_xfermode = sk_default::create_xfermode; 61 decltype(create_xfermode) create_xfermode = sk_default::create_xfermode;
113 decltype(color_cube_filter_span) color_cube_filter_span = sk_default::color_ cube_filter_span; 62 decltype(color_cube_filter_span) color_cube_filter_span = sk_default::color_ cube_filter_span;
(...skipping 11 matching lines...) Expand all
125 decltype(fill_block_dimensions) fill_block_dimensions = sk_default::fill_blo ck_dimensions; 74 decltype(fill_block_dimensions) fill_block_dimensions = sk_default::fill_blo ck_dimensions;
126 75
127 decltype(blit_mask_d32_a8) blit_mask_d32_a8 = sk_default::blit_mask_d32_a8; 76 decltype(blit_mask_d32_a8) blit_mask_d32_a8 = sk_default::blit_mask_d32_a8;
128 77
129 decltype(blit_row_color32) blit_row_color32 = sk_default::blit_row_color32; 78 decltype(blit_row_color32) blit_row_color32 = sk_default::blit_row_color32;
130 79
131 decltype(matrix_translate) matrix_translate = sk_default::matrix _translate; 80 decltype(matrix_translate) matrix_translate = sk_default::matrix _translate;
132 decltype(matrix_scale_translate) matrix_scale_translate = sk_default::matrix _scale_translate; 81 decltype(matrix_scale_translate) matrix_scale_translate = sk_default::matrix _scale_translate;
133 decltype(matrix_affine) matrix_affine = sk_default::matrix _affine; 82 decltype(matrix_affine) matrix_affine = sk_default::matrix _affine;
134 83
135 decltype( premul_xxxa) premul_xxxa = sk_default:: premul_ xxxa; 84 decltype( premul_xxxa) premul_xxxa = sk_default::premul_xxxa<fa lse>;
mtklein 2016/01/13 17:04:36 I'd prefer to add shims to SkSwizzler_opts.h to ke
msarett 2016/01/13 18:52:05 Agreed on all counts! Done.
136 decltype( swaprb_xxxa) swaprb_xxxa = sk_default:: swaprb_ xxxa; 85 decltype( swaprb_xxxa) swaprb_xxxa = sk_default::swaprb_xxxa;
137 decltype(premul_swaprb_xxxa) premul_swaprb_xxxa = sk_default::premul_swaprb_ xxxa; 86 decltype(premul_swaprb_xxxa) premul_swaprb_xxxa = sk_default::premul_xxxa<tr ue>;
138 87
139 // Each Init_foo() is defined in src/opts/SkOpts_foo.cpp. 88 // Each Init_foo() is defined in src/opts/SkOpts_foo.cpp.
140 void Init_ssse3(); 89 void Init_ssse3();
141 void Init_sse41(); 90 void Init_sse41();
142 void Init_sse42() {} 91 void Init_sse42() {}
143 void Init_avx(); 92 void Init_avx();
144 void Init_avx2() {} 93 void Init_avx2() {}
145 void Init_neon(); 94 void Init_neon();
146 95
147 static void init() { 96 static void init() {
(...skipping 26 matching lines...) Expand all
174 123
175 SK_DECLARE_STATIC_ONCE(gInitOnce); 124 SK_DECLARE_STATIC_ONCE(gInitOnce);
176 void Init() { SkOnce(&gInitOnce, init); } 125 void Init() { SkOnce(&gInitOnce, init); }
177 126
178 #if SK_ALLOW_STATIC_GLOBAL_INITIALIZERS 127 #if SK_ALLOW_STATIC_GLOBAL_INITIALIZERS
179 static struct AutoInit { 128 static struct AutoInit {
180 AutoInit() { Init(); } 129 AutoInit() { Init(); }
181 } gAutoInit; 130 } gAutoInit;
182 #endif 131 #endif
183 } 132 }
OLDNEW
« no previous file with comments | « no previous file | src/opts/SkOpts_neon.cpp » ('j') | src/opts/SkSwizzler_opts.h » ('J')

Powered by Google App Engine
This is Rietveld 408576698