| OLD | NEW | 
|---|
| 1 /* | 1 /* | 
| 2  * Copyright 2014 | 2  * Copyright 2014 | 
| 3  * | 3  * | 
| 4  * Use of this source code is governed by a BSD-style license that can be | 4  * Use of this source code is governed by a BSD-style license that can be | 
| 5  * found in the LICENSE file. | 5  * found in the LICENSE file. | 
| 6  */ | 6  */ | 
| 7 | 7 | 
| 8 #include "SkTextureCompressor.h" | 8 #include "SkTextureCompressor.h" | 
| 9 #include "SkTextureCompression_opts.h" | 9 #include "SkTextureCompression_opts.h" | 
| 10 | 10 | 
| (...skipping 129 matching lines...) Expand 10 before | Expand all | Expand 10 after  Loading... | 
| 140 #if defined (SK_CPU_BENDIAN) | 140 #if defined (SK_CPU_BENDIAN) | 
| 141 static inline uint64x2_t fix_endianness(uint64x2_t x) { | 141 static inline uint64x2_t fix_endianness(uint64x2_t x) { | 
| 142     return x; | 142     return x; | 
| 143 } | 143 } | 
| 144 #else | 144 #else | 
| 145 static inline uint64x2_t fix_endianness(uint64x2_t x) { | 145 static inline uint64x2_t fix_endianness(uint64x2_t x) { | 
| 146     return vreinterpretq_u64_u8(vrev64q_u8(vreinterpretq_u8_u64(x))); | 146     return vreinterpretq_u64_u8(vrev64q_u8(vreinterpretq_u8_u64(x))); | 
| 147 } | 147 } | 
| 148 #endif | 148 #endif | 
| 149 | 149 | 
| 150 static void compress_r11eac_blocks(uint64_t* dst, const uint8_t* src, int rowByt
     es) { | 150 static void compress_r11eac_blocks(uint64_t* dst, const uint8_t* src, size_t row
     Bytes) { | 
| 151 | 151 | 
| 152     // Try to avoid switching between vector and non-vector ops... | 152     // Try to avoid switching between vector and non-vector ops... | 
| 153     const uint8_t *const src1 = src; | 153     const uint8_t *const src1 = src; | 
| 154     const uint8_t *const src2 = src + rowBytes; | 154     const uint8_t *const src2 = src + rowBytes; | 
| 155     const uint8_t *const src3 = src + 2*rowBytes; | 155     const uint8_t *const src3 = src + 2*rowBytes; | 
| 156     const uint8_t *const src4 = src + 3*rowBytes; | 156     const uint8_t *const src4 = src + 3*rowBytes; | 
| 157     uint64_t *const dst1 = dst; | 157     uint64_t *const dst1 = dst; | 
| 158     uint64_t *const dst2 = dst + 2; | 158     uint64_t *const dst2 = dst + 2; | 
| 159 | 159 | 
| 160     const uint8x16_t alphaRow1 = vld1q_u8(src1); | 160     const uint8x16_t alphaRow1 = vld1q_u8(src1); | 
| (...skipping 40 matching lines...) Expand 10 before | Expand all | Expand 10 after  Loading... | 
| 201     const uint64x2_t indicesLeft = fix_endianness(pack_indices(blockIndicesLeft)
     ); | 201     const uint64x2_t indicesLeft = fix_endianness(pack_indices(blockIndicesLeft)
     ); | 
| 202     const uint64x2_t indicesRight = fix_endianness(pack_indices(blockIndicesRigh
     t)); | 202     const uint64x2_t indicesRight = fix_endianness(pack_indices(blockIndicesRigh
     t)); | 
| 203 | 203 | 
| 204     const uint64x2_t d1 = vcombine_u64(vget_low_u64(indicesLeft), vget_low_u64(i
     ndicesRight)); | 204     const uint64x2_t d1 = vcombine_u64(vget_low_u64(indicesLeft), vget_low_u64(i
     ndicesRight)); | 
| 205     const uint64x2_t d2 = vcombine_u64(vget_high_u64(indicesLeft), vget_high_u64
     (indicesRight)); | 205     const uint64x2_t d2 = vcombine_u64(vget_high_u64(indicesLeft), vget_high_u64
     (indicesRight)); | 
| 206     vst1q_u64(dst1, d1); | 206     vst1q_u64(dst1, d1); | 
| 207     vst1q_u64(dst2, d2); | 207     vst1q_u64(dst2, d2); | 
| 208 } | 208 } | 
| 209 | 209 | 
| 210 bool CompressA8toR11EAC_NEON(uint8_t* dst, const uint8_t* src, | 210 bool CompressA8toR11EAC_NEON(uint8_t* dst, const uint8_t* src, | 
| 211                              int width, int height, int rowBytes) { | 211                              int width, int height, size_t rowBytes) { | 
| 212 | 212 | 
| 213     // Since we're going to operate on 4 blocks at a time, the src width | 213     // Since we're going to operate on 4 blocks at a time, the src width | 
| 214     // must be a multiple of 16. However, the height only needs to be a | 214     // must be a multiple of 16. However, the height only needs to be a | 
| 215     // multiple of 4 | 215     // multiple of 4 | 
| 216     if (0 == width || 0 == height || (width % 16) != 0 || (height % 4) != 0) { | 216     if (0 == width || 0 == height || (width % 16) != 0 || (height % 4) != 0) { | 
| 217         return SkTextureCompressor::CompressBufferToFormat( | 217         return SkTextureCompressor::CompressBufferToFormat( | 
| 218             dst, src, | 218             dst, src, | 
| 219             kAlpha_8_SkColorType, | 219             kAlpha_8_SkColorType, | 
| 220             width, height, rowBytes, | 220             width, height, rowBytes, | 
| 221             SkTextureCompressor::kR11_EAC_Format, false); | 221             SkTextureCompressor::kR11_EAC_Format, false); | 
| 222     } | 222     } | 
| 223 | 223 | 
| 224     const int blocksX = width >> 2; | 224     const int blocksX = width >> 2; | 
| 225     const int blocksY = height >> 2; | 225     const int blocksY = height >> 2; | 
| 226 | 226 | 
| 227     SkASSERT((blocksX % 4) == 0); | 227     SkASSERT((blocksX % 4) == 0); | 
| 228 | 228 | 
| 229     uint64_t* encPtr = reinterpret_cast<uint64_t*>(dst); | 229     uint64_t* encPtr = reinterpret_cast<uint64_t*>(dst); | 
| 230     for (int y = 0; y < blocksY; ++y) { | 230     for (int y = 0; y < blocksY; ++y) { | 
| 231         for (int x = 0; x < blocksX; x+=4) { | 231         for (int x = 0; x < blocksX; x+=4) { | 
| 232             // Compress it | 232             // Compress it | 
| 233             compress_r11eac_blocks(encPtr, src + 4*x, rowBytes); | 233             compress_r11eac_blocks(encPtr, src + 4*x, rowBytes); | 
| 234             encPtr += 4; | 234             encPtr += 4; | 
| 235         } | 235         } | 
| 236         src += 4 * rowBytes; | 236         src += 4 * rowBytes; | 
| 237     } | 237     } | 
| 238     return true; | 238     return true; | 
| 239 } | 239 } | 
| OLD | NEW | 
|---|