OLD | NEW |
1 ; | 1 ; |
2 ; Copyright (c) 2010 The WebM project authors. All Rights Reserved. | 2 ; Copyright (c) 2010 The WebM project authors. All Rights Reserved. |
3 ; | 3 ; |
4 ; Use of this source code is governed by a BSD-style license | 4 ; Use of this source code is governed by a BSD-style license |
5 ; that can be found in the LICENSE file in the root of the source | 5 ; that can be found in the LICENSE file in the root of the source |
6 ; tree. An additional intellectual property rights grant can be found | 6 ; tree. An additional intellectual property rights grant can be found |
7 ; in the file PATENTS. All contributing project authors may | 7 ; in the file PATENTS. All contributing project authors may |
8 ; be found in the AUTHORS file in the root of the source tree. | 8 ; be found in the AUTHORS file in the root of the source tree. |
9 ; | 9 ; |
10 | 10 |
(...skipping 254 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
265 movq xmm1, [rsi + rdx + 8] ;B | 265 movq xmm1, [rsi + rdx + 8] ;B |
266 movq xmm2, [rsi + rdx * 2 + 8] ;C | 266 movq xmm2, [rsi + rdx * 2 + 8] ;C |
267 movq xmm3, [rax + rdx * 2 + 8] ;D | 267 movq xmm3, [rax + rdx * 2 + 8] ;D |
268 movq xmm4, [rsi + rdx * 4 + 8] ;E | 268 movq xmm4, [rsi + rdx * 4 + 8] ;E |
269 movq xmm5, [rax + rdx * 4 + 8] ;F | 269 movq xmm5, [rax + rdx * 4 + 8] ;F |
270 | 270 |
271 punpcklbw xmm0, xmm1 ;A B | 271 punpcklbw xmm0, xmm1 ;A B |
272 punpcklbw xmm2, xmm3 ;C D | 272 punpcklbw xmm2, xmm3 ;C D |
273 punpcklbw xmm4, xmm5 ;E F | 273 punpcklbw xmm4, xmm5 ;E F |
274 | 274 |
275 | |
276 movq xmm6, [rsi + rbx + 8] ;G | 275 movq xmm6, [rsi + rbx + 8] ;G |
277 movq xmm7, [rax + rbx + 8] ;H | 276 movq xmm7, [rax + rbx + 8] ;H |
278 punpcklbw xmm6, xmm7 ;G H | 277 punpcklbw xmm6, xmm7 ;G H |
279 | 278 |
280 | |
281 pmaddubsw xmm0, k0k1 | 279 pmaddubsw xmm0, k0k1 |
282 pmaddubsw xmm2, k2k3 | 280 pmaddubsw xmm2, k2k3 |
283 pmaddubsw xmm4, k4k5 | 281 pmaddubsw xmm4, k4k5 |
284 pmaddubsw xmm6, k6k7 | 282 pmaddubsw xmm6, k6k7 |
285 | 283 |
286 paddsw xmm0, xmm6 | 284 paddsw xmm0, xmm6 |
| 285 movdqa xmm1, xmm2 |
| 286 pmaxsw xmm2, xmm4 |
| 287 pminsw xmm4, xmm1 |
| 288 paddsw xmm0, xmm4 |
287 paddsw xmm0, xmm2 | 289 paddsw xmm0, xmm2 |
288 paddsw xmm0, xmm4 | 290 |
289 paddsw xmm0, krd | 291 paddsw xmm0, krd |
290 | |
291 psraw xmm0, 7 | 292 psraw xmm0, 7 |
292 packuswb xmm0, xmm0 | 293 packuswb xmm0, xmm0 |
293 | 294 |
294 add rsi, rdx | 295 add rsi, rdx |
295 add rax, rdx | 296 add rax, rdx |
296 %if %1 | 297 %if %1 |
297 movq xmm1, [rdi+8] | 298 movq xmm1, [rdi+8] |
298 pavgb xmm0, xmm1 | 299 pavgb xmm0, xmm1 |
299 %endif | 300 %endif |
300 | 301 |
(...skipping 750 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
1051 db 0, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6, 6, 7, 7, 8 | 1052 db 0, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6, 6, 7, 7, 8 |
1052 align 16 | 1053 align 16 |
1053 shuf_t2t3: | 1054 shuf_t2t3: |
1054 db 2, 3, 3, 4, 4, 5, 5, 6, 6, 7, 7, 8, 8, 9, 9, 10 | 1055 db 2, 3, 3, 4, 4, 5, 5, 6, 6, 7, 7, 8, 8, 9, 9, 10 |
1055 align 16 | 1056 align 16 |
1056 shuf_t4t5: | 1057 shuf_t4t5: |
1057 db 4, 5, 5, 6, 6, 7, 7, 8, 8, 9, 9, 10, 10, 11, 11, 12 | 1058 db 4, 5, 5, 6, 6, 7, 7, 8, 8, 9, 9, 10, 10, 11, 11, 12 |
1058 align 16 | 1059 align 16 |
1059 shuf_t6t7: | 1060 shuf_t6t7: |
1060 db 6, 7, 7, 8, 8, 9, 9, 10, 10, 11, 11, 12, 12, 13, 13, 14 | 1061 db 6, 7, 7, 8, 8, 9, 9, 10, 10, 11, 11, 12, 12, 13, 13, 14 |
OLD | NEW |