OLD | NEW |
1 ; | 1 ; |
2 ; Copyright (c) 2010 The WebM project authors. All Rights Reserved. | 2 ; Copyright (c) 2010 The WebM project authors. All Rights Reserved. |
3 ; | 3 ; |
4 ; Use of this source code is governed by a BSD-style license | 4 ; Use of this source code is governed by a BSD-style license |
5 ; that can be found in the LICENSE file in the root of the source | 5 ; that can be found in the LICENSE file in the root of the source |
6 ; tree. An additional intellectual property rights grant can be found | 6 ; tree. An additional intellectual property rights grant can be found |
7 ; in the file PATENTS. All contributing project authors may | 7 ; in the file PATENTS. All contributing project authors may |
8 ; be found in the AUTHORS file in the root of the source tree. | 8 ; be found in the AUTHORS file in the root of the source tree. |
9 ; | 9 ; |
10 | 10 |
(...skipping 265 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
276 | 276 |
277 ;void vp8_loop_filter_horizontal_edge_sse2 | 277 ;void vp8_loop_filter_horizontal_edge_sse2 |
278 ;( | 278 ;( |
279 ; unsigned char *src_ptr, | 279 ; unsigned char *src_ptr, |
280 ; int src_pixel_step, | 280 ; int src_pixel_step, |
281 ; const char *flimit, | 281 ; const char *flimit, |
282 ; const char *limit, | 282 ; const char *limit, |
283 ; const char *thresh, | 283 ; const char *thresh, |
284 ; int count | 284 ; int count |
285 ;) | 285 ;) |
286 global sym(vp8_loop_filter_horizontal_edge_sse2) | 286 global sym(vp8_loop_filter_horizontal_edge_sse2) PRIVATE |
287 sym(vp8_loop_filter_horizontal_edge_sse2): | 287 sym(vp8_loop_filter_horizontal_edge_sse2): |
288 push rbp | 288 push rbp |
289 mov rbp, rsp | 289 mov rbp, rsp |
290 SHADOW_ARGS_TO_STACK 6 | 290 SHADOW_ARGS_TO_STACK 6 |
291 SAVE_XMM | 291 SAVE_XMM |
292 GET_GOT rbx | 292 GET_GOT rbx |
293 push rsi | 293 push rsi |
294 push rdi | 294 push rdi |
295 ; end prolog | 295 ; end prolog |
296 | 296 |
(...skipping 29 matching lines...) Expand all Loading... |
326 | 326 |
327 ;void vp8_loop_filter_horizontal_edge_uv_sse2 | 327 ;void vp8_loop_filter_horizontal_edge_uv_sse2 |
328 ;( | 328 ;( |
329 ; unsigned char *u, | 329 ; unsigned char *u, |
330 ; int src_pixel_step, | 330 ; int src_pixel_step, |
331 ; const char *flimit, | 331 ; const char *flimit, |
332 ; const char *limit, | 332 ; const char *limit, |
333 ; const char *thresh, | 333 ; const char *thresh, |
334 ; unsigned char *v | 334 ; unsigned char *v |
335 ;) | 335 ;) |
336 global sym(vp8_loop_filter_horizontal_edge_uv_sse2) | 336 global sym(vp8_loop_filter_horizontal_edge_uv_sse2) PRIVATE |
337 sym(vp8_loop_filter_horizontal_edge_uv_sse2): | 337 sym(vp8_loop_filter_horizontal_edge_uv_sse2): |
338 push rbp | 338 push rbp |
339 mov rbp, rsp | 339 mov rbp, rsp |
340 SHADOW_ARGS_TO_STACK 6 | 340 SHADOW_ARGS_TO_STACK 6 |
341 SAVE_XMM | 341 SAVE_XMM |
342 GET_GOT rbx | 342 GET_GOT rbx |
343 push rsi | 343 push rsi |
344 push rdi | 344 push rdi |
345 ; end prolog | 345 ; end prolog |
346 | 346 |
(...skipping 225 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
572 | 572 |
573 ;void vp8_mbloop_filter_horizontal_edge_sse2 | 573 ;void vp8_mbloop_filter_horizontal_edge_sse2 |
574 ;( | 574 ;( |
575 ; unsigned char *src_ptr, | 575 ; unsigned char *src_ptr, |
576 ; int src_pixel_step, | 576 ; int src_pixel_step, |
577 ; const char *flimit, | 577 ; const char *flimit, |
578 ; const char *limit, | 578 ; const char *limit, |
579 ; const char *thresh, | 579 ; const char *thresh, |
580 ; int count | 580 ; int count |
581 ;) | 581 ;) |
582 global sym(vp8_mbloop_filter_horizontal_edge_sse2) | 582 global sym(vp8_mbloop_filter_horizontal_edge_sse2) PRIVATE |
583 sym(vp8_mbloop_filter_horizontal_edge_sse2): | 583 sym(vp8_mbloop_filter_horizontal_edge_sse2): |
584 push rbp | 584 push rbp |
585 mov rbp, rsp | 585 mov rbp, rsp |
586 SHADOW_ARGS_TO_STACK 6 | 586 SHADOW_ARGS_TO_STACK 6 |
587 SAVE_XMM | 587 SAVE_XMM |
588 GET_GOT rbx | 588 GET_GOT rbx |
589 push rsi | 589 push rsi |
590 push rdi | 590 push rdi |
591 ; end prolog | 591 ; end prolog |
592 | 592 |
(...skipping 29 matching lines...) Expand all Loading... |
622 | 622 |
623 ;void vp8_mbloop_filter_horizontal_edge_uv_sse2 | 623 ;void vp8_mbloop_filter_horizontal_edge_uv_sse2 |
624 ;( | 624 ;( |
625 ; unsigned char *u, | 625 ; unsigned char *u, |
626 ; int src_pixel_step, | 626 ; int src_pixel_step, |
627 ; const char *flimit, | 627 ; const char *flimit, |
628 ; const char *limit, | 628 ; const char *limit, |
629 ; const char *thresh, | 629 ; const char *thresh, |
630 ; unsigned char *v | 630 ; unsigned char *v |
631 ;) | 631 ;) |
632 global sym(vp8_mbloop_filter_horizontal_edge_uv_sse2) | 632 global sym(vp8_mbloop_filter_horizontal_edge_uv_sse2) PRIVATE |
633 sym(vp8_mbloop_filter_horizontal_edge_uv_sse2): | 633 sym(vp8_mbloop_filter_horizontal_edge_uv_sse2): |
634 push rbp | 634 push rbp |
635 mov rbp, rsp | 635 mov rbp, rsp |
636 SHADOW_ARGS_TO_STACK 6 | 636 SHADOW_ARGS_TO_STACK 6 |
637 SAVE_XMM | 637 SAVE_XMM |
638 GET_GOT rbx | 638 GET_GOT rbx |
639 push rsi | 639 push rsi |
640 push rdi | 640 push rdi |
641 ; end prolog | 641 ; end prolog |
642 | 642 |
(...skipping 369 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
1012 | 1012 |
1013 ;void vp8_loop_filter_vertical_edge_sse2 | 1013 ;void vp8_loop_filter_vertical_edge_sse2 |
1014 ;( | 1014 ;( |
1015 ; unsigned char *src_ptr, | 1015 ; unsigned char *src_ptr, |
1016 ; int src_pixel_step, | 1016 ; int src_pixel_step, |
1017 ; const char *flimit, | 1017 ; const char *flimit, |
1018 ; const char *limit, | 1018 ; const char *limit, |
1019 ; const char *thresh, | 1019 ; const char *thresh, |
1020 ; int count | 1020 ; int count |
1021 ;) | 1021 ;) |
1022 global sym(vp8_loop_filter_vertical_edge_sse2) | 1022 global sym(vp8_loop_filter_vertical_edge_sse2) PRIVATE |
1023 sym(vp8_loop_filter_vertical_edge_sse2): | 1023 sym(vp8_loop_filter_vertical_edge_sse2): |
1024 push rbp | 1024 push rbp |
1025 mov rbp, rsp | 1025 mov rbp, rsp |
1026 SHADOW_ARGS_TO_STACK 6 | 1026 SHADOW_ARGS_TO_STACK 6 |
1027 SAVE_XMM | 1027 SAVE_XMM |
1028 GET_GOT rbx | 1028 GET_GOT rbx |
1029 push rsi | 1029 push rsi |
1030 push rdi | 1030 push rdi |
1031 ; end prolog | 1031 ; end prolog |
1032 | 1032 |
(...skipping 46 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
1079 | 1079 |
1080 ;void vp8_loop_filter_vertical_edge_uv_sse2 | 1080 ;void vp8_loop_filter_vertical_edge_uv_sse2 |
1081 ;( | 1081 ;( |
1082 ; unsigned char *u, | 1082 ; unsigned char *u, |
1083 ; int src_pixel_step, | 1083 ; int src_pixel_step, |
1084 ; const char *flimit, | 1084 ; const char *flimit, |
1085 ; const char *limit, | 1085 ; const char *limit, |
1086 ; const char *thresh, | 1086 ; const char *thresh, |
1087 ; unsigned char *v | 1087 ; unsigned char *v |
1088 ;) | 1088 ;) |
1089 global sym(vp8_loop_filter_vertical_edge_uv_sse2) | 1089 global sym(vp8_loop_filter_vertical_edge_uv_sse2) PRIVATE |
1090 sym(vp8_loop_filter_vertical_edge_uv_sse2): | 1090 sym(vp8_loop_filter_vertical_edge_uv_sse2): |
1091 push rbp | 1091 push rbp |
1092 mov rbp, rsp | 1092 mov rbp, rsp |
1093 SHADOW_ARGS_TO_STACK 6 | 1093 SHADOW_ARGS_TO_STACK 6 |
1094 SAVE_XMM | 1094 SAVE_XMM |
1095 GET_GOT rbx | 1095 GET_GOT rbx |
1096 push rsi | 1096 push rsi |
1097 push rdi | 1097 push rdi |
1098 ; end prolog | 1098 ; end prolog |
1099 | 1099 |
(...skipping 137 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
1237 | 1237 |
1238 ;void vp8_mbloop_filter_vertical_edge_sse2 | 1238 ;void vp8_mbloop_filter_vertical_edge_sse2 |
1239 ;( | 1239 ;( |
1240 ; unsigned char *src_ptr, | 1240 ; unsigned char *src_ptr, |
1241 ; int src_pixel_step, | 1241 ; int src_pixel_step, |
1242 ; const char *flimit, | 1242 ; const char *flimit, |
1243 ; const char *limit, | 1243 ; const char *limit, |
1244 ; const char *thresh, | 1244 ; const char *thresh, |
1245 ; int count | 1245 ; int count |
1246 ;) | 1246 ;) |
1247 global sym(vp8_mbloop_filter_vertical_edge_sse2) | 1247 global sym(vp8_mbloop_filter_vertical_edge_sse2) PRIVATE |
1248 sym(vp8_mbloop_filter_vertical_edge_sse2): | 1248 sym(vp8_mbloop_filter_vertical_edge_sse2): |
1249 push rbp | 1249 push rbp |
1250 mov rbp, rsp | 1250 mov rbp, rsp |
1251 SHADOW_ARGS_TO_STACK 6 | 1251 SHADOW_ARGS_TO_STACK 6 |
1252 SAVE_XMM | 1252 SAVE_XMM |
1253 GET_GOT rbx | 1253 GET_GOT rbx |
1254 push rsi | 1254 push rsi |
1255 push rdi | 1255 push rdi |
1256 ; end prolog | 1256 ; end prolog |
1257 | 1257 |
(...skipping 48 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
1306 | 1306 |
1307 ;void vp8_mbloop_filter_vertical_edge_uv_sse2 | 1307 ;void vp8_mbloop_filter_vertical_edge_uv_sse2 |
1308 ;( | 1308 ;( |
1309 ; unsigned char *u, | 1309 ; unsigned char *u, |
1310 ; int src_pixel_step, | 1310 ; int src_pixel_step, |
1311 ; const char *flimit, | 1311 ; const char *flimit, |
1312 ; const char *limit, | 1312 ; const char *limit, |
1313 ; const char *thresh, | 1313 ; const char *thresh, |
1314 ; unsigned char *v | 1314 ; unsigned char *v |
1315 ;) | 1315 ;) |
1316 global sym(vp8_mbloop_filter_vertical_edge_uv_sse2) | 1316 global sym(vp8_mbloop_filter_vertical_edge_uv_sse2) PRIVATE |
1317 sym(vp8_mbloop_filter_vertical_edge_uv_sse2): | 1317 sym(vp8_mbloop_filter_vertical_edge_uv_sse2): |
1318 push rbp | 1318 push rbp |
1319 mov rbp, rsp | 1319 mov rbp, rsp |
1320 SHADOW_ARGS_TO_STACK 6 | 1320 SHADOW_ARGS_TO_STACK 6 |
1321 SAVE_XMM | 1321 SAVE_XMM |
1322 GET_GOT rbx | 1322 GET_GOT rbx |
1323 push rsi | 1323 push rsi |
1324 push rdi | 1324 push rdi |
1325 ; end prolog | 1325 ; end prolog |
1326 | 1326 |
(...skipping 47 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
1374 | 1374 |
1375 ;void vp8_loop_filter_simple_horizontal_edge_sse2 | 1375 ;void vp8_loop_filter_simple_horizontal_edge_sse2 |
1376 ;( | 1376 ;( |
1377 ; unsigned char *src_ptr, | 1377 ; unsigned char *src_ptr, |
1378 ; int src_pixel_step, | 1378 ; int src_pixel_step, |
1379 ; const char *flimit, | 1379 ; const char *flimit, |
1380 ; const char *limit, | 1380 ; const char *limit, |
1381 ; const char *thresh, | 1381 ; const char *thresh, |
1382 ; int count | 1382 ; int count |
1383 ;) | 1383 ;) |
1384 global sym(vp8_loop_filter_simple_horizontal_edge_sse2) | 1384 global sym(vp8_loop_filter_simple_horizontal_edge_sse2) PRIVATE |
1385 sym(vp8_loop_filter_simple_horizontal_edge_sse2): | 1385 sym(vp8_loop_filter_simple_horizontal_edge_sse2): |
1386 push rbp | 1386 push rbp |
1387 mov rbp, rsp | 1387 mov rbp, rsp |
1388 SHADOW_ARGS_TO_STACK 6 | 1388 SHADOW_ARGS_TO_STACK 6 |
1389 SAVE_XMM | 1389 SAVE_XMM |
1390 GET_GOT rbx | 1390 GET_GOT rbx |
1391 push rsi | 1391 push rsi |
1392 push rdi | 1392 push rdi |
1393 ; end prolog | 1393 ; end prolog |
1394 | 1394 |
(...skipping 96 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
1491 | 1491 |
1492 ;void vp8_loop_filter_simple_vertical_edge_sse2 | 1492 ;void vp8_loop_filter_simple_vertical_edge_sse2 |
1493 ;( | 1493 ;( |
1494 ; unsigned char *src_ptr, | 1494 ; unsigned char *src_ptr, |
1495 ; int src_pixel_step, | 1495 ; int src_pixel_step, |
1496 ; const char *flimit, | 1496 ; const char *flimit, |
1497 ; const char *limit, | 1497 ; const char *limit, |
1498 ; const char *thresh, | 1498 ; const char *thresh, |
1499 ; int count | 1499 ; int count |
1500 ;) | 1500 ;) |
1501 global sym(vp8_loop_filter_simple_vertical_edge_sse2) | 1501 global sym(vp8_loop_filter_simple_vertical_edge_sse2) PRIVATE |
1502 sym(vp8_loop_filter_simple_vertical_edge_sse2): | 1502 sym(vp8_loop_filter_simple_vertical_edge_sse2): |
1503 push rbp ; save old base pointer value. | 1503 push rbp ; save old base pointer value. |
1504 mov rbp, rsp ; set new base pointer value. | 1504 mov rbp, rsp ; set new base pointer value. |
1505 SHADOW_ARGS_TO_STACK 6 | 1505 SHADOW_ARGS_TO_STACK 6 |
1506 SAVE_XMM | 1506 SAVE_XMM |
1507 GET_GOT rbx ; save callee-saved reg | 1507 GET_GOT rbx ; save callee-saved reg |
1508 push rsi | 1508 push rsi |
1509 push rdi | 1509 push rdi |
1510 ; end prolog | 1510 ; end prolog |
1511 | 1511 |
(...skipping 259 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
1771 times 16 db 0x04 | 1771 times 16 db 0x04 |
1772 align 16 | 1772 align 16 |
1773 ones: ; 16-byte-aligned table: eight 16-bit words, each 0x0001 | 1773 ones: ; 16-byte-aligned table: eight 16-bit words, each 0x0001 |
1774 times 8 dw 0x0001 | 1774 times 8 dw 0x0001 |
1775 align 16 | 1775 align 16 |
1776 s9: ; 16-byte-aligned table: eight 16-bit words, each 0x0900 (9 in the high byte) | 1776 s9: ; 16-byte-aligned table: eight 16-bit words, each 0x0900 (9 in the high byte) |
1777 times 8 dw 0x0900 | 1777 times 8 dw 0x0900 |
1778 align 16 | 1778 align 16 |
1779 s63: ; 16-byte-aligned table: eight 16-bit words, each 0x003f (decimal 63) | 1779 s63: ; 16-byte-aligned table: eight 16-bit words, each 0x003f (decimal 63) |
1780 times 8 dw 0x003f | 1780 times 8 dw 0x003f |
OLD | NEW |