OLD | NEW |
(Empty) | |
; Select the code section according to the assembler output format:
;   obj   -> 32-bit "code" segment, 64-byte aligned
;   win32 -> .text, 64-byte aligned (plus the @feat.00 handling below)
;   other -> plain .text
| 1 %ifidn __OUTPUT_FORMAT__,obj |
| 2 section code use32 class=code align=64 |
| 3 %elifidn __OUTPUT_FORMAT__,win32 |
| 4 %ifdef __YASM_VERSION_ID__ |
| 5 %if __YASM_VERSION_ID__ < 01010000h |
| 6 %error yasm version 1.1.0 or later needed. |
| 7 %endif |
| 8 ; Yasm automatically includes @feat.00 and complains about redefining it. |
| 9 ; https://www.tortall.net/projects/yasm/manual/html/objfmt-win32-safeseh.html |
| 10 %else |
; Non-Yasm assemblers: define the @feat.00 symbol explicitly.
; NOTE(review): per the manual page linked above this relates to SafeSEH
; marking of the object file - confirm the intended value.
| 11 $@feat.00 equ 1 |
| 12 %endif |
| 13 section .text code align=64 |
| 14 %else |
| 15 section .text code |
| 16 %endif |
| 17 ;extern _OPENSSL_ia32cap_P |
; -----------------------------------------------------------------------
; _aesni_encrypt: encrypt a single 16-byte block using AES-NI.
; Arguments are read from the stack (32-bit, relative to esp on entry):
;   [esp+4]  = pointer to the 16-byte input block
;   [esp+8]  = pointer to the 16-byte output block
;   [esp+12] = pointer to the key schedule; the dword at offset 240 is
;              used as the round-loop counter
; Clobbers eax, ecx, edx and flags. xmm0-xmm2 are zeroed before return so
; that no key or data material is left in registers.
; The db sequences are hand-encoded AES-NI opcodes:
;   102,15,56,220,209 = aesenc     xmm2,xmm1
;   102,15,56,221,209 = aesenclast xmm2,xmm1
; -----------------------------------------------------------------------
| 18 global _aesni_encrypt |
| 19 align 16 |
| 20 _aesni_encrypt: |
| 21 L$_aesni_encrypt_begin: |
| 22 mov eax,DWORD [4+esp] |
| 23 mov edx,DWORD [12+esp] |
| 24 movups xmm2,[eax] |
| 25 mov ecx,DWORD [240+edx] |
| 26 mov eax,DWORD [8+esp] |
| 27 movups xmm0,[edx] |
| 28 movups xmm1,[16+edx] |
| 29 lea edx,[32+edx] |
; Whitening: block ^= round key 0.
| 30 xorps xmm2,xmm0 |
; One aesenc per iteration; xmm1 always holds the next round key.
; jnz tests the flags from "dec ecx" (movups/lea leave flags untouched).
| 31 L$000enc1_loop_1: |
| 32 db 102,15,56,220,209 |
| 33 dec ecx |
| 34 movups xmm1,[edx] |
| 35 lea edx,[16+edx] |
| 36 jnz NEAR L$000enc1_loop_1 |
; Final round (aesenclast) with the last key loaded by the loop.
| 37 db 102,15,56,221,209 |
; Scrub key material, store the result, then scrub the data register.
| 38 pxor xmm0,xmm0 |
| 39 pxor xmm1,xmm1 |
| 40 movups [eax],xmm2 |
| 41 pxor xmm2,xmm2 |
| 42 ret |
; -----------------------------------------------------------------------
; _aesni_decrypt: decrypt a single 16-byte block using AES-NI.
; Arguments are read from the stack (32-bit, relative to esp on entry):
;   [esp+4]  = pointer to the 16-byte input block
;   [esp+8]  = pointer to the 16-byte output block
;   [esp+12] = pointer to the key schedule; the dword at offset 240 is
;              used as the round-loop counter
; Clobbers eax, ecx, edx and flags. xmm0-xmm2 are zeroed before return.
; The db sequences are hand-encoded AES-NI opcodes:
;   102,15,56,222,209 = aesdec     xmm2,xmm1
;   102,15,56,223,209 = aesdeclast xmm2,xmm1
; -----------------------------------------------------------------------
| 43 global _aesni_decrypt |
| 44 align 16 |
| 45 _aesni_decrypt: |
| 46 L$_aesni_decrypt_begin: |
| 47 mov eax,DWORD [4+esp] |
| 48 mov edx,DWORD [12+esp] |
| 49 movups xmm2,[eax] |
| 50 mov ecx,DWORD [240+edx] |
| 51 mov eax,DWORD [8+esp] |
| 52 movups xmm0,[edx] |
| 53 movups xmm1,[16+edx] |
| 54 lea edx,[32+edx] |
; Whitening: block ^= first key of the schedule.
| 55 xorps xmm2,xmm0 |
; One aesdec per iteration; xmm1 always holds the next round key.
; jnz tests the flags from "dec ecx" (movups/lea leave flags untouched).
| 56 L$001dec1_loop_2: |
| 57 db 102,15,56,222,209 |
| 58 dec ecx |
| 59 movups xmm1,[edx] |
| 60 lea edx,[16+edx] |
| 61 jnz NEAR L$001dec1_loop_2 |
; Final round (aesdeclast) with the last key loaded by the loop.
| 62 db 102,15,56,223,209 |
; Scrub key material, store the result, then scrub the data register.
| 63 pxor xmm0,xmm0 |
| 64 pxor xmm1,xmm1 |
| 65 movups [eax],xmm2 |
| 66 pxor xmm2,xmm2 |
| 67 ret |
; -----------------------------------------------------------------------
; __aesni_encrypt2: internal helper, encrypts two blocks in parallel.
; Register interface (no stack arguments):
;   In:    edx = key schedule pointer, ecx = round count,
;          xmm2, xmm3 = the two blocks
;   Out:   xmm2, xmm3 = encrypted blocks
;   Clobb: ecx, edx, xmm0, xmm1, flags (callers must reload ecx/edx)
; db 102,15,56,220,M is aesenc and db 102,15,56,221,M is aesenclast;
; M = 209/217 applies xmm1 to xmm2/xmm3, M = 208/216 applies xmm0.
; -----------------------------------------------------------------------
| 68 align 16 |
| 69 __aesni_encrypt2: |
| 70 movups xmm0,[edx] |
| 71 shl ecx,4 |
| 72 movups xmm1,[16+edx] |
; Whitening of both lanes with the first round key.
| 73 xorps xmm2,xmm0 |
| 74 pxor xmm3,xmm0 |
| 75 movups xmm0,[32+edx] |
; edx now points past the schedule region indexed by the loop and ecx
; becomes a negative byte offset that counts up towards zero.
| 76 lea edx,[32+ecx*1+edx] |
| 77 neg ecx |
| 78 add ecx,16 |
; Two rounds per iteration, alternating round keys in xmm1 and xmm0.
; jnz consumes the flags of "add ecx,32" (movups does not alter flags).
| 79 L$002enc2_loop: |
| 80 db 102,15,56,220,209 |
| 81 db 102,15,56,220,217 |
| 82 movups xmm1,[ecx*1+edx] |
| 83 add ecx,32 |
| 84 db 102,15,56,220,208 |
| 85 db 102,15,56,220,216 |
| 86 movups xmm0,[ecx*1+edx-16] |
| 87 jnz NEAR L$002enc2_loop |
; Last regular round with xmm1, then aesenclast with xmm0.
| 88 db 102,15,56,220,209 |
| 89 db 102,15,56,220,217 |
| 90 db 102,15,56,221,208 |
| 91 db 102,15,56,221,216 |
| 92 ret |
; -----------------------------------------------------------------------
; __aesni_decrypt2: internal helper, decrypts two blocks in parallel.
; Register interface (no stack arguments):
;   In:    edx = key schedule pointer, ecx = round count,
;          xmm2, xmm3 = the two blocks
;   Out:   xmm2, xmm3 = decrypted blocks
;   Clobb: ecx, edx, xmm0, xmm1, flags (callers must reload ecx/edx)
; db 102,15,56,222,M is aesdec and db 102,15,56,223,M is aesdeclast;
; M = 209/217 applies xmm1 to xmm2/xmm3, M = 208/216 applies xmm0.
; -----------------------------------------------------------------------
| 93 align 16 |
| 94 __aesni_decrypt2: |
| 95 movups xmm0,[edx] |
| 96 shl ecx,4 |
| 97 movups xmm1,[16+edx] |
; Whitening of both lanes with the first key of the schedule.
| 98 xorps xmm2,xmm0 |
| 99 pxor xmm3,xmm0 |
| 100 movups xmm0,[32+edx] |
; edx now points past the schedule region indexed by the loop and ecx
; becomes a negative byte offset that counts up towards zero.
| 101 lea edx,[32+ecx*1+edx] |
| 102 neg ecx |
| 103 add ecx,16 |
; Two rounds per iteration, alternating round keys in xmm1 and xmm0.
; jnz consumes the flags of "add ecx,32" (movups does not alter flags).
| 104 L$003dec2_loop: |
| 105 db 102,15,56,222,209 |
| 106 db 102,15,56,222,217 |
| 107 movups xmm1,[ecx*1+edx] |
| 108 add ecx,32 |
| 109 db 102,15,56,222,208 |
| 110 db 102,15,56,222,216 |
| 111 movups xmm0,[ecx*1+edx-16] |
| 112 jnz NEAR L$003dec2_loop |
; Last regular round with xmm1, then aesdeclast with xmm0.
| 113 db 102,15,56,222,209 |
| 114 db 102,15,56,222,217 |
| 115 db 102,15,56,223,208 |
| 116 db 102,15,56,223,216 |
| 117 ret |
; -----------------------------------------------------------------------
; __aesni_encrypt3: internal helper, encrypts three blocks in parallel.
; Register interface (no stack arguments):
;   In:    edx = key schedule pointer, ecx = round count,
;          xmm2, xmm3, xmm4 = the three blocks
;   Out:   xmm2, xmm3, xmm4 = encrypted blocks
;   Clobb: ecx, edx, xmm0, xmm1, flags (callers must reload ecx/edx)
; db 102,15,56,220,M is aesenc and db 102,15,56,221,M is aesenclast;
; M = 209/217/225 applies xmm1 to xmm2/xmm3/xmm4, M = 208/216/224 applies
; xmm0 to the same lanes.
; -----------------------------------------------------------------------
| 118 align 16 |
| 119 __aesni_encrypt3: |
| 120 movups xmm0,[edx] |
| 121 shl ecx,4 |
| 122 movups xmm1,[16+edx] |
; Whitening of all lanes with the first round key.
| 123 xorps xmm2,xmm0 |
| 124 pxor xmm3,xmm0 |
| 125 pxor xmm4,xmm0 |
| 126 movups xmm0,[32+edx] |
; ecx becomes a negative byte offset from the adjusted edx, counting up
; towards zero.
| 127 lea edx,[32+ecx*1+edx] |
| 128 neg ecx |
| 129 add ecx,16 |
; Two rounds per iteration; jnz consumes the flags of "add ecx,32".
| 130 L$004enc3_loop: |
| 131 db 102,15,56,220,209 |
| 132 db 102,15,56,220,217 |
| 133 db 102,15,56,220,225 |
| 134 movups xmm1,[ecx*1+edx] |
| 135 add ecx,32 |
| 136 db 102,15,56,220,208 |
| 137 db 102,15,56,220,216 |
| 138 db 102,15,56,220,224 |
| 139 movups xmm0,[ecx*1+edx-16] |
| 140 jnz NEAR L$004enc3_loop |
; Last regular round with xmm1, then aesenclast with xmm0.
| 141 db 102,15,56,220,209 |
| 142 db 102,15,56,220,217 |
| 143 db 102,15,56,220,225 |
| 144 db 102,15,56,221,208 |
| 145 db 102,15,56,221,216 |
| 146 db 102,15,56,221,224 |
| 147 ret |
; -----------------------------------------------------------------------
; __aesni_decrypt3: internal helper, decrypts three blocks in parallel.
; Register interface (no stack arguments):
;   In:    edx = key schedule pointer, ecx = round count,
;          xmm2, xmm3, xmm4 = the three blocks
;   Out:   xmm2, xmm3, xmm4 = decrypted blocks
;   Clobb: ecx, edx, xmm0, xmm1, flags (callers must reload ecx/edx)
; db 102,15,56,222,M is aesdec and db 102,15,56,223,M is aesdeclast;
; M = 209/217/225 applies xmm1 to xmm2/xmm3/xmm4, M = 208/216/224 applies
; xmm0 to the same lanes.
; -----------------------------------------------------------------------
| 148 align 16 |
| 149 __aesni_decrypt3: |
| 150 movups xmm0,[edx] |
| 151 shl ecx,4 |
| 152 movups xmm1,[16+edx] |
; Whitening of all lanes with the first key of the schedule.
| 153 xorps xmm2,xmm0 |
| 154 pxor xmm3,xmm0 |
| 155 pxor xmm4,xmm0 |
| 156 movups xmm0,[32+edx] |
; ecx becomes a negative byte offset from the adjusted edx, counting up
; towards zero.
| 157 lea edx,[32+ecx*1+edx] |
| 158 neg ecx |
| 159 add ecx,16 |
; Two rounds per iteration; jnz consumes the flags of "add ecx,32".
| 160 L$005dec3_loop: |
| 161 db 102,15,56,222,209 |
| 162 db 102,15,56,222,217 |
| 163 db 102,15,56,222,225 |
| 164 movups xmm1,[ecx*1+edx] |
| 165 add ecx,32 |
| 166 db 102,15,56,222,208 |
| 167 db 102,15,56,222,216 |
| 168 db 102,15,56,222,224 |
| 169 movups xmm0,[ecx*1+edx-16] |
| 170 jnz NEAR L$005dec3_loop |
; Last regular round with xmm1, then aesdeclast with xmm0.
| 171 db 102,15,56,222,209 |
| 172 db 102,15,56,222,217 |
| 173 db 102,15,56,222,225 |
| 174 db 102,15,56,223,208 |
| 175 db 102,15,56,223,216 |
| 176 db 102,15,56,223,224 |
| 177 ret |
; -----------------------------------------------------------------------
; __aesni_encrypt4: internal helper, encrypts four blocks in parallel.
; Register interface (no stack arguments):
;   In:    edx = key schedule pointer, ecx = round count,
;          xmm2..xmm5 = the four blocks
;   Out:   xmm2..xmm5 = encrypted blocks
;   Clobb: ecx, edx, xmm0, xmm1, flags (callers must reload ecx/edx)
; db 102,15,56,220,M is aesenc and db 102,15,56,221,M is aesenclast;
; M = 209/217/225/233 applies xmm1 to xmm2..xmm5, M = 208/216/224/232
; applies xmm0 to the same lanes.
; -----------------------------------------------------------------------
| 178 align 16 |
| 179 __aesni_encrypt4: |
| 180 movups xmm0,[edx] |
| 181 movups xmm1,[16+edx] |
| 182 shl ecx,4 |
; Whitening of all lanes with the first round key.
| 183 xorps xmm2,xmm0 |
| 184 pxor xmm3,xmm0 |
| 185 pxor xmm4,xmm0 |
| 186 pxor xmm5,xmm0 |
| 187 movups xmm0,[32+edx] |
| 188 lea edx,[32+ecx*1+edx] |
| 189 neg ecx |
; 15,31,64,0 = 0F 1F 40 00, a 4-byte NOP (padding before the loop).
| 190 db 15,31,64,0 |
| 191 add ecx,16 |
; Two rounds per iteration; jnz consumes the flags of "add ecx,32".
| 192 L$006enc4_loop: |
| 193 db 102,15,56,220,209 |
| 194 db 102,15,56,220,217 |
| 195 db 102,15,56,220,225 |
| 196 db 102,15,56,220,233 |
| 197 movups xmm1,[ecx*1+edx] |
| 198 add ecx,32 |
| 199 db 102,15,56,220,208 |
| 200 db 102,15,56,220,216 |
| 201 db 102,15,56,220,224 |
| 202 db 102,15,56,220,232 |
| 203 movups xmm0,[ecx*1+edx-16] |
| 204 jnz NEAR L$006enc4_loop |
; Last regular round with xmm1, then aesenclast with xmm0.
| 205 db 102,15,56,220,209 |
| 206 db 102,15,56,220,217 |
| 207 db 102,15,56,220,225 |
| 208 db 102,15,56,220,233 |
| 209 db 102,15,56,221,208 |
| 210 db 102,15,56,221,216 |
| 211 db 102,15,56,221,224 |
| 212 db 102,15,56,221,232 |
| 213 ret |
; -----------------------------------------------------------------------
; __aesni_decrypt4: internal helper, decrypts four blocks in parallel.
; Register interface (no stack arguments):
;   In:    edx = key schedule pointer, ecx = round count,
;          xmm2..xmm5 = the four blocks
;   Out:   xmm2..xmm5 = decrypted blocks
;   Clobb: ecx, edx, xmm0, xmm1, flags (callers must reload ecx/edx)
; db 102,15,56,222,M is aesdec and db 102,15,56,223,M is aesdeclast;
; M = 209/217/225/233 applies xmm1 to xmm2..xmm5, M = 208/216/224/232
; applies xmm0 to the same lanes.
; -----------------------------------------------------------------------
| 214 align 16 |
| 215 __aesni_decrypt4: |
| 216 movups xmm0,[edx] |
| 217 movups xmm1,[16+edx] |
| 218 shl ecx,4 |
; Whitening of all lanes with the first key of the schedule.
| 219 xorps xmm2,xmm0 |
| 220 pxor xmm3,xmm0 |
| 221 pxor xmm4,xmm0 |
| 222 pxor xmm5,xmm0 |
| 223 movups xmm0,[32+edx] |
| 224 lea edx,[32+ecx*1+edx] |
| 225 neg ecx |
; 15,31,64,0 = 0F 1F 40 00, a 4-byte NOP (padding before the loop).
| 226 db 15,31,64,0 |
| 227 add ecx,16 |
; Two rounds per iteration; jnz consumes the flags of "add ecx,32".
| 228 L$007dec4_loop: |
| 229 db 102,15,56,222,209 |
| 230 db 102,15,56,222,217 |
| 231 db 102,15,56,222,225 |
| 232 db 102,15,56,222,233 |
| 233 movups xmm1,[ecx*1+edx] |
| 234 add ecx,32 |
| 235 db 102,15,56,222,208 |
| 236 db 102,15,56,222,216 |
| 237 db 102,15,56,222,224 |
| 238 db 102,15,56,222,232 |
| 239 movups xmm0,[ecx*1+edx-16] |
| 240 jnz NEAR L$007dec4_loop |
; Last regular round with xmm1, then aesdeclast with xmm0.
| 241 db 102,15,56,222,209 |
| 242 db 102,15,56,222,217 |
| 243 db 102,15,56,222,225 |
| 244 db 102,15,56,222,233 |
| 245 db 102,15,56,223,208 |
| 246 db 102,15,56,223,216 |
| 247 db 102,15,56,223,224 |
| 248 db 102,15,56,223,232 |
| 249 ret |
; -----------------------------------------------------------------------
; __aesni_encrypt6: internal helper, encrypts six blocks in parallel.
; Register interface (no stack arguments):
;   In:    edx = key schedule pointer, ecx = round count,
;          xmm2..xmm7 = the six blocks
;   Out:   xmm2..xmm7 = encrypted blocks
;   Clobb: ecx, edx, xmm0, xmm1, flags (callers must reload ecx/edx)
; db 102,15,56,220,M is aesenc and db 102,15,56,221,M is aesenclast;
; M = 209/217/225/233/241/249 applies xmm1 to xmm2..xmm7 and
; M = 208/216/224/232/240/248 applies xmm0 to the same lanes.
;
; Secondary entry point L$_aesni_encrypt6_enter: callers in this file jump
; in after performing the whitening and the first round themselves. At
; that label ecx must already hold the negative byte offset, edx the
; adjusted key pointer and xmm0 the key for the second round.
; -----------------------------------------------------------------------
| 250 align 16 |
| 251 __aesni_encrypt6: |
| 252 movups xmm0,[edx] |
| 253 shl ecx,4 |
| 254 movups xmm1,[16+edx] |
; Whitening is interleaved with the first aesenc round of the lanes that
; have already been whitened.
| 255 xorps xmm2,xmm0 |
| 256 pxor xmm3,xmm0 |
| 257 pxor xmm4,xmm0 |
| 258 db 102,15,56,220,209 |
| 259 pxor xmm5,xmm0 |
| 260 pxor xmm6,xmm0 |
| 261 db 102,15,56,220,217 |
| 262 lea edx,[32+ecx*1+edx] |
| 263 neg ecx |
| 264 db 102,15,56,220,225 |
| 265 pxor xmm7,xmm0 |
| 266 movups xmm0,[ecx*1+edx] |
| 267 add ecx,16 |
; Lanes xmm2..xmm4 already had their first round; join the loop body at
; the point where xmm5..xmm7 receive theirs.
| 268 jmp NEAR L$008_aesni_encrypt6_inner |
| 269 align 16 |
| 270 L$009enc6_loop: |
| 271 db 102,15,56,220,209 |
| 272 db 102,15,56,220,217 |
| 273 db 102,15,56,220,225 |
| 274 L$008_aesni_encrypt6_inner: |
| 275 db 102,15,56,220,233 |
| 276 db 102,15,56,220,241 |
| 277 db 102,15,56,220,249 |
| 278 L$_aesni_encrypt6_enter: |
| 279 movups xmm1,[ecx*1+edx] |
; Flags from this add drive the jnz below (movups does not alter flags).
| 280 add ecx,32 |
| 281 db 102,15,56,220,208 |
| 282 db 102,15,56,220,216 |
| 283 db 102,15,56,220,224 |
| 284 db 102,15,56,220,232 |
| 285 db 102,15,56,220,240 |
| 286 db 102,15,56,220,248 |
| 287 movups xmm0,[ecx*1+edx-16] |
| 288 jnz NEAR L$009enc6_loop |
; Last regular round with xmm1, then aesenclast with xmm0.
| 289 db 102,15,56,220,209 |
| 290 db 102,15,56,220,217 |
| 291 db 102,15,56,220,225 |
| 292 db 102,15,56,220,233 |
| 293 db 102,15,56,220,241 |
| 294 db 102,15,56,220,249 |
| 295 db 102,15,56,221,208 |
| 296 db 102,15,56,221,216 |
| 297 db 102,15,56,221,224 |
| 298 db 102,15,56,221,232 |
| 299 db 102,15,56,221,240 |
| 300 db 102,15,56,221,248 |
| 301 ret |
; -----------------------------------------------------------------------
; __aesni_decrypt6: internal helper, decrypts six blocks in parallel.
; Register interface (no stack arguments):
;   In:    edx = key schedule pointer, ecx = round count,
;          xmm2..xmm7 = the six blocks
;   Out:   xmm2..xmm7 = decrypted blocks
;   Clobb: ecx, edx, xmm0, xmm1, flags (callers must reload ecx/edx)
; db 102,15,56,222,M is aesdec and db 102,15,56,223,M is aesdeclast;
; M = 209/217/225/233/241/249 applies xmm1 to xmm2..xmm7 and
; M = 208/216/224/232/240/248 applies xmm0 to the same lanes.
;
; L$_aesni_decrypt6_enter is a secondary entry label placed after the
; first round; it expects ecx/edx/xmm0 to be prepared as at that point.
; -----------------------------------------------------------------------
| 302 align 16 |
| 303 __aesni_decrypt6: |
| 304 movups xmm0,[edx] |
| 305 shl ecx,4 |
| 306 movups xmm1,[16+edx] |
; Whitening is interleaved with the first aesdec round of the lanes that
; have already been whitened.
| 307 xorps xmm2,xmm0 |
| 308 pxor xmm3,xmm0 |
| 309 pxor xmm4,xmm0 |
| 310 db 102,15,56,222,209 |
| 311 pxor xmm5,xmm0 |
| 312 pxor xmm6,xmm0 |
| 313 db 102,15,56,222,217 |
| 314 lea edx,[32+ecx*1+edx] |
| 315 neg ecx |
| 316 db 102,15,56,222,225 |
| 317 pxor xmm7,xmm0 |
| 318 movups xmm0,[ecx*1+edx] |
| 319 add ecx,16 |
; Lanes xmm2..xmm4 already had their first round; join the loop body at
; the point where xmm5..xmm7 receive theirs.
| 320 jmp NEAR L$010_aesni_decrypt6_inner |
| 321 align 16 |
| 322 L$011dec6_loop: |
| 323 db 102,15,56,222,209 |
| 324 db 102,15,56,222,217 |
| 325 db 102,15,56,222,225 |
| 326 L$010_aesni_decrypt6_inner: |
| 327 db 102,15,56,222,233 |
| 328 db 102,15,56,222,241 |
| 329 db 102,15,56,222,249 |
| 330 L$_aesni_decrypt6_enter: |
| 331 movups xmm1,[ecx*1+edx] |
; Flags from this add drive the jnz below (movups does not alter flags).
| 332 add ecx,32 |
| 333 db 102,15,56,222,208 |
| 334 db 102,15,56,222,216 |
| 335 db 102,15,56,222,224 |
| 336 db 102,15,56,222,232 |
| 337 db 102,15,56,222,240 |
| 338 db 102,15,56,222,248 |
| 339 movups xmm0,[ecx*1+edx-16] |
| 340 jnz NEAR L$011dec6_loop |
; Last regular round with xmm1, then aesdeclast with xmm0.
| 341 db 102,15,56,222,209 |
| 342 db 102,15,56,222,217 |
| 343 db 102,15,56,222,225 |
| 344 db 102,15,56,222,233 |
| 345 db 102,15,56,222,241 |
| 346 db 102,15,56,222,249 |
| 347 db 102,15,56,223,208 |
| 348 db 102,15,56,223,216 |
| 349 db 102,15,56,223,224 |
| 350 db 102,15,56,223,232 |
| 351 db 102,15,56,223,240 |
| 352 db 102,15,56,223,248 |
| 353 ret |
; -----------------------------------------------------------------------
; _aesni_ecb_encrypt: ECB-mode bulk encryption/decryption.
; Stack arguments (offsets are after the four register pushes below):
;   [esp+20] = input pointer            -> esi
;   [esp+24] = output pointer           -> edi
;   [esp+28] = length in bytes          -> eax (rounded down to a multiple
;                                          of 16; zero means nothing to do)
;   [esp+32] = key schedule pointer     -> edx (round count at offset 240)
;   [esp+36] = direction flag           -> ebx (zero selects decryption)
; ebp/ebx keep copies of the key pointer and round count because the
; __aesni_* helpers clobber edx and ecx.
; ebp, ebx, esi, edi are saved/restored; xmm0-xmm7 are zeroed on exit.
; -----------------------------------------------------------------------
| 354 global _aesni_ecb_encrypt |
| 355 align 16 |
| 356 _aesni_ecb_encrypt: |
| 357 L$_aesni_ecb_encrypt_begin: |
| 358 push ebp |
| 359 push ebx |
| 360 push esi |
| 361 push edi |
| 362 mov esi,DWORD [20+esp] |
| 363 mov edi,DWORD [24+esp] |
| 364 mov eax,DWORD [28+esp] |
| 365 mov edx,DWORD [32+esp] |
| 366 mov ebx,DWORD [36+esp] |
; Drop any partial trailing block; bail out if no whole block remains.
| 367 and eax,-16 |
| 368 jz NEAR L$012ecb_ret |
| 369 mov ecx,DWORD [240+edx] |
| 370 test ebx,ebx |
| 371 jz NEAR L$013ecb_decrypt |
; ---- encryption path ----
| 372 mov ebp,edx |
| 373 mov ebx,ecx |
| 374 cmp eax,96 |
| 375 jb NEAR L$014ecb_enc_tail |
; Preload the first six blocks, then enter the pipelined loop.
| 376 movdqu xmm2,[esi] |
| 377 movdqu xmm3,[16+esi] |
| 378 movdqu xmm4,[32+esi] |
| 379 movdqu xmm5,[48+esi] |
| 380 movdqu xmm6,[64+esi] |
| 381 movdqu xmm7,[80+esi] |
| 382 lea esi,[96+esi] |
| 383 sub eax,96 |
| 384 jmp NEAR L$015ecb_enc_loop6_enter |
| 385 align 16 |
; Loop body: store the six results of the previous pass while loading the
; next six input blocks.
| 386 L$016ecb_enc_loop6: |
| 387 movups [edi],xmm2 |
| 388 movdqu xmm2,[esi] |
| 389 movups [16+edi],xmm3 |
| 390 movdqu xmm3,[16+esi] |
| 391 movups [32+edi],xmm4 |
| 392 movdqu xmm4,[32+esi] |
| 393 movups [48+edi],xmm5 |
| 394 movdqu xmm5,[48+esi] |
| 395 movups [64+edi],xmm6 |
| 396 movdqu xmm6,[64+esi] |
| 397 movups [80+edi],xmm7 |
| 398 lea edi,[96+edi] |
| 399 movdqu xmm7,[80+esi] |
| 400 lea esi,[96+esi] |
| 401 L$015ecb_enc_loop6_enter: |
| 402 call __aesni_encrypt6 |
; Restore key pointer and round count clobbered by the helper.
| 403 mov edx,ebp |
| 404 mov ecx,ebx |
; Continue while at least 96 more bytes remain (no borrow).
| 405 sub eax,96 |
| 406 jnc NEAR L$016ecb_enc_loop6 |
| 407 movups [edi],xmm2 |
| 408 movups [16+edi],xmm3 |
| 409 movups [32+edi],xmm4 |
| 410 movups [48+edi],xmm5 |
| 411 movups [64+edi],xmm6 |
| 412 movups [80+edi],xmm7 |
| 413 lea edi,[96+edi] |
; Undo the last subtraction; eax = remaining bytes (0..80).
| 414 add eax,96 |
| 415 jz NEAR L$012ecb_ret |
; Tail: 1 to 5 blocks remain. Each cmp is followed by a jb and, after a
; flag-preserving movups load, a je that reuses the same comparison.
| 416 L$014ecb_enc_tail: |
| 417 movups xmm2,[esi] |
| 418 cmp eax,32 |
| 419 jb NEAR L$017ecb_enc_one |
| 420 movups xmm3,[16+esi] |
| 421 je NEAR L$018ecb_enc_two |
| 422 movups xmm4,[32+esi] |
| 423 cmp eax,64 |
| 424 jb NEAR L$019ecb_enc_three |
| 425 movups xmm5,[48+esi] |
| 426 je NEAR L$020ecb_enc_four |
; Five blocks: run the six-lane helper with a zeroed sixth lane and store
; only the five real results.
| 427 movups xmm6,[64+esi] |
| 428 xorps xmm7,xmm7 |
| 429 call __aesni_encrypt6 |
| 430 movups [edi],xmm2 |
| 431 movups [16+edi],xmm3 |
| 432 movups [32+edi],xmm4 |
| 433 movups [48+edi],xmm5 |
| 434 movups [64+edi],xmm6 |
| 435 jmp NEAR L$012ecb_ret |
| 436 align 16 |
; One block: inline single-lane round loop
; (102,15,56,220,209 = aesenc xmm2,xmm1; 221 = aesenclast).
| 437 L$017ecb_enc_one: |
| 438 movups xmm0,[edx] |
| 439 movups xmm1,[16+edx] |
| 440 lea edx,[32+edx] |
| 441 xorps xmm2,xmm0 |
| 442 L$021enc1_loop_3: |
| 443 db 102,15,56,220,209 |
| 444 dec ecx |
| 445 movups xmm1,[edx] |
| 446 lea edx,[16+edx] |
| 447 jnz NEAR L$021enc1_loop_3 |
| 448 db 102,15,56,221,209 |
| 449 movups [edi],xmm2 |
| 450 jmp NEAR L$012ecb_ret |
| 451 align 16 |
| 452 L$018ecb_enc_two: |
| 453 call __aesni_encrypt2 |
| 454 movups [edi],xmm2 |
| 455 movups [16+edi],xmm3 |
| 456 jmp NEAR L$012ecb_ret |
| 457 align 16 |
| 458 L$019ecb_enc_three: |
| 459 call __aesni_encrypt3 |
| 460 movups [edi],xmm2 |
| 461 movups [16+edi],xmm3 |
| 462 movups [32+edi],xmm4 |
| 463 jmp NEAR L$012ecb_ret |
| 464 align 16 |
| 465 L$020ecb_enc_four: |
| 466 call __aesni_encrypt4 |
| 467 movups [edi],xmm2 |
| 468 movups [16+edi],xmm3 |
| 469 movups [32+edi],xmm4 |
| 470 movups [48+edi],xmm5 |
| 471 jmp NEAR L$012ecb_ret |
| 472 align 16 |
; ---- decryption path: mirrors the encryption path with the
; __aesni_decrypt* helpers ----
| 473 L$013ecb_decrypt: |
| 474 mov ebp,edx |
| 475 mov ebx,ecx |
| 476 cmp eax,96 |
| 477 jb NEAR L$022ecb_dec_tail |
| 478 movdqu xmm2,[esi] |
| 479 movdqu xmm3,[16+esi] |
| 480 movdqu xmm4,[32+esi] |
| 481 movdqu xmm5,[48+esi] |
| 482 movdqu xmm6,[64+esi] |
| 483 movdqu xmm7,[80+esi] |
| 484 lea esi,[96+esi] |
| 485 sub eax,96 |
| 486 jmp NEAR L$023ecb_dec_loop6_enter |
| 487 align 16 |
; Loop body: store previous results while loading the next six blocks.
| 488 L$024ecb_dec_loop6: |
| 489 movups [edi],xmm2 |
| 490 movdqu xmm2,[esi] |
| 491 movups [16+edi],xmm3 |
| 492 movdqu xmm3,[16+esi] |
| 493 movups [32+edi],xmm4 |
| 494 movdqu xmm4,[32+esi] |
| 495 movups [48+edi],xmm5 |
| 496 movdqu xmm5,[48+esi] |
| 497 movups [64+edi],xmm6 |
| 498 movdqu xmm6,[64+esi] |
| 499 movups [80+edi],xmm7 |
| 500 lea edi,[96+edi] |
| 501 movdqu xmm7,[80+esi] |
| 502 lea esi,[96+esi] |
| 503 L$023ecb_dec_loop6_enter: |
| 504 call __aesni_decrypt6 |
; Restore key pointer and round count clobbered by the helper.
| 505 mov edx,ebp |
| 506 mov ecx,ebx |
| 507 sub eax,96 |
| 508 jnc NEAR L$024ecb_dec_loop6 |
| 509 movups [edi],xmm2 |
| 510 movups [16+edi],xmm3 |
| 511 movups [32+edi],xmm4 |
| 512 movups [48+edi],xmm5 |
| 513 movups [64+edi],xmm6 |
| 514 movups [80+edi],xmm7 |
| 515 lea edi,[96+edi] |
; Undo the last subtraction; eax = remaining bytes (0..80).
| 516 add eax,96 |
| 517 jz NEAR L$012ecb_ret |
; Tail dispatch for 1 to 5 remaining blocks (same flag reuse as above).
| 518 L$022ecb_dec_tail: |
| 519 movups xmm2,[esi] |
| 520 cmp eax,32 |
| 521 jb NEAR L$025ecb_dec_one |
| 522 movups xmm3,[16+esi] |
| 523 je NEAR L$026ecb_dec_two |
| 524 movups xmm4,[32+esi] |
| 525 cmp eax,64 |
| 526 jb NEAR L$027ecb_dec_three |
| 527 movups xmm5,[48+esi] |
| 528 je NEAR L$028ecb_dec_four |
; Five blocks: six-lane helper with a zeroed sixth lane.
| 529 movups xmm6,[64+esi] |
| 530 xorps xmm7,xmm7 |
| 531 call __aesni_decrypt6 |
| 532 movups [edi],xmm2 |
| 533 movups [16+edi],xmm3 |
| 534 movups [32+edi],xmm4 |
| 535 movups [48+edi],xmm5 |
| 536 movups [64+edi],xmm6 |
| 537 jmp NEAR L$012ecb_ret |
| 538 align 16 |
; One block: inline single-lane round loop
; (102,15,56,222,209 = aesdec xmm2,xmm1; 223 = aesdeclast).
| 539 L$025ecb_dec_one: |
| 540 movups xmm0,[edx] |
| 541 movups xmm1,[16+edx] |
| 542 lea edx,[32+edx] |
| 543 xorps xmm2,xmm0 |
| 544 L$029dec1_loop_4: |
| 545 db 102,15,56,222,209 |
| 546 dec ecx |
| 547 movups xmm1,[edx] |
| 548 lea edx,[16+edx] |
| 549 jnz NEAR L$029dec1_loop_4 |
| 550 db 102,15,56,223,209 |
| 551 movups [edi],xmm2 |
| 552 jmp NEAR L$012ecb_ret |
| 553 align 16 |
| 554 L$026ecb_dec_two: |
| 555 call __aesni_decrypt2 |
| 556 movups [edi],xmm2 |
| 557 movups [16+edi],xmm3 |
| 558 jmp NEAR L$012ecb_ret |
| 559 align 16 |
| 560 L$027ecb_dec_three: |
| 561 call __aesni_decrypt3 |
| 562 movups [edi],xmm2 |
| 563 movups [16+edi],xmm3 |
| 564 movups [32+edi],xmm4 |
| 565 jmp NEAR L$012ecb_ret |
| 566 align 16 |
| 567 L$028ecb_dec_four: |
| 568 call __aesni_decrypt4 |
| 569 movups [edi],xmm2 |
| 570 movups [16+edi],xmm3 |
| 571 movups [32+edi],xmm4 |
| 572 movups [48+edi],xmm5 |
; Common exit: scrub all XMM registers, restore saved registers.
| 573 L$012ecb_ret: |
| 574 pxor xmm0,xmm0 |
| 575 pxor xmm1,xmm1 |
| 576 pxor xmm2,xmm2 |
| 577 pxor xmm3,xmm3 |
| 578 pxor xmm4,xmm4 |
| 579 pxor xmm5,xmm5 |
| 580 pxor xmm6,xmm6 |
| 581 pxor xmm7,xmm7 |
| 582 pop edi |
| 583 pop esi |
| 584 pop ebx |
| 585 pop ebp |
| 586 ret |
; -----------------------------------------------------------------------
; _aesni_ccm64_encrypt_blocks: CCM-style encrypt loop; per block it
; encrypts a counter lane (xmm2) and a running MAC lane (xmm3) together.
; Stack arguments (offsets are after the four register pushes below):
;   [esp+20] = input pointer         -> esi
;   [esp+24] = output pointer        -> edi
;   [esp+28] = number of blocks      -> eax (decremented once per block;
;              NOTE(review): a count of 0 is not checked before the loop)
;   [esp+32] = key schedule pointer  -> edx (round count at offset 240)
;   [esp+36] = pointer to the 16-byte counter block      -> xmm7
;   [esp+40] = pointer to the 16-byte MAC value (in/out) -> xmm3
; A 16-byte-aligned scratch frame is built on the stack:
;   [esp+0..15]  = pshufb mask 0F 0E ... 01 00 (reverses all 16 bytes)
;   [esp+16..31] = dwords {1,0,0,0}, added to the counter with paddq
;   [esp+48]     = caller's esp, restored before the pops
; ebp, ebx, esi, edi are saved/restored; xmm0-xmm7 are zeroed on exit.
; -----------------------------------------------------------------------
| 587 global _aesni_ccm64_encrypt_blocks |
| 588 align 16 |
| 589 _aesni_ccm64_encrypt_blocks: |
| 590 L$_aesni_ccm64_encrypt_blocks_begin: |
| 591 push ebp |
| 592 push ebx |
| 593 push esi |
| 594 push edi |
| 595 mov esi,DWORD [20+esp] |
| 596 mov edi,DWORD [24+esp] |
| 597 mov eax,DWORD [28+esp] |
| 598 mov edx,DWORD [32+esp] |
| 599 mov ebx,DWORD [36+esp] |
| 600 mov ecx,DWORD [40+esp] |
; Build the aligned scratch frame and remember the original esp in it.
| 601 mov ebp,esp |
| 602 sub esp,60 |
| 603 and esp,-16 |
| 604 mov DWORD [48+esp],ebp |
| 605 movdqu xmm7,[ebx] |
| 606 movdqu xmm3,[ecx] |
| 607 mov ecx,DWORD [240+edx] |
; 0x0C0D0E0F, 0x08090A0B, 0x04050607, 0x00010203: byte-reversal mask.
| 608 mov DWORD [esp],202182159 |
| 609 mov DWORD [4+esp],134810123 |
| 610 mov DWORD [8+esp],67438087 |
| 611 mov DWORD [12+esp],66051 |
; Counter increment constant {1,0,0,0}.
| 612 mov ebx,1 |
| 613 xor ebp,ebp |
| 614 mov DWORD [16+esp],ebx |
| 615 mov DWORD [20+esp],ebp |
| 616 mov DWORD [24+esp],ebp |
| 617 mov DWORD [28+esp],ebp |
; ebx = 16 - 16*rounds (initial loop offset), ebp = key schedule base,
; edx = key schedule base + 32 + 16*rounds.
| 618 shl ecx,4 |
| 619 mov ebx,16 |
| 620 lea ebp,[edx] |
| 621 movdqa xmm5,[esp] |
; xmm2 keeps the counter block in its original byte order.
| 622 movdqa xmm2,xmm7 |
| 623 lea edx,[32+ecx*1+edx] |
| 624 sub ebx,ecx |
; pshufb xmm7,xmm5: keep the counter byte-reversed for the paddq below.
| 625 db 102,15,56,0,253 |
; Per-block loop.
| 626 L$030ccm64_enc_outer: |
| 627 movups xmm0,[ebp] |
| 628 mov ecx,ebx |
| 629 movups xmm6,[esi] |
; Counter lane: xmm2 ^= rk0. MAC lane: xmm3 ^= (input ^ rk0).
| 630 xorps xmm2,xmm0 |
| 631 movups xmm1,[16+ebp] |
| 632 xorps xmm0,xmm6 |
| 633 xorps xmm3,xmm0 |
| 634 movups xmm0,[32+ebp] |
; Two-lane round loop (aesenc on xmm2 and xmm3, keys alternate xmm1/xmm0).
| 635 L$031ccm64_enc2_loop: |
| 636 db 102,15,56,220,209 |
| 637 db 102,15,56,220,217 |
| 638 movups xmm1,[ecx*1+edx] |
| 639 add ecx,32 |
| 640 db 102,15,56,220,208 |
| 641 db 102,15,56,220,216 |
| 642 movups xmm0,[ecx*1+edx-16] |
| 643 jnz NEAR L$031ccm64_enc2_loop |
| 644 db 102,15,56,220,209 |
| 645 db 102,15,56,220,217 |
; Advance the byte-reversed counter; "dec eax" sets the flags tested by
; the jnz at the bottom (the instructions in between preserve ZF).
| 646 paddq xmm7,[16+esp] |
| 647 dec eax |
; aesenclast on both lanes.
| 648 db 102,15,56,221,208 |
| 649 db 102,15,56,221,216 |
| 650 lea esi,[16+esi] |
; Output block = input ^ encrypted counter.
| 651 xorps xmm6,xmm2 |
| 652 movdqa xmm2,xmm7 |
| 653 movups [edi],xmm6 |
; pshufb xmm2,xmm5: next counter back in original byte order.
| 654 db 102,15,56,0,213 |
| 655 lea edi,[16+edi] |
| 656 jnz NEAR L$030ccm64_enc_outer |
; Restore the caller's esp, then write the MAC back through argument 6.
| 657 mov esp,DWORD [48+esp] |
| 658 mov edi,DWORD [40+esp] |
| 659 movups [edi],xmm3 |
| 660 pxor xmm0,xmm0 |
| 661 pxor xmm1,xmm1 |
| 662 pxor xmm2,xmm2 |
| 663 pxor xmm3,xmm3 |
| 664 pxor xmm4,xmm4 |
| 665 pxor xmm5,xmm5 |
| 666 pxor xmm6,xmm6 |
| 667 pxor xmm7,xmm7 |
| 668 pop edi |
| 669 pop esi |
| 670 pop ebx |
| 671 pop ebp |
| 672 ret |
; -----------------------------------------------------------------------
; _aesni_ccm64_decrypt_blocks: CCM-style decrypt loop. The first counter
; block is encrypted on its own; afterwards each iteration encrypts the
; next counter (xmm2) together with the running MAC lane (xmm3), which is
; fed with the just-recovered output block.
; Stack arguments (offsets are after the four register pushes below):
;   [esp+20] = input pointer         -> esi
;   [esp+24] = output pointer        -> edi
;   [esp+28] = number of blocks      -> eax
;              NOTE(review): a count of 0 is not checked before the loop
;   [esp+32] = key schedule pointer  -> edx (round count at offset 240)
;   [esp+36] = pointer to the 16-byte counter block      -> xmm7
;   [esp+40] = pointer to the 16-byte MAC value (in/out) -> xmm3
; Scratch frame (16-byte aligned):
;   [esp+0..15]  = pshufb mask 0F 0E ... 01 00 (reverses all 16 bytes)
;   [esp+16..31] = dwords {1,0,0,0}, added to the counter with paddq
;   [esp+48]     = caller's esp
; Only AES *encryption* opcodes are used here (aesenc/aesenclast).
; ebp, ebx, esi, edi are saved/restored; xmm0-xmm7 are zeroed on exit.
; -----------------------------------------------------------------------
| 673 global _aesni_ccm64_decrypt_blocks |
| 674 align 16 |
| 675 _aesni_ccm64_decrypt_blocks: |
| 676 L$_aesni_ccm64_decrypt_blocks_begin: |
| 677 push ebp |
| 678 push ebx |
| 679 push esi |
| 680 push edi |
| 681 mov esi,DWORD [20+esp] |
| 682 mov edi,DWORD [24+esp] |
| 683 mov eax,DWORD [28+esp] |
| 684 mov edx,DWORD [32+esp] |
| 685 mov ebx,DWORD [36+esp] |
| 686 mov ecx,DWORD [40+esp] |
; Build the aligned scratch frame and remember the original esp in it.
| 687 mov ebp,esp |
| 688 sub esp,60 |
| 689 and esp,-16 |
| 690 mov DWORD [48+esp],ebp |
| 691 movdqu xmm7,[ebx] |
| 692 movdqu xmm3,[ecx] |
| 693 mov ecx,DWORD [240+edx] |
; 0x0C0D0E0F, 0x08090A0B, 0x04050607, 0x00010203: byte-reversal mask.
| 694 mov DWORD [esp],202182159 |
| 695 mov DWORD [4+esp],134810123 |
| 696 mov DWORD [8+esp],67438087 |
| 697 mov DWORD [12+esp],66051 |
; Counter increment constant {1,0,0,0}.
| 698 mov ebx,1 |
| 699 xor ebp,ebp |
| 700 mov DWORD [16+esp],ebx |
| 701 mov DWORD [20+esp],ebp |
| 702 mov DWORD [24+esp],ebp |
| 703 mov DWORD [28+esp],ebp |
| 704 movdqa xmm5,[esp] |
; xmm2 = counter block in original byte order; ebp/ebx keep the key
; pointer and round count for later reloads.
| 705 movdqa xmm2,xmm7 |
| 706 mov ebp,edx |
| 707 mov ebx,ecx |
; pshufb xmm7,xmm5: byte-reversed counter used for paddq increments.
| 708 db 102,15,56,0,253 |
; Encrypt the first counter block (single lane, aesenc xmm2,xmm1).
| 709 movups xmm0,[edx] |
| 710 movups xmm1,[16+edx] |
| 711 lea edx,[32+edx] |
| 712 xorps xmm2,xmm0 |
| 713 L$032enc1_loop_5: |
| 714 db 102,15,56,220,209 |
| 715 dec ecx |
| 716 movups xmm1,[edx] |
| 717 lea edx,[16+edx] |
| 718 jnz NEAR L$032enc1_loop_5 |
| 719 db 102,15,56,221,209 |
; Prepare the two-lane loop: ebx = 16 - 16*rounds, edx = key base + 32 +
; 16*rounds; load the first input block and advance the counter.
| 720 shl ebx,4 |
| 721 mov ecx,16 |
| 722 movups xmm6,[esi] |
| 723 paddq xmm7,[16+esp] |
| 724 lea esi,[16+esi] |
| 725 sub ecx,ebx |
| 726 lea edx,[32+ebx*1+ebp] |
| 727 mov ebx,ecx |
| 728 jmp NEAR L$033ccm64_dec_outer |
| 729 align 16 |
; Per-block loop: xmm6 (input) ^ xmm2 (encrypted counter) is the output.
| 730 L$033ccm64_dec_outer: |
| 731 xorps xmm6,xmm2 |
| 732 movdqa xmm2,xmm7 |
| 733 movups [edi],xmm6 |
| 734 lea edi,[16+edi] |
; pshufb xmm2,xmm5: next counter back in original byte order.
| 735 db 102,15,56,0,213 |
| 736 sub eax,1 |
| 737 jz NEAR L$034ccm64_dec_break |
| 738 movups xmm0,[ebp] |
| 739 mov ecx,ebx |
| 740 movups xmm1,[16+ebp] |
; MAC lane: xmm3 ^= (output block ^ rk0). Counter lane: xmm2 ^= rk0.
| 741 xorps xmm6,xmm0 |
| 742 xorps xmm2,xmm0 |
| 743 xorps xmm3,xmm6 |
| 744 movups xmm0,[32+ebp] |
; Two-lane round loop (aesenc on xmm2 and xmm3).
| 745 L$035ccm64_dec2_loop: |
| 746 db 102,15,56,220,209 |
| 747 db 102,15,56,220,217 |
| 748 movups xmm1,[ecx*1+edx] |
| 749 add ecx,32 |
| 750 db 102,15,56,220,208 |
| 751 db 102,15,56,220,216 |
| 752 movups xmm0,[ecx*1+edx-16] |
| 753 jnz NEAR L$035ccm64_dec2_loop |
; Fetch the next input block and advance the counter while finishing the
; last two rounds (aesenc then aesenclast on both lanes).
| 754 movups xmm6,[esi] |
| 755 paddq xmm7,[16+esp] |
| 756 db 102,15,56,220,209 |
| 757 db 102,15,56,220,217 |
| 758 db 102,15,56,221,208 |
| 759 db 102,15,56,221,216 |
| 760 lea esi,[16+esi] |
| 761 jmp NEAR L$033ccm64_dec_outer |
| 762 align 16 |
; Last block done: fold it into the MAC and run one final single-lane
; encryption of xmm3 (102,15,56,220,217 = aesenc xmm3,xmm1).
| 763 L$034ccm64_dec_break: |
| 764 mov ecx,DWORD [240+ebp] |
| 765 mov edx,ebp |
| 766 movups xmm0,[edx] |
| 767 movups xmm1,[16+edx] |
| 768 xorps xmm6,xmm0 |
| 769 lea edx,[32+edx] |
| 770 xorps xmm3,xmm6 |
| 771 L$036enc1_loop_6: |
| 772 db 102,15,56,220,217 |
| 773 dec ecx |
| 774 movups xmm1,[edx] |
| 775 lea edx,[16+edx] |
| 776 jnz NEAR L$036enc1_loop_6 |
| 777 db 102,15,56,221,217 |
; Restore the caller's esp, then write the MAC back through argument 6.
| 778 mov esp,DWORD [48+esp] |
| 779 mov edi,DWORD [40+esp] |
| 780 movups [edi],xmm3 |
| 781 pxor xmm0,xmm0 |
| 782 pxor xmm1,xmm1 |
| 783 pxor xmm2,xmm2 |
| 784 pxor xmm3,xmm3 |
| 785 pxor xmm4,xmm4 |
| 786 pxor xmm5,xmm5 |
| 787 pxor xmm6,xmm6 |
| 788 pxor xmm7,xmm7 |
| 789 pop edi |
| 790 pop esi |
| 791 pop ebx |
| 792 pop ebp |
| 793 ret |
; -----------------------------------------------------------------------
; _aesni_ctr32_encrypt_blocks: counter-mode keystream XOR. The last dword
; of the counter block is extracted, byte-swapped and incremented as a
; 32-bit counter.
; Stack arguments (offsets are after the four register pushes below):
;   [esp+20] = input pointer          -> esi
;   [esp+24] = output pointer         -> edi
;   [esp+28] = number of blocks       -> eax
;              NOTE(review): a count of 0 is not special-cased - confirm
;              that callers never pass 0
;   [esp+32] = key schedule pointer   -> edx (round count at offset 240)
;   [esp+36] = pointer to the 16-byte counter block -> ebx
; Scratch frame (16-byte aligned):
;   [esp+0..15]  = pshufb mask 0F 0E ... 01 00 (reverses all 16 bytes)
;   [esp+16..31] = dwords {6,6,6,0}, per-pass counter increment
;   [esp+32..47] = counter block (counter dword cleared) ^ round key 0
;   [esp+48..63] = counters n, n+1, n+2 (native byte order)
;   [esp+64..79] = counters n+3, n+4, n+5 (native byte order)
;   [esp+80]     = caller's esp
; ebp, ebx, esi, edi are saved/restored; on exit xmm0-xmm7 are zeroed and
; the scratch slots at [esp+32..79] are wiped.
; -----------------------------------------------------------------------
| 794 global _aesni_ctr32_encrypt_blocks |
| 795 align 16 |
| 796 _aesni_ctr32_encrypt_blocks: |
| 797 L$_aesni_ctr32_encrypt_blocks_begin: |
| 798 push ebp |
| 799 push ebx |
| 800 push esi |
| 801 push edi |
| 802 mov esi,DWORD [20+esp] |
| 803 mov edi,DWORD [24+esp] |
| 804 mov eax,DWORD [28+esp] |
| 805 mov edx,DWORD [32+esp] |
| 806 mov ebx,DWORD [36+esp] |
; Build the aligned scratch frame and remember the original esp in it.
| 807 mov ebp,esp |
| 808 sub esp,88 |
| 809 and esp,-16 |
| 810 mov DWORD [80+esp],ebp |
; Exactly one block: skip all counter-vector setup.
| 811 cmp eax,1 |
| 812 je NEAR L$037ctr32_one_shortcut |
| 813 movdqu xmm7,[ebx] |
; 0x0C0D0E0F, 0x08090A0B, 0x04050607, 0x00010203: byte-reversal mask.
| 814 mov DWORD [esp],202182159 |
| 815 mov DWORD [4+esp],134810123 |
| 816 mov DWORD [8+esp],67438087 |
| 817 mov DWORD [12+esp],66051 |
; Increment vector {6,6,6,0}.
| 818 mov ecx,6 |
| 819 xor ebp,ebp |
| 820 mov DWORD [16+esp],ecx |
| 821 mov DWORD [20+esp],ecx |
| 822 mov DWORD [24+esp],ecx |
| 823 mov DWORD [28+esp],ebp |
; pextrd ebx,xmm7,3 : pull the counter dword out of the counter block.
| 824 db 102,15,58,22,251,3 |
; pinsrd xmm7,ebp,3 : clear that dword in xmm7 (ebp is 0 here).
| 825 db 102,15,58,34,253,3 |
| 826 mov ecx,DWORD [240+edx] |
| 827 bswap ebx |
| 828 pxor xmm0,xmm0 |
| 829 pxor xmm1,xmm1 |
| 830 movdqa xmm2,[esp] |
; Fill xmm0 dwords 0..2 with n, n+1, n+2 and xmm1 dwords 0..2 with
; n+3, n+4, n+5 (each db below is "pinsrd xmm0/xmm1, ebx/ebp, index").
| 831 db 102,15,58,34,195,0 |
| 832 lea ebp,[3+ebx] |
| 833 db 102,15,58,34,205,0 |
| 834 inc ebx |
| 835 db 102,15,58,34,195,1 |
| 836 inc ebp |
| 837 db 102,15,58,34,205,1 |
| 838 inc ebx |
| 839 db 102,15,58,34,195,2 |
| 840 inc ebp |
| 841 db 102,15,58,34,205,2 |
; Save the native-order counters, then byte-reverse the working copies
; (pshufb xmm0,xmm2 / pshufb xmm1,xmm2).
| 842 movdqa [48+esp],xmm0 |
| 843 db 102,15,56,0,194 |
| 844 movdqu xmm6,[edx] |
| 845 movdqa [64+esp],xmm1 |
| 846 db 102,15,56,0,202 |
; Broadcast individual counters into per-block lanes.
| 847 pshufd xmm2,xmm0,192 |
| 848 pshufd xmm3,xmm0,128 |
| 849 cmp eax,6 |
| 850 jb NEAR L$038ctr32_tail |
; Six or more blocks: pre-xor the counter block with round key 0 (xmm6)
; and set up ebx = 16 - 16*rounds, ebp = key base, edx = key base + 32 +
; 16*rounds for L$_aesni_encrypt6_enter.
| 851 pxor xmm7,xmm6 |
| 852 shl ecx,4 |
| 853 mov ebx,16 |
| 854 movdqa [32+esp],xmm7 |
| 855 mov ebp,edx |
| 856 sub ebx,ecx |
| 857 lea edx,[32+ecx*1+edx] |
| 858 sub eax,6 |
| 859 jmp NEAR L$039ctr32_loop6 |
| 860 align 16 |
; Main loop: six counter blocks per pass. Whitening and the first aesenc
; round are done inline, the remaining rounds via the helper's secondary
; entry point.
| 861 L$039ctr32_loop6: |
| 862 pshufd xmm4,xmm0,64 |
| 863 movdqa xmm0,[32+esp] |
| 864 pshufd xmm5,xmm1,192 |
| 865 pxor xmm2,xmm0 |
| 866 pshufd xmm6,xmm1,128 |
| 867 pxor xmm3,xmm0 |
| 868 pshufd xmm7,xmm1,64 |
| 869 movups xmm1,[16+ebp] |
| 870 pxor xmm4,xmm0 |
| 871 pxor xmm5,xmm0 |
| 872 db 102,15,56,220,209 |
| 873 pxor xmm6,xmm0 |
| 874 pxor xmm7,xmm0 |
| 875 db 102,15,56,220,217 |
| 876 movups xmm0,[32+ebp] |
| 877 mov ecx,ebx |
| 878 db 102,15,56,220,225 |
| 879 db 102,15,56,220,233 |
| 880 db 102,15,56,220,241 |
| 881 db 102,15,56,220,249 |
| 882 call L$_aesni_encrypt6_enter |
; XOR keystream with input and store, interleaved with advancing both
; saved counter vectors by 6 and rebuilding the byte-reversed copies.
| 883 movups xmm1,[esi] |
| 884 movups xmm0,[16+esi] |
| 885 xorps xmm2,xmm1 |
| 886 movups xmm1,[32+esi] |
| 887 xorps xmm3,xmm0 |
| 888 movups [edi],xmm2 |
| 889 movdqa xmm0,[16+esp] |
| 890 xorps xmm4,xmm1 |
| 891 movdqa xmm1,[64+esp] |
| 892 movups [16+edi],xmm3 |
| 893 movups [32+edi],xmm4 |
| 894 paddd xmm1,xmm0 |
| 895 paddd xmm0,[48+esp] |
| 896 movdqa xmm2,[esp] |
| 897 movups xmm3,[48+esi] |
| 898 movups xmm4,[64+esi] |
| 899 xorps xmm5,xmm3 |
| 900 movups xmm3,[80+esi] |
| 901 lea esi,[96+esi] |
| 902 movdqa [48+esp],xmm0 |
| 903 db 102,15,56,0,194 |
| 904 xorps xmm6,xmm4 |
| 905 movups [48+edi],xmm5 |
| 906 xorps xmm7,xmm3 |
| 907 movdqa [64+esp],xmm1 |
| 908 db 102,15,56,0,202 |
| 909 movups [64+edi],xmm6 |
| 910 pshufd xmm2,xmm0,192 |
| 911 movups [80+edi],xmm7 |
| 912 lea edi,[96+edi] |
| 913 pshufd xmm3,xmm0,128 |
; Continue while at least six more blocks remain (no borrow).
| 914 sub eax,6 |
| 915 jnc NEAR L$039ctr32_loop6 |
| 916 add eax,6 |
| 917 jz NEAR L$040ctr32_ret |
; Leaving the loop with 1..5 blocks left: xor round key 0 back out of the
; saved counter block and restore edx/ecx for the generic helpers.
| 918 movdqu xmm7,[ebp] |
| 919 mov edx,ebp |
| 920 pxor xmm7,[32+esp] |
| 921 mov ecx,DWORD [240+ebp] |
; Tail: merge the counter block (counter dword cleared) into each counter
; lane with por. por/pshufd preserve flags, so each je reuses the
; preceding cmp.
| 922 L$038ctr32_tail: |
| 923 por xmm2,xmm7 |
| 924 cmp eax,2 |
| 925 jb NEAR L$041ctr32_one |
| 926 pshufd xmm4,xmm0,64 |
| 927 por xmm3,xmm7 |
| 928 je NEAR L$042ctr32_two |
| 929 pshufd xmm5,xmm1,192 |
| 930 por xmm4,xmm7 |
| 931 cmp eax,4 |
| 932 jb NEAR L$043ctr32_three |
| 933 pshufd xmm6,xmm1,128 |
| 934 por xmm5,xmm7 |
| 935 je NEAR L$044ctr32_four |
; Five blocks: six-lane helper; only five results are stored (the sixth
; lane xmm7 is encrypted but discarded).
| 936 por xmm6,xmm7 |
| 937 call __aesni_encrypt6 |
| 938 movups xmm1,[esi] |
| 939 movups xmm0,[16+esi] |
| 940 xorps xmm2,xmm1 |
| 941 movups xmm1,[32+esi] |
| 942 xorps xmm3,xmm0 |
| 943 movups xmm0,[48+esi] |
| 944 xorps xmm4,xmm1 |
| 945 movups xmm1,[64+esi] |
| 946 xorps xmm5,xmm0 |
| 947 movups [edi],xmm2 |
| 948 xorps xmm6,xmm1 |
| 949 movups [16+edi],xmm3 |
| 950 movups [32+edi],xmm4 |
| 951 movups [48+edi],xmm5 |
| 952 movups [64+edi],xmm6 |
| 953 jmp NEAR L$040ctr32_ret |
| 954 align 16 |
; Single-block shortcut: use the caller's counter block as-is.
| 955 L$037ctr32_one_shortcut: |
| 956 movups xmm2,[ebx] |
| 957 mov ecx,DWORD [240+edx] |
; One block: inline single-lane round loop
; (102,15,56,220,209 = aesenc xmm2,xmm1; 221 = aesenclast).
| 958 L$041ctr32_one: |
| 959 movups xmm0,[edx] |
| 960 movups xmm1,[16+edx] |
| 961 lea edx,[32+edx] |
| 962 xorps xmm2,xmm0 |
| 963 L$045enc1_loop_7: |
| 964 db 102,15,56,220,209 |
| 965 dec ecx |
| 966 movups xmm1,[edx] |
| 967 lea edx,[16+edx] |
| 968 jnz NEAR L$045enc1_loop_7 |
| 969 db 102,15,56,221,209 |
| 970 movups xmm6,[esi] |
| 971 xorps xmm6,xmm2 |
| 972 movups [edi],xmm6 |
| 973 jmp NEAR L$040ctr32_ret |
| 974 align 16 |
| 975 L$042ctr32_two: |
| 976 call __aesni_encrypt2 |
| 977 movups xmm5,[esi] |
| 978 movups xmm6,[16+esi] |
| 979 xorps xmm2,xmm5 |
| 980 xorps xmm3,xmm6 |
| 981 movups [edi],xmm2 |
| 982 movups [16+edi],xmm3 |
| 983 jmp NEAR L$040ctr32_ret |
| 984 align 16 |
| 985 L$043ctr32_three: |
| 986 call __aesni_encrypt3 |
| 987 movups xmm5,[esi] |
| 988 movups xmm6,[16+esi] |
| 989 xorps xmm2,xmm5 |
| 990 movups xmm7,[32+esi] |
| 991 xorps xmm3,xmm6 |
| 992 movups [edi],xmm2 |
| 993 xorps xmm4,xmm7 |
| 994 movups [16+edi],xmm3 |
| 995 movups [32+edi],xmm4 |
| 996 jmp NEAR L$040ctr32_ret |
| 997 align 16 |
| 998 L$044ctr32_four: |
| 999 call __aesni_encrypt4 |
| 1000 movups xmm6,[esi] |
| 1001 movups xmm7,[16+esi] |
| 1002 movups xmm1,[32+esi] |
| 1003 xorps xmm2,xmm6 |
| 1004 movups xmm0,[48+esi] |
| 1005 xorps xmm3,xmm7 |
| 1006 movups [edi],xmm2 |
| 1007 xorps xmm4,xmm1 |
| 1008 movups [16+edi],xmm3 |
| 1009 xorps xmm5,xmm0 |
| 1010 movups [32+edi],xmm4 |
| 1011 movups [48+edi],xmm5 |
; Common exit: scrub XMM registers and the stack slots that held counter
; and key-derived data, then restore the caller's esp and registers.
| 1012 L$040ctr32_ret: |
| 1013 pxor xmm0,xmm0 |
| 1014 pxor xmm1,xmm1 |
| 1015 pxor xmm2,xmm2 |
| 1016 pxor xmm3,xmm3 |
| 1017 pxor xmm4,xmm4 |
| 1018 movdqa [32+esp],xmm0 |
| 1019 pxor xmm5,xmm5 |
| 1020 movdqa [48+esp],xmm0 |
| 1021 pxor xmm6,xmm6 |
| 1022 movdqa [64+esp],xmm0 |
| 1023 pxor xmm7,xmm7 |
| 1024 mov esp,DWORD [80+esp] |
| 1025 pop edi |
| 1026 pop esi |
| 1027 pop ebx |
| 1028 pop ebp |
| 1029 ret |
| 1030 global _aesni_xts_encrypt |
| 1031 align 16 |
| 1032 _aesni_xts_encrypt: |
| 1033 L$_aesni_xts_encrypt_begin: |
| 1034 push ebp |
| 1035 push ebx |
| 1036 push esi |
| 1037 push edi |
| 1038 mov edx,DWORD [36+esp] |
| 1039 mov esi,DWORD [40+esp] |
| 1040 mov ecx,DWORD [240+edx] |
| 1041 movups xmm2,[esi] |
| 1042 movups xmm0,[edx] |
| 1043 movups xmm1,[16+edx] |
| 1044 lea edx,[32+edx] |
| 1045 xorps xmm2,xmm0 |
| 1046 L$046enc1_loop_8: |
| 1047 db 102,15,56,220,209 |
| 1048 dec ecx |
| 1049 movups xmm1,[edx] |
| 1050 lea edx,[16+edx] |
| 1051 jnz NEAR L$046enc1_loop_8 |
| 1052 db 102,15,56,221,209 |
| 1053 mov esi,DWORD [20+esp] |
| 1054 mov edi,DWORD [24+esp] |
| 1055 mov eax,DWORD [28+esp] |
| 1056 mov edx,DWORD [32+esp] |
| 1057 mov ebp,esp |
| 1058 sub esp,120 |
| 1059 mov ecx,DWORD [240+edx] |
| 1060 and esp,-16 |
| 1061 mov DWORD [96+esp],135 |
| 1062 mov DWORD [100+esp],0 |
| 1063 mov DWORD [104+esp],1 |
| 1064 mov DWORD [108+esp],0 |
| 1065 mov DWORD [112+esp],eax |
| 1066 mov DWORD [116+esp],ebp |
| 1067 movdqa xmm1,xmm2 |
| 1068 pxor xmm0,xmm0 |
| 1069 movdqa xmm3,[96+esp] |
| 1070 pcmpgtd xmm0,xmm1 |
| 1071 and eax,-16 |
| 1072 mov ebp,edx |
| 1073 mov ebx,ecx |
| 1074 sub eax,96 |
| 1075 jc NEAR L$047xts_enc_short |
| 1076 shl ecx,4 |
| 1077 mov ebx,16 |
| 1078 sub ebx,ecx |
| 1079 lea edx,[32+ecx*1+edx] |
| 1080 jmp NEAR L$048xts_enc_loop6 |
| 1081 align 16 |
| 1082 L$048xts_enc_loop6: |
| 1083 pshufd xmm2,xmm0,19 |
| 1084 pxor xmm0,xmm0 |
| 1085 movdqa [esp],xmm1 |
| 1086 paddq xmm1,xmm1 |
| 1087 pand xmm2,xmm3 |
| 1088 pcmpgtd xmm0,xmm1 |
| 1089 pxor xmm1,xmm2 |
| 1090 pshufd xmm2,xmm0,19 |
| 1091 pxor xmm0,xmm0 |
| 1092 movdqa [16+esp],xmm1 |
| 1093 paddq xmm1,xmm1 |
| 1094 pand xmm2,xmm3 |
| 1095 pcmpgtd xmm0,xmm1 |
| 1096 pxor xmm1,xmm2 |
| 1097 pshufd xmm2,xmm0,19 |
| 1098 pxor xmm0,xmm0 |
| 1099 movdqa [32+esp],xmm1 |
| 1100 paddq xmm1,xmm1 |
| 1101 pand xmm2,xmm3 |
| 1102 pcmpgtd xmm0,xmm1 |
| 1103 pxor xmm1,xmm2 |
| 1104 pshufd xmm2,xmm0,19 |
| 1105 pxor xmm0,xmm0 |
| 1106 movdqa [48+esp],xmm1 |
| 1107 paddq xmm1,xmm1 |
| 1108 pand xmm2,xmm3 |
| 1109 pcmpgtd xmm0,xmm1 |
| 1110 pxor xmm1,xmm2 |
| 1111 pshufd xmm7,xmm0,19 |
| 1112 movdqa [64+esp],xmm1 |
| 1113 paddq xmm1,xmm1 |
| 1114 movups xmm0,[ebp] |
| 1115 pand xmm7,xmm3 |
| 1116 movups xmm2,[esi] |
| 1117 pxor xmm7,xmm1 |
| 1118 mov ecx,ebx |
| 1119 movdqu xmm3,[16+esi] |
| 1120 xorps xmm2,xmm0 |
| 1121 movdqu xmm4,[32+esi] |
| 1122 pxor xmm3,xmm0 |
| 1123 movdqu xmm5,[48+esi] |
| 1124 pxor xmm4,xmm0 |
| 1125 movdqu xmm6,[64+esi] |
| 1126 pxor xmm5,xmm0 |
| 1127 movdqu xmm1,[80+esi] |
| 1128 pxor xmm6,xmm0 |
| 1129 lea esi,[96+esi] |
| 1130 pxor xmm2,[esp] |
| 1131 movdqa [80+esp],xmm7 |
| 1132 pxor xmm7,xmm1 |
| 1133 movups xmm1,[16+ebp] |
| 1134 pxor xmm3,[16+esp] |
| 1135 pxor xmm4,[32+esp] |
| 1136 db 102,15,56,220,209 |
| 1137 pxor xmm5,[48+esp] |
| 1138 pxor xmm6,[64+esp] |
| 1139 db 102,15,56,220,217 |
| 1140 pxor xmm7,xmm0 |
| 1141 movups xmm0,[32+ebp] |
| 1142 db 102,15,56,220,225 |
| 1143 db 102,15,56,220,233 |
| 1144 db 102,15,56,220,241 |
| 1145 db 102,15,56,220,249 |
| 1146 call L$_aesni_encrypt6_enter |
| 1147 movdqa xmm1,[80+esp] |
| 1148 pxor xmm0,xmm0 |
| 1149 xorps xmm2,[esp] |
| 1150 pcmpgtd xmm0,xmm1 |
| 1151 xorps xmm3,[16+esp] |
| 1152 movups [edi],xmm2 |
| 1153 xorps xmm4,[32+esp] |
| 1154 movups [16+edi],xmm3 |
| 1155 xorps xmm5,[48+esp] |
| 1156 movups [32+edi],xmm4 |
| 1157 xorps xmm6,[64+esp] |
| 1158 movups [48+edi],xmm5 |
| 1159 xorps xmm7,xmm1 |
| 1160 movups [64+edi],xmm6 |
| 1161 pshufd xmm2,xmm0,19 |
| 1162 movups [80+edi],xmm7 |
| 1163 lea edi,[96+edi] |
| 1164 movdqa xmm3,[96+esp] |
| 1165 pxor xmm0,xmm0 |
| 1166 paddq xmm1,xmm1 |
| 1167 pand xmm2,xmm3 |
| 1168 pcmpgtd xmm0,xmm1 |
| 1169 pxor xmm1,xmm2 |
| 1170 sub eax,96 |
| 1171 jnc NEAR L$048xts_enc_loop6 |
| 1172 mov ecx,DWORD [240+ebp] |
| 1173 mov edx,ebp |
| 1174 mov ebx,ecx |
| 1175 L$047xts_enc_short: |
| 1176 add eax,96 |
| 1177 jz NEAR L$049xts_enc_done6x |
| 1178 movdqa xmm5,xmm1 |
| 1179 cmp eax,32 |
| 1180 jb NEAR L$050xts_enc_one |
| 1181 pshufd xmm2,xmm0,19 |
| 1182 pxor xmm0,xmm0 |
| 1183 paddq xmm1,xmm1 |
| 1184 pand xmm2,xmm3 |
| 1185 pcmpgtd xmm0,xmm1 |
| 1186 pxor xmm1,xmm2 |
| 1187 je NEAR L$051xts_enc_two |
| 1188 pshufd xmm2,xmm0,19 |
| 1189 pxor xmm0,xmm0 |
| 1190 movdqa xmm6,xmm1 |
| 1191 paddq xmm1,xmm1 |
| 1192 pand xmm2,xmm3 |
| 1193 pcmpgtd xmm0,xmm1 |
| 1194 pxor xmm1,xmm2 |
| 1195 cmp eax,64 |
| 1196 jb NEAR L$052xts_enc_three |
| 1197 pshufd xmm2,xmm0,19 |
| 1198 pxor xmm0,xmm0 |
| 1199 movdqa xmm7,xmm1 |
| 1200 paddq xmm1,xmm1 |
| 1201 pand xmm2,xmm3 |
| 1202 pcmpgtd xmm0,xmm1 |
| 1203 pxor xmm1,xmm2 |
| 1204 movdqa [esp],xmm5 |
| 1205 movdqa [16+esp],xmm6 |
| 1206 je NEAR L$053xts_enc_four |
| 1207 movdqa [32+esp],xmm7 |
| 1208 pshufd xmm7,xmm0,19 |
| 1209 movdqa [48+esp],xmm1 |
| 1210 paddq xmm1,xmm1 |
| 1211 pand xmm7,xmm3 |
| 1212 pxor xmm7,xmm1 |
| 1213 movdqu xmm2,[esi] |
| 1214 movdqu xmm3,[16+esi] |
| 1215 movdqu xmm4,[32+esi] |
| 1216 pxor xmm2,[esp] |
| 1217 movdqu xmm5,[48+esi] |
| 1218 pxor xmm3,[16+esp] |
| 1219 movdqu xmm6,[64+esi] |
| 1220 pxor xmm4,[32+esp] |
| 1221 lea esi,[80+esi] |
| 1222 pxor xmm5,[48+esp] |
| 1223 movdqa [64+esp],xmm7 |
| 1224 pxor xmm6,xmm7 |
| 1225 call __aesni_encrypt6 |
| 1226 movaps xmm1,[64+esp] |
| 1227 xorps xmm2,[esp] |
| 1228 xorps xmm3,[16+esp] |
| 1229 xorps xmm4,[32+esp] |
| 1230 movups [edi],xmm2 |
| 1231 xorps xmm5,[48+esp] |
| 1232 movups [16+edi],xmm3 |
| 1233 xorps xmm6,xmm1 |
| 1234 movups [32+edi],xmm4 |
| 1235 movups [48+edi],xmm5 |
| 1236 movups [64+edi],xmm6 |
| 1237 lea edi,[80+edi] |
| 1238 jmp NEAR L$054xts_enc_done |
| 1239 align 16 |
| 1240 L$050xts_enc_one: |
| 1241 movups xmm2,[esi] |
| 1242 lea esi,[16+esi] |
| 1243 xorps xmm2,xmm5 |
| 1244 movups xmm0,[edx] |
| 1245 movups xmm1,[16+edx] |
| 1246 lea edx,[32+edx] |
| 1247 xorps xmm2,xmm0 |
| 1248 L$055enc1_loop_9: |
| 1249 db 102,15,56,220,209 |
| 1250 dec ecx |
| 1251 movups xmm1,[edx] |
| 1252 lea edx,[16+edx] |
| 1253 jnz NEAR L$055enc1_loop_9 |
| 1254 db 102,15,56,221,209 |
| 1255 xorps xmm2,xmm5 |
| 1256 movups [edi],xmm2 |
| 1257 lea edi,[16+edi] |
| 1258 movdqa xmm1,xmm5 |
| 1259 jmp NEAR L$054xts_enc_done |
| 1260 align 16 |
| 1261 L$051xts_enc_two: |
| 1262 movaps xmm6,xmm1 |
| 1263 movups xmm2,[esi] |
| 1264 movups xmm3,[16+esi] |
| 1265 lea esi,[32+esi] |
| 1266 xorps xmm2,xmm5 |
| 1267 xorps xmm3,xmm6 |
| 1268 call __aesni_encrypt2 |
| 1269 xorps xmm2,xmm5 |
| 1270 xorps xmm3,xmm6 |
| 1271 movups [edi],xmm2 |
| 1272 movups [16+edi],xmm3 |
| 1273 lea edi,[32+edi] |
| 1274 movdqa xmm1,xmm6 |
| 1275 jmp NEAR L$054xts_enc_done |
| 1276 align 16 |
| 1277 L$052xts_enc_three: |
| 1278 movaps xmm7,xmm1 |
| 1279 movups xmm2,[esi] |
| 1280 movups xmm3,[16+esi] |
| 1281 movups xmm4,[32+esi] |
| 1282 lea esi,[48+esi] |
| 1283 xorps xmm2,xmm5 |
| 1284 xorps xmm3,xmm6 |
| 1285 xorps xmm4,xmm7 |
| 1286 call __aesni_encrypt3 |
| 1287 xorps xmm2,xmm5 |
| 1288 xorps xmm3,xmm6 |
| 1289 xorps xmm4,xmm7 |
| 1290 movups [edi],xmm2 |
| 1291 movups [16+edi],xmm3 |
| 1292 movups [32+edi],xmm4 |
| 1293 lea edi,[48+edi] |
| 1294 movdqa xmm1,xmm7 |
| 1295 jmp NEAR L$054xts_enc_done |
| 1296 align 16 |
| 1297 L$053xts_enc_four: |
| 1298 movaps xmm6,xmm1 |
| 1299 movups xmm2,[esi] |
| 1300 movups xmm3,[16+esi] |
| 1301 movups xmm4,[32+esi] |
| 1302 xorps xmm2,[esp] |
| 1303 movups xmm5,[48+esi] |
| 1304 lea esi,[64+esi] |
| 1305 xorps xmm3,[16+esp] |
| 1306 xorps xmm4,xmm7 |
| 1307 xorps xmm5,xmm6 |
| 1308 call __aesni_encrypt4 |
| 1309 xorps xmm2,[esp] |
| 1310 xorps xmm3,[16+esp] |
| 1311 xorps xmm4,xmm7 |
| 1312 movups [edi],xmm2 |
| 1313 xorps xmm5,xmm6 |
| 1314 movups [16+edi],xmm3 |
| 1315 movups [32+edi],xmm4 |
| 1316 movups [48+edi],xmm5 |
| 1317 lea edi,[64+edi] |
| 1318 movdqa xmm1,xmm6 |
| 1319 jmp NEAR L$054xts_enc_done |
| 1320 align 16 |
| 1321 L$049xts_enc_done6x: |
| 1322 mov eax,DWORD [112+esp] |
| 1323 and eax,15 |
| 1324 jz NEAR L$056xts_enc_ret |
| 1325 movdqa xmm5,xmm1 |
| 1326 mov DWORD [112+esp],eax |
| 1327 jmp NEAR L$057xts_enc_steal |
| 1328 align 16 |
| 1329 L$054xts_enc_done: |
| 1330 mov eax,DWORD [112+esp] |
| 1331 pxor xmm0,xmm0 |
| 1332 and eax,15 |
| 1333 jz NEAR L$056xts_enc_ret |
| 1334 pcmpgtd xmm0,xmm1 |
| 1335 mov DWORD [112+esp],eax |
| 1336 pshufd xmm5,xmm0,19 |
| 1337 paddq xmm1,xmm1 |
| 1338 pand xmm5,[96+esp] |
| 1339 pxor xmm5,xmm1 |
| 1340 L$057xts_enc_steal: |
| 1341 movzx ecx,BYTE [esi] |
| 1342 movzx edx,BYTE [edi-16] |
| 1343 lea esi,[1+esi] |
| 1344 mov BYTE [edi-16],cl |
| 1345 mov BYTE [edi],dl |
| 1346 lea edi,[1+edi] |
| 1347 sub eax,1 |
| 1348 jnz NEAR L$057xts_enc_steal |
| 1349 sub edi,DWORD [112+esp] |
| 1350 mov edx,ebp |
| 1351 mov ecx,ebx |
| 1352 movups xmm2,[edi-16] |
| 1353 xorps xmm2,xmm5 |
| 1354 movups xmm0,[edx] |
| 1355 movups xmm1,[16+edx] |
| 1356 lea edx,[32+edx] |
| 1357 xorps xmm2,xmm0 |
| 1358 L$058enc1_loop_10: |
| 1359 db 102,15,56,220,209 |
| 1360 dec ecx |
| 1361 movups xmm1,[edx] |
| 1362 lea edx,[16+edx] |
| 1363 jnz NEAR L$058enc1_loop_10 |
| 1364 db 102,15,56,221,209 |
| 1365 xorps xmm2,xmm5 |
| 1366 movups [edi-16],xmm2 |
| 1367 L$056xts_enc_ret: |
| 1368 pxor xmm0,xmm0 |
| 1369 pxor xmm1,xmm1 |
| 1370 pxor xmm2,xmm2 |
| 1371 movdqa [esp],xmm0 |
| 1372 pxor xmm3,xmm3 |
| 1373 movdqa [16+esp],xmm0 |
| 1374 pxor xmm4,xmm4 |
| 1375 movdqa [32+esp],xmm0 |
| 1376 pxor xmm5,xmm5 |
| 1377 movdqa [48+esp],xmm0 |
| 1378 pxor xmm6,xmm6 |
| 1379 movdqa [64+esp],xmm0 |
| 1380 pxor xmm7,xmm7 |
| 1381 movdqa [80+esp],xmm0 |
| 1382 mov esp,DWORD [116+esp] |
| 1383 pop edi |
| 1384 pop esi |
| 1385 pop ebx |
| 1386 pop ebp |
| 1387 ret |
; ----------------------------------------------------------------------
; _aesni_xts_decrypt  (32-bit, all arguments on the stack)
;
; Stack arguments as read below, after the four register pushes:
;   [20+esp] -> esi  source pointer
;   [24+esp] -> edi  destination pointer
;   [28+esp] -> eax  byte length
;   [32+esp] -> edx  key schedule used with AESDEC on the data
;                    (dword at offset 240 is the round-loop count)
;   [36+esp]         key schedule used with AESENC to produce the first tweak
;   [40+esp]         pointer to the 16-byte block that is encrypted into
;                    the first tweak
; NOTE(review): the C-level parameter names are not visible here; confirm
; against the prototype.
;
; Local frame (120 bytes reserved, esp then aligned down to 16):
;   [0..95+esp]   up to six per-block tweak values
;   [96+esp]      constant dwords {135,0,1,0} used by the tweak update
;   [112+esp]     byte length (later only the residual length mod 16)
;   [116+esp]     caller's esp, restored on exit
;
; Tweak update idiom (repeated many times below):
;   pshufd xmm2,xmm0,19 / pxor xmm0,xmm0 / paddq xmm1,xmm1 /
;   pand xmm2,xmm3 / pcmpgtd xmm0,xmm1 / pxor xmm1,xmm2
; xmm0 holds the per-dword sign mask of the current tweak; the sequence
; shifts the 128-bit value in xmm1 left by one bit, carries bit 63 into
; bit 64 and XORs 135 into the low dword when bit 127 was set.
;
; The "db 102,15,56,NNN,MM" rows are hand-encoded AES-NI instructions:
;   220 = AESENC, 221 = AESENCLAST, 222 = AESDEC, 223 = AESDECLAST;
;   the last byte is the ModRM (209 = xmm2,xmm1 ... 249 = xmm7,xmm1).
; ----------------------------------------------------------------------
| 1388 global _aesni_xts_decrypt |
| 1389 align 16 |
| 1390 _aesni_xts_decrypt: |
| 1391 L$_aesni_xts_decrypt_begin: |
| 1392 push ebp |
| 1393 push ebx |
| 1394 push esi |
| 1395 push edi |
; Encrypt the 16-byte block at [40+esp] with the schedule at [36+esp];
; the result in xmm2 becomes the initial tweak.
| 1396 mov edx,DWORD [36+esp] |
| 1397 mov esi,DWORD [40+esp] |
| 1398 mov ecx,DWORD [240+edx] |
| 1399 movups xmm2,[esi] |
| 1400 movups xmm0,[edx] |
| 1401 movups xmm1,[16+edx] |
| 1402 lea edx,[32+edx] |
| 1403 xorps xmm2,xmm0 |
| 1404 L$059enc1_loop_11: |
| 1405 db 102,15,56,220,209 |
| 1406 dec ecx |
| 1407 movups xmm1,[edx] |
| 1408 lea edx,[16+edx] |
| 1409 jnz NEAR L$059enc1_loop_11 |
| 1410 db 102,15,56,221,209 |
; Load the data arguments and build the aligned local frame.
| 1411 mov esi,DWORD [20+esp] |
| 1412 mov edi,DWORD [24+esp] |
| 1413 mov eax,DWORD [28+esp] |
| 1414 mov edx,DWORD [32+esp] |
| 1415 mov ebp,esp |
| 1416 sub esp,120 |
| 1417 and esp,-16 |
; If the length is not a multiple of 16, hold back one extra full block
; (ebx = 16) so it can be handled together with the partial tail.
| 1418 xor ebx,ebx |
| 1419 test eax,15 |
| 1420 setnz bl |
| 1421 shl ebx,4 |
| 1422 sub eax,ebx |
| 1423 mov DWORD [96+esp],135 |
| 1424 mov DWORD [100+esp],0 |
| 1425 mov DWORD [104+esp],1 |
| 1426 mov DWORD [108+esp],0 |
| 1427 mov DWORD [112+esp],eax |
| 1428 mov DWORD [116+esp],ebp |
; From here on: ebp = data key schedule, ebx = saved round-loop count,
; xmm1 = current tweak, xmm0 = its sign mask, xmm3 = tweak constant.
| 1429 mov ecx,DWORD [240+edx] |
| 1430 mov ebp,edx |
| 1431 mov ebx,ecx |
| 1432 movdqa xmm1,xmm2 |
| 1433 pxor xmm0,xmm0 |
| 1434 movdqa xmm3,[96+esp] |
| 1435 pcmpgtd xmm0,xmm1 |
| 1436 and eax,-16 |
| 1437 sub eax,96 |
| 1438 jc NEAR L$060xts_dec_short |
; At least 96 bytes: set up ecx/edx/ebx for the six-block helper.
; ebx = 16 - 16*count and edx = key + 32 + 16*count; presumably the form
; L$_aesni_decrypt6_enter expects (helper is outside this view).
| 1439 shl ecx,4 |
| 1440 mov ebx,16 |
| 1441 sub ebx,ecx |
| 1442 lea edx,[32+ecx*1+edx] |
| 1443 jmp NEAR L$061xts_dec_loop6 |
| 1444 align 16 |
; Main loop: six blocks (96 bytes) per iteration.
| 1445 L$061xts_dec_loop6: |
; Generate tweaks 0..4 into [0..79+esp]; the sixth ends up in xmm7.
| 1446 pshufd xmm2,xmm0,19 |
| 1447 pxor xmm0,xmm0 |
| 1448 movdqa [esp],xmm1 |
| 1449 paddq xmm1,xmm1 |
| 1450 pand xmm2,xmm3 |
| 1451 pcmpgtd xmm0,xmm1 |
| 1452 pxor xmm1,xmm2 |
| 1453 pshufd xmm2,xmm0,19 |
| 1454 pxor xmm0,xmm0 |
| 1455 movdqa [16+esp],xmm1 |
| 1456 paddq xmm1,xmm1 |
| 1457 pand xmm2,xmm3 |
| 1458 pcmpgtd xmm0,xmm1 |
| 1459 pxor xmm1,xmm2 |
| 1460 pshufd xmm2,xmm0,19 |
| 1461 pxor xmm0,xmm0 |
| 1462 movdqa [32+esp],xmm1 |
| 1463 paddq xmm1,xmm1 |
| 1464 pand xmm2,xmm3 |
| 1465 pcmpgtd xmm0,xmm1 |
| 1466 pxor xmm1,xmm2 |
| 1467 pshufd xmm2,xmm0,19 |
| 1468 pxor xmm0,xmm0 |
| 1469 movdqa [48+esp],xmm1 |
| 1470 paddq xmm1,xmm1 |
| 1471 pand xmm2,xmm3 |
| 1472 pcmpgtd xmm0,xmm1 |
| 1473 pxor xmm1,xmm2 |
| 1474 pshufd xmm7,xmm0,19 |
| 1475 movdqa [64+esp],xmm1 |
| 1476 paddq xmm1,xmm1 |
; Load six input blocks, XOR each with round key 0 (xmm0) and its tweak.
| 1477 movups xmm0,[ebp] |
| 1478 pand xmm7,xmm3 |
| 1479 movups xmm2,[esi] |
| 1480 pxor xmm7,xmm1 |
| 1481 mov ecx,ebx |
| 1482 movdqu xmm3,[16+esi] |
| 1483 xorps xmm2,xmm0 |
| 1484 movdqu xmm4,[32+esi] |
| 1485 pxor xmm3,xmm0 |
| 1486 movdqu xmm5,[48+esi] |
| 1487 pxor xmm4,xmm0 |
| 1488 movdqu xmm6,[64+esi] |
| 1489 pxor xmm5,xmm0 |
| 1490 movdqu xmm1,[80+esi] |
| 1491 pxor xmm6,xmm0 |
| 1492 lea esi,[96+esi] |
| 1493 pxor xmm2,[esp] |
| 1494 movdqa [80+esp],xmm7 |
| 1495 pxor xmm7,xmm1 |
| 1496 movups xmm1,[16+ebp] |
| 1497 pxor xmm3,[16+esp] |
| 1498 pxor xmm4,[32+esp] |
; First AESDEC round is interleaved with the remaining tweak XORs, then
; the shared six-block routine is entered part-way through.
| 1499 db 102,15,56,222,209 |
| 1500 pxor xmm5,[48+esp] |
| 1501 pxor xmm6,[64+esp] |
| 1502 db 102,15,56,222,217 |
| 1503 pxor xmm7,xmm0 |
| 1504 movups xmm0,[32+ebp] |
| 1505 db 102,15,56,222,225 |
| 1506 db 102,15,56,222,233 |
| 1507 db 102,15,56,222,241 |
| 1508 db 102,15,56,222,249 |
| 1509 call L$_aesni_decrypt6_enter |
; XOR the results with the same tweaks, store six output blocks, and
; advance the tweak (reloaded from [80+esp]) for the next iteration.
| 1510 movdqa xmm1,[80+esp] |
| 1511 pxor xmm0,xmm0 |
| 1512 xorps xmm2,[esp] |
| 1513 pcmpgtd xmm0,xmm1 |
| 1514 xorps xmm3,[16+esp] |
| 1515 movups [edi],xmm2 |
| 1516 xorps xmm4,[32+esp] |
| 1517 movups [16+edi],xmm3 |
| 1518 xorps xmm5,[48+esp] |
| 1519 movups [32+edi],xmm4 |
| 1520 xorps xmm6,[64+esp] |
| 1521 movups [48+edi],xmm5 |
| 1522 xorps xmm7,xmm1 |
| 1523 movups [64+edi],xmm6 |
| 1524 pshufd xmm2,xmm0,19 |
| 1525 movups [80+edi],xmm7 |
| 1526 lea edi,[96+edi] |
| 1527 movdqa xmm3,[96+esp] |
| 1528 pxor xmm0,xmm0 |
| 1529 paddq xmm1,xmm1 |
| 1530 pand xmm2,xmm3 |
| 1531 pcmpgtd xmm0,xmm1 |
| 1532 pxor xmm1,xmm2 |
| 1533 sub eax,96 |
| 1534 jnc NEAR L$061xts_dec_loop6 |
; Restore the plain round count / key pointer for the short paths.
| 1535 mov ecx,DWORD [240+ebp] |
| 1536 mov edx,ebp |
| 1537 mov ebx,ecx |
; Fewer than 96 bytes of whole blocks remain (eax + 96 = 0,16,...,80).
; The je branches below reuse the flags of the preceding cmp: the SSE
; instructions in between do not modify EFLAGS.
| 1538 L$060xts_dec_short: |
| 1539 add eax,96 |
| 1540 jz NEAR L$062xts_dec_done6x |
| 1541 movdqa xmm5,xmm1 |
| 1542 cmp eax,32 |
| 1543 jb NEAR L$063xts_dec_one |
| 1544 pshufd xmm2,xmm0,19 |
| 1545 pxor xmm0,xmm0 |
| 1546 paddq xmm1,xmm1 |
| 1547 pand xmm2,xmm3 |
| 1548 pcmpgtd xmm0,xmm1 |
| 1549 pxor xmm1,xmm2 |
| 1550 je NEAR L$064xts_dec_two |
| 1551 pshufd xmm2,xmm0,19 |
| 1552 pxor xmm0,xmm0 |
| 1553 movdqa xmm6,xmm1 |
| 1554 paddq xmm1,xmm1 |
| 1555 pand xmm2,xmm3 |
| 1556 pcmpgtd xmm0,xmm1 |
| 1557 pxor xmm1,xmm2 |
| 1558 cmp eax,64 |
| 1559 jb NEAR L$065xts_dec_three |
| 1560 pshufd xmm2,xmm0,19 |
| 1561 pxor xmm0,xmm0 |
| 1562 movdqa xmm7,xmm1 |
| 1563 paddq xmm1,xmm1 |
| 1564 pand xmm2,xmm3 |
| 1565 pcmpgtd xmm0,xmm1 |
| 1566 pxor xmm1,xmm2 |
| 1567 movdqa [esp],xmm5 |
| 1568 movdqa [16+esp],xmm6 |
| 1569 je NEAR L$066xts_dec_four |
; Five blocks: tweaks 0..3 on the stack, fifth tweak in xmm7/[64+esp].
| 1570 movdqa [32+esp],xmm7 |
| 1571 pshufd xmm7,xmm0,19 |
| 1572 movdqa [48+esp],xmm1 |
| 1573 paddq xmm1,xmm1 |
| 1574 pand xmm7,xmm3 |
| 1575 pxor xmm7,xmm1 |
| 1576 movdqu xmm2,[esi] |
| 1577 movdqu xmm3,[16+esi] |
| 1578 movdqu xmm4,[32+esi] |
| 1579 pxor xmm2,[esp] |
| 1580 movdqu xmm5,[48+esi] |
| 1581 pxor xmm3,[16+esp] |
| 1582 movdqu xmm6,[64+esi] |
| 1583 pxor xmm4,[32+esp] |
| 1584 lea esi,[80+esi] |
| 1585 pxor xmm5,[48+esp] |
| 1586 movdqa [64+esp],xmm7 |
| 1587 pxor xmm6,xmm7 |
| 1588 call __aesni_decrypt6 |
| 1589 movaps xmm1,[64+esp] |
| 1590 xorps xmm2,[esp] |
| 1591 xorps xmm3,[16+esp] |
| 1592 xorps xmm4,[32+esp] |
| 1593 movups [edi],xmm2 |
| 1594 xorps xmm5,[48+esp] |
| 1595 movups [16+edi],xmm3 |
| 1596 xorps xmm6,xmm1 |
| 1597 movups [32+edi],xmm4 |
| 1598 movups [48+edi],xmm5 |
| 1599 movups [64+edi],xmm6 |
| 1600 lea edi,[80+edi] |
| 1601 jmp NEAR L$067xts_dec_done |
| 1602 align 16 |
; One block: inline single-block AESDEC loop with tweak xmm5.
| 1603 L$063xts_dec_one: |
| 1604 movups xmm2,[esi] |
| 1605 lea esi,[16+esi] |
| 1606 xorps xmm2,xmm5 |
| 1607 movups xmm0,[edx] |
| 1608 movups xmm1,[16+edx] |
| 1609 lea edx,[32+edx] |
| 1610 xorps xmm2,xmm0 |
| 1611 L$068dec1_loop_12: |
| 1612 db 102,15,56,222,209 |
| 1613 dec ecx |
| 1614 movups xmm1,[edx] |
| 1615 lea edx,[16+edx] |
| 1616 jnz NEAR L$068dec1_loop_12 |
| 1617 db 102,15,56,223,209 |
| 1618 xorps xmm2,xmm5 |
| 1619 movups [edi],xmm2 |
| 1620 lea edi,[16+edi] |
; Each short path leaves the last tweak it used in xmm1.
| 1621 movdqa xmm1,xmm5 |
| 1622 jmp NEAR L$067xts_dec_done |
| 1623 align 16 |
; Two blocks: tweaks in xmm5, xmm6.
| 1624 L$064xts_dec_two: |
| 1625 movaps xmm6,xmm1 |
| 1626 movups xmm2,[esi] |
| 1627 movups xmm3,[16+esi] |
| 1628 lea esi,[32+esi] |
| 1629 xorps xmm2,xmm5 |
| 1630 xorps xmm3,xmm6 |
| 1631 call __aesni_decrypt2 |
| 1632 xorps xmm2,xmm5 |
| 1633 xorps xmm3,xmm6 |
| 1634 movups [edi],xmm2 |
| 1635 movups [16+edi],xmm3 |
| 1636 lea edi,[32+edi] |
| 1637 movdqa xmm1,xmm6 |
| 1638 jmp NEAR L$067xts_dec_done |
| 1639 align 16 |
; Three blocks: tweaks in xmm5, xmm6, xmm7.
| 1640 L$065xts_dec_three: |
| 1641 movaps xmm7,xmm1 |
| 1642 movups xmm2,[esi] |
| 1643 movups xmm3,[16+esi] |
| 1644 movups xmm4,[32+esi] |
| 1645 lea esi,[48+esi] |
| 1646 xorps xmm2,xmm5 |
| 1647 xorps xmm3,xmm6 |
| 1648 xorps xmm4,xmm7 |
| 1649 call __aesni_decrypt3 |
| 1650 xorps xmm2,xmm5 |
| 1651 xorps xmm3,xmm6 |
| 1652 xorps xmm4,xmm7 |
| 1653 movups [edi],xmm2 |
| 1654 movups [16+edi],xmm3 |
| 1655 movups [32+edi],xmm4 |
| 1656 lea edi,[48+edi] |
| 1657 movdqa xmm1,xmm7 |
| 1658 jmp NEAR L$067xts_dec_done |
| 1659 align 16 |
; Four blocks: tweaks in [esp], [16+esp], xmm7, xmm6.
| 1660 L$066xts_dec_four: |
| 1661 movaps xmm6,xmm1 |
| 1662 movups xmm2,[esi] |
| 1663 movups xmm3,[16+esi] |
| 1664 movups xmm4,[32+esi] |
| 1665 xorps xmm2,[esp] |
| 1666 movups xmm5,[48+esi] |
| 1667 lea esi,[64+esi] |
| 1668 xorps xmm3,[16+esp] |
| 1669 xorps xmm4,xmm7 |
| 1670 xorps xmm5,xmm6 |
| 1671 call __aesni_decrypt4 |
| 1672 xorps xmm2,[esp] |
| 1673 xorps xmm3,[16+esp] |
| 1674 xorps xmm4,xmm7 |
| 1675 movups [edi],xmm2 |
| 1676 xorps xmm5,xmm6 |
| 1677 movups [16+edi],xmm3 |
| 1678 movups [32+edi],xmm4 |
| 1679 movups [48+edi],xmm5 |
| 1680 lea edi,[64+edi] |
| 1681 movdqa xmm1,xmm6 |
| 1682 jmp NEAR L$067xts_dec_done |
| 1683 align 16 |
; Whole blocks ended exactly on a six-block boundary: xmm1 already holds
; the next tweak and xmm0 its sign mask. Return unless a partial tail
; (length mod 16) remains.
| 1684 L$062xts_dec_done6x: |
| 1685 mov eax,DWORD [112+esp] |
| 1686 and eax,15 |
| 1687 jz NEAR L$069xts_dec_ret |
| 1688 mov DWORD [112+esp],eax |
| 1689 jmp NEAR L$070xts_dec_only_one_more |
| 1690 align 16 |
; Short paths join here with xmm1 = last tweak used. If a partial tail
; remains, advance xmm1 to the next tweak first.
| 1691 L$067xts_dec_done: |
| 1692 mov eax,DWORD [112+esp] |
| 1693 pxor xmm0,xmm0 |
| 1694 and eax,15 |
| 1695 jz NEAR L$069xts_dec_ret |
| 1696 pcmpgtd xmm0,xmm1 |
| 1697 mov DWORD [112+esp],eax |
| 1698 pshufd xmm2,xmm0,19 |
| 1699 pxor xmm0,xmm0 |
| 1700 movdqa xmm3,[96+esp] |
| 1701 paddq xmm1,xmm1 |
| 1702 pand xmm2,xmm3 |
| 1703 pcmpgtd xmm0,xmm1 |
| 1704 pxor xmm1,xmm2 |
; Partial tail handling. xmm6 = current tweak, xmm5 = the tweak after it.
; The held-back full block at [esi] is decrypted with xmm5 first.
| 1705 L$070xts_dec_only_one_more: |
| 1706 pshufd xmm5,xmm0,19 |
| 1707 movdqa xmm6,xmm1 |
| 1708 paddq xmm1,xmm1 |
| 1709 pand xmm5,xmm3 |
| 1710 pxor xmm5,xmm1 |
| 1711 mov edx,ebp |
| 1712 mov ecx,ebx |
| 1713 movups xmm2,[esi] |
| 1714 xorps xmm2,xmm5 |
| 1715 movups xmm0,[edx] |
| 1716 movups xmm1,[16+edx] |
| 1717 lea edx,[32+edx] |
| 1718 xorps xmm2,xmm0 |
| 1719 L$071dec1_loop_13: |
| 1720 db 102,15,56,222,209 |
| 1721 dec ecx |
| 1722 movups xmm1,[edx] |
| 1723 lea edx,[16+edx] |
| 1724 jnz NEAR L$071dec1_loop_13 |
| 1725 db 102,15,56,223,209 |
| 1726 xorps xmm2,xmm5 |
| 1727 movups [edi],xmm2 |
; Byte-swap loop, eax (= length mod 16) iterations: the trailing input
; byte at [16+esi] replaces the byte at [edi], and the byte it displaces
; is moved out to [16+edi].
| 1728 L$072xts_dec_steal: |
| 1729 movzx ecx,BYTE [16+esi] |
| 1730 movzx edx,BYTE [edi] |
| 1731 lea esi,[1+esi] |
| 1732 mov BYTE [edi],cl |
| 1733 mov BYTE [16+edi],dl |
| 1734 lea edi,[1+edi] |
| 1735 sub eax,1 |
| 1736 jnz NEAR L$072xts_dec_steal |
; Rewind edi and decrypt the reassembled block in place with tweak xmm6.
| 1737 sub edi,DWORD [112+esp] |
| 1738 mov edx,ebp |
| 1739 mov ecx,ebx |
| 1740 movups xmm2,[edi] |
| 1741 xorps xmm2,xmm6 |
| 1742 movups xmm0,[edx] |
| 1743 movups xmm1,[16+edx] |
| 1744 lea edx,[32+edx] |
| 1745 xorps xmm2,xmm0 |
| 1746 L$073dec1_loop_14: |
| 1747 db 102,15,56,222,209 |
| 1748 dec ecx |
| 1749 movups xmm1,[edx] |
| 1750 lea edx,[16+edx] |
| 1751 jnz NEAR L$073dec1_loop_14 |
| 1752 db 102,15,56,223,209 |
| 1753 xorps xmm2,xmm6 |
| 1754 movups [edi],xmm2 |
; Exit: zero xmm0-xmm7 and the six tweak slots, restore the caller's esp
; from [116+esp], and pop the saved registers.
| 1755 L$069xts_dec_ret: |
| 1756 pxor xmm0,xmm0 |
| 1757 pxor xmm1,xmm1 |
| 1758 pxor xmm2,xmm2 |
| 1759 movdqa [esp],xmm0 |
| 1760 pxor xmm3,xmm3 |
| 1761 movdqa [16+esp],xmm0 |
| 1762 pxor xmm4,xmm4 |
| 1763 movdqa [32+esp],xmm0 |
| 1764 pxor xmm5,xmm5 |
| 1765 movdqa [48+esp],xmm0 |
| 1766 pxor xmm6,xmm6 |
| 1767 movdqa [64+esp],xmm0 |
| 1768 pxor xmm7,xmm7 |
| 1769 movdqa [80+esp],xmm0 |
| 1770 mov esp,DWORD [116+esp] |
| 1771 pop edi |
| 1772 pop esi |
| 1773 pop ebx |
| 1774 pop ebp |
| 1775 ret |
; ----------------------------------------------------------------------
; _aesni_cbc_encrypt  (32-bit, all arguments on the stack)
;
; Stack arguments as read below, after the four register pushes:
;   [20+esp] -> esi  source pointer
;   [24+esp] -> edi  destination pointer
;   [28+esp] -> eax  byte length (zero => return immediately)
;   [32+esp] -> edx  key schedule (dword at offset 240 = round-loop count)
;   [36+esp] -> ebp  pointer to the 16-byte chaining value; read on entry
;                    and written back on exit
;   [40+esp]         direction flag: 0 selects the decrypt path
; NOTE(review): C-level parameter names are not visible here; confirm
; against the prototype.
;
; Local frame: esp is switched to (esp-24) & -16; [0..15+esp] is a 16-byte
; scratch slot and [16+esp] holds the caller's esp.
;
; "db 102,15,56,NNN,209" rows are hand-encoded AES-NI instructions on
; xmm2,xmm1: 220 = AESENC, 221 = AESENCLAST, 222 = AESDEC, 223 = AESDECLAST.
; "dd 2767451785" (0xA4F3F689) encodes "mov esi,esi / rep movsb";
; "dd 2868115081" (0xAAF3F689) encodes "mov esi,esi / rep stosb".
; ----------------------------------------------------------------------
| 1776 global _aesni_cbc_encrypt |
| 1777 align 16 |
| 1778 _aesni_cbc_encrypt: |
| 1779 L$_aesni_cbc_encrypt_begin: |
| 1780 push ebp |
| 1781 push ebx |
| 1782 push esi |
| 1783 push edi |
| 1784 mov esi,DWORD [20+esp] |
| 1785 mov ebx,esp |
| 1786 mov edi,DWORD [24+esp] |
| 1787 sub ebx,24 |
| 1788 mov eax,DWORD [28+esp] |
| 1789 and ebx,-16 |
| 1790 mov edx,DWORD [32+esp] |
| 1791 mov ebp,DWORD [36+esp] |
| 1792 test eax,eax |
| 1793 jz NEAR L$074cbc_abort |
; The flags from this cmp are consumed by the "je L$075cbc_decrypt" below;
; none of the instructions in between modify EFLAGS.
| 1794 cmp DWORD [40+esp],0 |
| 1795 xchg ebx,esp |
| 1796 movups xmm7,[ebp] |
| 1797 mov ecx,DWORD [240+edx] |
| 1798 mov ebp,edx |
| 1799 mov DWORD [16+esp],ebx |
| 1800 mov ebx,ecx |
| 1801 je NEAR L$075cbc_decrypt |
; ---- Encrypt path: xmm2 carries the chaining value. ----
| 1802 movaps xmm2,xmm7 |
| 1803 cmp eax,16 |
| 1804 jb NEAR L$076cbc_enc_tail |
| 1805 sub eax,16 |
| 1806 jmp NEAR L$077cbc_enc_loop |
| 1807 align 16 |
; One block per iteration: xmm2 ^= input ^ round key 0, then the AESENC
; rounds; the output block stays in xmm2 as the next chaining value.
| 1808 L$077cbc_enc_loop: |
| 1809 movups xmm7,[esi] |
| 1810 lea esi,[16+esi] |
| 1811 movups xmm0,[edx] |
| 1812 movups xmm1,[16+edx] |
| 1813 xorps xmm7,xmm0 |
| 1814 lea edx,[32+edx] |
| 1815 xorps xmm2,xmm7 |
| 1816 L$078enc1_loop_15: |
| 1817 db 102,15,56,220,209 |
| 1818 dec ecx |
| 1819 movups xmm1,[edx] |
| 1820 lea edx,[16+edx] |
| 1821 jnz NEAR L$078enc1_loop_15 |
| 1822 db 102,15,56,221,209 |
| 1823 mov ecx,ebx |
| 1824 mov edx,ebp |
| 1825 movups [edi],xmm2 |
| 1826 lea edi,[16+edi] |
| 1827 sub eax,16 |
| 1828 jnc NEAR L$077cbc_enc_loop |
| 1829 add eax,16 |
| 1830 jnz NEAR L$076cbc_enc_tail |
| 1831 movaps xmm7,xmm2 |
| 1832 pxor xmm2,xmm2 |
| 1833 jmp NEAR L$079cbc_ret |
; Partial final block (eax = 1..15 bytes): copy the bytes to the output
; buffer with rep movsb, zero-fill the rest of the 16-byte block with
; rep stosb (al = 0), then re-enter the loop to encrypt that block in place.
| 1834 L$076cbc_enc_tail: |
| 1835 mov ecx,eax |
| 1836 dd 2767451785 |
| 1837 mov ecx,16 |
| 1838 sub ecx,eax |
| 1839 xor eax,eax |
| 1840 dd 2868115081 |
| 1841 lea edi,[edi-16] |
| 1842 mov ecx,ebx |
| 1843 mov esi,edi |
| 1844 mov edx,ebp |
| 1845 jmp NEAR L$077cbc_enc_loop |
| 1846 align 16 |
; ---- Decrypt path: xmm7 carries the chaining value. ----
| 1847 L$075cbc_decrypt: |
| 1848 cmp eax,80 |
| 1849 jbe NEAR L$080cbc_dec_tail |
| 1850 movaps [esp],xmm7 |
| 1851 sub eax,80 |
| 1852 jmp NEAR L$081cbc_dec_loop6_enter |
| 1853 align 16 |
; Six blocks per iteration. On loop-back the last input block (xmm0)
; becomes the chaining value at [esp], and the sixth output block (xmm7)
; from the previous iteration is stored.
| 1854 L$082cbc_dec_loop6: |
| 1855 movaps [esp],xmm0 |
| 1856 movups [edi],xmm7 |
| 1857 lea edi,[16+edi] |
| 1858 L$081cbc_dec_loop6_enter: |
| 1859 movdqu xmm2,[esi] |
| 1860 movdqu xmm3,[16+esi] |
| 1861 movdqu xmm4,[32+esi] |
| 1862 movdqu xmm5,[48+esi] |
| 1863 movdqu xmm6,[64+esi] |
| 1864 movdqu xmm7,[80+esi] |
| 1865 call __aesni_decrypt6 |
; XOR each decrypted block with the preceding input block (the first one
; with the chaining value saved at [esp]).
| 1866 movups xmm1,[esi] |
| 1867 movups xmm0,[16+esi] |
| 1868 xorps xmm2,[esp] |
| 1869 xorps xmm3,xmm1 |
| 1870 movups xmm1,[32+esi] |
| 1871 xorps xmm4,xmm0 |
| 1872 movups xmm0,[48+esi] |
| 1873 xorps xmm5,xmm1 |
| 1874 movups xmm1,[64+esi] |
| 1875 xorps xmm6,xmm0 |
| 1876 movups xmm0,[80+esi] |
| 1877 xorps xmm7,xmm1 |
| 1878 movups [edi],xmm2 |
| 1879 movups [16+edi],xmm3 |
| 1880 lea esi,[96+esi] |
| 1881 movups [32+edi],xmm4 |
| 1882 mov ecx,ebx |
| 1883 movups [48+edi],xmm5 |
| 1884 mov edx,ebp |
| 1885 movups [64+edi],xmm6 |
| 1886 lea edi,[80+edi] |
| 1887 sub eax,96 |
| 1888 ja NEAR L$082cbc_dec_loop6 |
; Loop exit: xmm2 = pending sixth output block, xmm7 = new chaining value.
| 1889 movaps xmm2,xmm7 |
| 1890 movaps xmm7,xmm0 |
| 1891 add eax,80 |
| 1892 jle NEAR L$083cbc_dec_clear_tail_collected |
| 1893 movups [edi],xmm2 |
| 1894 lea edi,[16+edi] |
; At most 80 bytes remain: dispatch on eax to the 1/2/3/4/5-block paths.
| 1895 L$080cbc_dec_tail: |
| 1896 movups xmm2,[esi] |
| 1897 movaps xmm6,xmm2 |
| 1898 cmp eax,16 |
| 1899 jbe NEAR L$084cbc_dec_one |
| 1900 movups xmm3,[16+esi] |
| 1901 movaps xmm5,xmm3 |
| 1902 cmp eax,32 |
| 1903 jbe NEAR L$085cbc_dec_two |
| 1904 movups xmm4,[32+esi] |
| 1905 cmp eax,48 |
| 1906 jbe NEAR L$086cbc_dec_three |
| 1907 movups xmm5,[48+esi] |
| 1908 cmp eax,64 |
| 1909 jbe NEAR L$087cbc_dec_four |
; Five blocks: run the six-block routine with a zeroed sixth lane.
| 1910 movups xmm6,[64+esi] |
| 1911 movaps [esp],xmm7 |
| 1912 movups xmm2,[esi] |
| 1913 xorps xmm7,xmm7 |
| 1914 call __aesni_decrypt6 |
| 1915 movups xmm1,[esi] |
| 1916 movups xmm0,[16+esi] |
| 1917 xorps xmm2,[esp] |
| 1918 xorps xmm3,xmm1 |
| 1919 movups xmm1,[32+esi] |
| 1920 xorps xmm4,xmm0 |
| 1921 movups xmm0,[48+esi] |
| 1922 xorps xmm5,xmm1 |
| 1923 movups xmm7,[64+esi] |
| 1924 xorps xmm6,xmm0 |
| 1925 movups [edi],xmm2 |
| 1926 movups [16+edi],xmm3 |
| 1927 pxor xmm3,xmm3 |
| 1928 movups [32+edi],xmm4 |
| 1929 pxor xmm4,xmm4 |
| 1930 movups [48+edi],xmm5 |
| 1931 pxor xmm5,xmm5 |
| 1932 lea edi,[64+edi] |
| 1933 movaps xmm2,xmm6 |
| 1934 pxor xmm6,xmm6 |
| 1935 sub eax,80 |
| 1936 jmp NEAR L$088cbc_dec_tail_collected |
| 1937 align 16 |
; One block: inline AESDEC loop; xmm6 (copy of the input block) becomes
; the new chaining value.
| 1938 L$084cbc_dec_one: |
| 1939 movups xmm0,[edx] |
| 1940 movups xmm1,[16+edx] |
| 1941 lea edx,[32+edx] |
| 1942 xorps xmm2,xmm0 |
| 1943 L$089dec1_loop_16: |
| 1944 db 102,15,56,222,209 |
| 1945 dec ecx |
| 1946 movups xmm1,[edx] |
| 1947 lea edx,[16+edx] |
| 1948 jnz NEAR L$089dec1_loop_16 |
| 1949 db 102,15,56,223,209 |
| 1950 xorps xmm2,xmm7 |
| 1951 movaps xmm7,xmm6 |
| 1952 sub eax,16 |
| 1953 jmp NEAR L$088cbc_dec_tail_collected |
| 1954 align 16 |
; Two blocks.
| 1955 L$085cbc_dec_two: |
| 1956 call __aesni_decrypt2 |
| 1957 xorps xmm2,xmm7 |
| 1958 xorps xmm3,xmm6 |
| 1959 movups [edi],xmm2 |
| 1960 movaps xmm2,xmm3 |
| 1961 pxor xmm3,xmm3 |
| 1962 lea edi,[16+edi] |
| 1963 movaps xmm7,xmm5 |
| 1964 sub eax,32 |
| 1965 jmp NEAR L$088cbc_dec_tail_collected |
| 1966 align 16 |
; Three blocks.
| 1967 L$086cbc_dec_three: |
| 1968 call __aesni_decrypt3 |
| 1969 xorps xmm2,xmm7 |
| 1970 xorps xmm3,xmm6 |
| 1971 xorps xmm4,xmm5 |
| 1972 movups [edi],xmm2 |
| 1973 movaps xmm2,xmm4 |
| 1974 pxor xmm4,xmm4 |
| 1975 movups [16+edi],xmm3 |
| 1976 pxor xmm3,xmm3 |
| 1977 lea edi,[32+edi] |
| 1978 movups xmm7,[32+esi] |
| 1979 sub eax,48 |
| 1980 jmp NEAR L$088cbc_dec_tail_collected |
| 1981 align 16 |
; Four blocks.
| 1982 L$087cbc_dec_four: |
| 1983 call __aesni_decrypt4 |
| 1984 movups xmm1,[16+esi] |
| 1985 movups xmm0,[32+esi] |
| 1986 xorps xmm2,xmm7 |
| 1987 movups xmm7,[48+esi] |
| 1988 xorps xmm3,xmm6 |
| 1989 movups [edi],xmm2 |
| 1990 xorps xmm4,xmm1 |
| 1991 movups [16+edi],xmm3 |
| 1992 pxor xmm3,xmm3 |
| 1993 xorps xmm5,xmm0 |
| 1994 movups [32+edi],xmm4 |
| 1995 pxor xmm4,xmm4 |
| 1996 lea edi,[48+edi] |
| 1997 movaps xmm2,xmm5 |
| 1998 pxor xmm5,xmm5 |
| 1999 sub eax,64 |
| 2000 jmp NEAR L$088cbc_dec_tail_collected |
| 2001 align 16 |
| 2002 L$083cbc_dec_clear_tail_collected: |
| 2003 pxor xmm3,xmm3 |
| 2004 pxor xmm4,xmm4 |
| 2005 pxor xmm5,xmm5 |
| 2006 pxor xmm6,xmm6 |
; All decrypt tails join here with the final output block still in xmm2.
; If (eax & 15) is zero the block is stored whole; otherwise only part of
; it is copied out through the stack scratch slot.
| 2007 L$088cbc_dec_tail_collected: |
| 2008 and eax,15 |
| 2009 jnz NEAR L$090cbc_dec_tail_partial |
| 2010 movups [edi],xmm2 |
| 2011 pxor xmm0,xmm0 |
| 2012 jmp NEAR L$079cbc_ret |
| 2013 align 16 |
; Partial store: spill xmm2 to [esp], copy (16 - eax) bytes from there to
; the destination with rep movsb, then wipe the scratch slot.
| 2014 L$090cbc_dec_tail_partial: |
| 2015 movaps [esp],xmm2 |
| 2016 pxor xmm0,xmm0 |
| 2017 mov ecx,16 |
| 2018 mov esi,esp |
| 2019 sub ecx,eax |
| 2020 dd 2767451785 |
; Overwrite the plaintext copy with zeros (xmm0 was cleared above). The
; previous form stored xmm2 again, leaving the plaintext on the stack.
| 2021 movdqa [esp],xmm0 |
; Exit: restore the caller's esp, write the chaining value in xmm7 back
; through the pointer at [36+esp], and clear the working registers.
| 2022 L$079cbc_ret: |
| 2023 mov esp,DWORD [16+esp] |
| 2024 mov ebp,DWORD [36+esp] |
| 2025 pxor xmm2,xmm2 |
| 2026 pxor xmm1,xmm1 |
| 2027 movups [ebp],xmm7 |
| 2028 pxor xmm7,xmm7 |
| 2029 L$074cbc_abort: |
| 2030 pop edi |
| 2031 pop esi |
| 2032 pop ebx |
| 2033 pop ebp |
| 2034 ret |
; ----------------------------------------------------------------------
; __aesni_set_encrypt_key  (internal; register arguments)
;
; In:   eax = pointer to the user key bytes
;       ecx = key size in bits (128, 192 or 256)
;       edx = pointer to the key schedule to fill
; Out:  eax = 0 on success, -1 if eax or edx is null, -2 for any other
;       key size. On success ecx holds the value stored at offset 240 of
;       the schedule (9, 11 or 13).
; Saves/restores ebp and ebx; uses xmm0-xmm5, which are zeroed on the
; success path.
;
; Hand-encoded instructions used below:
;   db 102,15,58,223,200,N  AESKEYGENASSIST xmm1,xmm0,N
;   db 102,15,58,223,202,N  AESKEYGENASSIST xmm1,xmm2,N
;   db 102,15,56,0,197/213  PSHUFB xmm0,xmm5 / PSHUFB xmm2,xmm5
;   db 102,15,56,221,196    AESENCLAST xmm0,xmm4
;   db 102,15,56,221,212    AESENCLAST xmm2,xmm4
;   db 102,15,56,221,211    AESENCLAST xmm2,xmm3
; ----------------------------------------------------------------------
| 2035 align 16 |
| 2036 __aesni_set_encrypt_key: |
| 2037 push ebp |
| 2038 push ebx |
| 2039 test eax,eax |
| 2040 jz NEAR L$091bad_pointer |
| 2041 test edx,edx |
| 2042 jz NEAR L$091bad_pointer |
; call/pop obtains the current address so that ebx can point at
; L$key_const without an absolute relocation.
| 2043 call L$092pic |
| 2044 L$092pic: |
| 2045 pop ebx |
| 2046 lea ebx,[(L$key_const-L$092pic)+ebx] |
| 2047 lea ebp,[_OPENSSL_ia32cap_P] |
| 2048 movups xmm0,[eax] |
| 2049 xorps xmm4,xmm4 |
; ebp = second dword of _OPENSSL_ia32cap_P masked with 0x10000800
; (bits 28 and 11). The "_alt" paths are taken only when bit 28 is set
; and bit 11 is clear. NOTE(review): presumably the AVX and XOP feature
; bits; confirm against the capability-vector layout.
| 2050 mov ebp,DWORD [4+ebp] |
| 2051 lea edx,[16+edx] |
| 2052 and ebp,268437504 |
| 2053 cmp ecx,256 |
| 2054 je NEAR L$09314rounds |
| 2055 cmp ecx,192 |
| 2056 je NEAR L$09412rounds |
| 2057 cmp ecx,128 |
| 2058 jne NEAR L$095bad_keybits |
| 2059 align 16 |
; ---- 128-bit key, AESKEYGENASSIST variant ----
; Stores the user key, then ten derived round keys; finally writes 9 at
; [80+edx], which is offset 240 from the start of the schedule.
| 2060 L$09610rounds: |
| 2061 cmp ebp,268435456 |
| 2062 je NEAR L$09710rounds_alt |
| 2063 mov ecx,9 |
| 2064 movups [edx-16],xmm0 |
| 2065 db 102,15,58,223,200,1 |
| 2066 call L$098key_128_cold |
| 2067 db 102,15,58,223,200,2 |
| 2068 call L$099key_128 |
| 2069 db 102,15,58,223,200,4 |
| 2070 call L$099key_128 |
| 2071 db 102,15,58,223,200,8 |
| 2072 call L$099key_128 |
| 2073 db 102,15,58,223,200,16 |
| 2074 call L$099key_128 |
| 2075 db 102,15,58,223,200,32 |
| 2076 call L$099key_128 |
| 2077 db 102,15,58,223,200,64 |
| 2078 call L$099key_128 |
| 2079 db 102,15,58,223,200,128 |
| 2080 call L$099key_128 |
| 2081 db 102,15,58,223,200,27 |
| 2082 call L$099key_128 |
| 2083 db 102,15,58,223,200,54 |
| 2084 call L$099key_128 |
| 2085 movups [edx],xmm0 |
| 2086 mov DWORD [80+edx],ecx |
| 2087 jmp NEAR L$100good_key |
| 2088 align 16 |
; Helper: store the current round key (xmm0) and advance edx, then derive
; the next key from xmm0 and the AESKEYGENASSIST result in xmm1. The
; "_cold" entry skips the store for the very first step. xmm4 is scratch
; and relies on having been zeroed at function entry.
| 2089 L$099key_128: |
| 2090 movups [edx],xmm0 |
| 2091 lea edx,[16+edx] |
| 2092 L$098key_128_cold: |
| 2093 shufps xmm4,xmm0,16 |
| 2094 xorps xmm0,xmm4 |
| 2095 shufps xmm4,xmm0,140 |
| 2096 xorps xmm0,xmm4 |
| 2097 shufps xmm1,xmm1,255 |
| 2098 xorps xmm0,xmm1 |
| 2099 ret |
| 2100 align 16 |
; ---- 128-bit key, PSHUFB + AESENCLAST variant ----
; xmm5 = byte-shuffle mask from [ebx]; xmm4 = round constant vector from
; [32+ebx], doubled each step with pslld. Eight keys come from the loop;
; the last two steps are unrolled, reloading xmm4 from [48+ebx].
| 2101 L$09710rounds_alt: |
| 2102 movdqa xmm5,[ebx] |
| 2103 mov ecx,8 |
| 2104 movdqa xmm4,[32+ebx] |
| 2105 movdqa xmm2,xmm0 |
| 2106 movdqu [edx-16],xmm0 |
| 2107 L$101loop_key128: |
| 2108 db 102,15,56,0,197 |
| 2109 db 102,15,56,221,196 |
| 2110 pslld xmm4,1 |
| 2111 lea edx,[16+edx] |
| 2112 movdqa xmm3,xmm2 |
| 2113 pslldq xmm2,4 |
| 2114 pxor xmm3,xmm2 |
| 2115 pslldq xmm2,4 |
| 2116 pxor xmm3,xmm2 |
| 2117 pslldq xmm2,4 |
| 2118 pxor xmm2,xmm3 |
| 2119 pxor xmm0,xmm2 |
| 2120 movdqu [edx-16],xmm0 |
| 2121 movdqa xmm2,xmm0 |
| 2122 dec ecx |
| 2123 jnz NEAR L$101loop_key128 |
| 2124 movdqa xmm4,[48+ebx] |
| 2125 db 102,15,56,0,197 |
| 2126 db 102,15,56,221,196 |
| 2127 pslld xmm4,1 |
| 2128 movdqa xmm3,xmm2 |
| 2129 pslldq xmm2,4 |
| 2130 pxor xmm3,xmm2 |
| 2131 pslldq xmm2,4 |
| 2132 pxor xmm3,xmm2 |
| 2133 pslldq xmm2,4 |
| 2134 pxor xmm2,xmm3 |
| 2135 pxor xmm0,xmm2 |
| 2136 movdqu [edx],xmm0 |
| 2137 movdqa xmm2,xmm0 |
| 2138 db 102,15,56,0,197 |
| 2139 db 102,15,56,221,196 |
| 2140 movdqa xmm3,xmm2 |
| 2141 pslldq xmm2,4 |
| 2142 pxor xmm3,xmm2 |
| 2143 pslldq xmm2,4 |
| 2144 pxor xmm3,xmm2 |
| 2145 pslldq xmm2,4 |
| 2146 pxor xmm2,xmm3 |
| 2147 pxor xmm0,xmm2 |
| 2148 movdqu [16+edx],xmm0 |
; [96+edx] is offset 240 from the start of the schedule at this point.
| 2149 mov ecx,9 |
| 2150 mov DWORD [96+edx],ecx |
| 2151 jmp NEAR L$100good_key |
| 2152 align 16 |
; ---- 192-bit key, AESKEYGENASSIST variant ----
; xmm0 = first 16 key bytes, low half of xmm2 = remaining 8 bytes.
; Writes 11 at [48+edx] (offset 240 of the schedule) when done.
| 2153 L$09412rounds: |
| 2154 movq xmm2,[16+eax] |
| 2155 cmp ebp,268435456 |
| 2156 je NEAR L$10212rounds_alt |
| 2157 mov ecx,11 |
| 2158 movups [edx-16],xmm0 |
| 2159 db 102,15,58,223,202,1 |
| 2160 call L$103key_192a_cold |
| 2161 db 102,15,58,223,202,2 |
| 2162 call L$104key_192b |
| 2163 db 102,15,58,223,202,4 |
| 2164 call L$105key_192a |
| 2165 db 102,15,58,223,202,8 |
| 2166 call L$104key_192b |
| 2167 db 102,15,58,223,202,16 |
| 2168 call L$105key_192a |
| 2169 db 102,15,58,223,202,32 |
| 2170 call L$104key_192b |
| 2171 db 102,15,58,223,202,64 |
| 2172 call L$105key_192a |
| 2173 db 102,15,58,223,202,128 |
| 2174 call L$104key_192b |
| 2175 movups [edx],xmm0 |
| 2176 mov DWORD [48+edx],ecx |
| 2177 jmp NEAR L$100good_key |
| 2178 align 16 |
; Helper "a": store xmm0 (16 bytes), remember xmm2 in xmm5, then derive
; the next 24 bytes of key material into xmm0 / xmm2.
| 2179 L$105key_192a: |
| 2180 movups [edx],xmm0 |
| 2181 lea edx,[16+edx] |
| 2182 align 16 |
| 2183 L$103key_192a_cold: |
| 2184 movaps xmm5,xmm2 |
| 2185 L$106key_192b_warm: |
| 2186 shufps xmm4,xmm0,16 |
| 2187 movdqa xmm3,xmm2 |
| 2188 xorps xmm0,xmm4 |
| 2189 shufps xmm4,xmm0,140 |
| 2190 pslldq xmm3,4 |
| 2191 xorps xmm0,xmm4 |
| 2192 pshufd xmm1,xmm1,85 |
| 2193 pxor xmm2,xmm3 |
| 2194 pxor xmm0,xmm1 |
| 2195 pshufd xmm3,xmm0,255 |
| 2196 pxor xmm2,xmm3 |
| 2197 ret |
| 2198 align 16 |
; Helper "b": repack xmm5/xmm0/xmm2 into two aligned 16-byte round keys,
; store both (32 bytes), then share the derivation tail above.
| 2199 L$104key_192b: |
| 2200 movaps xmm3,xmm0 |
| 2201 shufps xmm5,xmm0,68 |
| 2202 movups [edx],xmm5 |
| 2203 shufps xmm3,xmm2,78 |
| 2204 movups [16+edx],xmm3 |
| 2205 lea edx,[32+edx] |
| 2206 jmp NEAR L$106key_192b_warm |
| 2207 align 16 |
; ---- 192-bit key, PSHUFB + AESENCLAST variant ----
; Uses the second shuffle mask ([16+ebx]); each of the eight iterations
; emits 24 bytes of schedule. 11 is written at [32+edx] (offset 240).
| 2208 L$10212rounds_alt: |
| 2209 movdqa xmm5,[16+ebx] |
| 2210 movdqa xmm4,[32+ebx] |
| 2211 mov ecx,8 |
| 2212 movdqu [edx-16],xmm0 |
| 2213 L$107loop_key192: |
| 2214 movq [edx],xmm2 |
| 2215 movdqa xmm1,xmm2 |
| 2216 db 102,15,56,0,213 |
| 2217 db 102,15,56,221,212 |
| 2218 pslld xmm4,1 |
| 2219 lea edx,[24+edx] |
| 2220 movdqa xmm3,xmm0 |
| 2221 pslldq xmm0,4 |
| 2222 pxor xmm3,xmm0 |
| 2223 pslldq xmm0,4 |
| 2224 pxor xmm3,xmm0 |
| 2225 pslldq xmm0,4 |
| 2226 pxor xmm0,xmm3 |
| 2227 pshufd xmm3,xmm0,255 |
| 2228 pxor xmm3,xmm1 |
| 2229 pslldq xmm1,4 |
| 2230 pxor xmm3,xmm1 |
| 2231 pxor xmm0,xmm2 |
| 2232 pxor xmm2,xmm3 |
| 2233 movdqu [edx-16],xmm0 |
| 2234 dec ecx |
| 2235 jnz NEAR L$107loop_key192 |
| 2236 mov ecx,11 |
| 2237 mov DWORD [32+edx],ecx |
| 2238 jmp NEAR L$100good_key |
| 2239 align 16 |
; ---- 256-bit key, AESKEYGENASSIST variant ----
; xmm0 / xmm2 = low / high 16 key bytes; edx is advanced a further 16.
; Writes 13 at [16+edx] (offset 240 of the schedule) when done.
| 2240 L$09314rounds: |
| 2241 movups xmm2,[16+eax] |
| 2242 lea edx,[16+edx] |
| 2243 cmp ebp,268435456 |
| 2244 je NEAR L$10814rounds_alt |
| 2245 mov ecx,13 |
| 2246 movups [edx-32],xmm0 |
| 2247 movups [edx-16],xmm2 |
| 2248 db 102,15,58,223,202,1 |
| 2249 call L$109key_256a_cold |
| 2250 db 102,15,58,223,200,1 |
| 2251 call L$110key_256b |
| 2252 db 102,15,58,223,202,2 |
| 2253 call L$111key_256a |
| 2254 db 102,15,58,223,200,2 |
| 2255 call L$110key_256b |
| 2256 db 102,15,58,223,202,4 |
| 2257 call L$111key_256a |
| 2258 db 102,15,58,223,200,4 |
| 2259 call L$110key_256b |
| 2260 db 102,15,58,223,202,8 |
| 2261 call L$111key_256a |
| 2262 db 102,15,58,223,200,8 |
| 2263 call L$110key_256b |
| 2264 db 102,15,58,223,202,16 |
| 2265 call L$111key_256a |
| 2266 db 102,15,58,223,200,16 |
| 2267 call L$110key_256b |
| 2268 db 102,15,58,223,202,32 |
| 2269 call L$111key_256a |
| 2270 db 102,15,58,223,200,32 |
| 2271 call L$110key_256b |
| 2272 db 102,15,58,223,202,64 |
| 2273 call L$111key_256a |
| 2274 movups [edx],xmm0 |
| 2275 mov DWORD [16+edx],ecx |
| 2276 xor eax,eax |
| 2277 jmp NEAR L$100good_key |
| 2278 align 16 |
; Helper "a": store xmm2, then update the even key half (xmm0) using
; dword 3 of the AESKEYGENASSIST result.
| 2279 L$111key_256a: |
| 2280 movups [edx],xmm2 |
| 2281 lea edx,[16+edx] |
| 2282 L$109key_256a_cold: |
| 2283 shufps xmm4,xmm0,16 |
| 2284 xorps xmm0,xmm4 |
| 2285 shufps xmm4,xmm0,140 |
| 2286 xorps xmm0,xmm4 |
| 2287 shufps xmm1,xmm1,255 |
| 2288 xorps xmm0,xmm1 |
| 2289 ret |
| 2290 align 16 |
; Helper "b": store xmm0, then update the odd key half (xmm2) using
; dword 2 of the AESKEYGENASSIST result.
| 2291 L$110key_256b: |
| 2292 movups [edx],xmm0 |
| 2293 lea edx,[16+edx] |
| 2294 shufps xmm4,xmm2,16 |
| 2295 xorps xmm2,xmm4 |
| 2296 shufps xmm4,xmm2,140 |
| 2297 xorps xmm2,xmm4 |
| 2298 shufps xmm1,xmm1,170 |
| 2299 xorps xmm2,xmm1 |
| 2300 ret |
| 2301 align 16 |
; ---- 256-bit key, PSHUFB + AESENCLAST variant ----
; Seven passes; each pass emits one 16-byte key, and all but the last
; also emit a second key via AESENCLAST with a zeroed xmm3.
| 2302 L$10814rounds_alt: |
| 2303 movdqa xmm5,[ebx] |
| 2304 movdqa xmm4,[32+ebx] |
| 2305 mov ecx,7 |
| 2306 movdqu [edx-32],xmm0 |
| 2307 movdqa xmm1,xmm2 |
| 2308 movdqu [edx-16],xmm2 |
| 2309 L$112loop_key256: |
| 2310 db 102,15,56,0,213 |
| 2311 db 102,15,56,221,212 |
| 2312 movdqa xmm3,xmm0 |
| 2313 pslldq xmm0,4 |
| 2314 pxor xmm3,xmm0 |
| 2315 pslldq xmm0,4 |
| 2316 pxor xmm3,xmm0 |
| 2317 pslldq xmm0,4 |
| 2318 pxor xmm0,xmm3 |
| 2319 pslld xmm4,1 |
| 2320 pxor xmm0,xmm2 |
| 2321 movdqu [edx],xmm0 |
| 2322 dec ecx |
| 2323 jz NEAR L$113done_key256 |
| 2324 pshufd xmm2,xmm0,255 |
| 2325 pxor xmm3,xmm3 |
| 2326 db 102,15,56,221,211 |
| 2327 movdqa xmm3,xmm1 |
| 2328 pslldq xmm1,4 |
| 2329 pxor xmm3,xmm1 |
| 2330 pslldq xmm1,4 |
| 2331 pxor xmm3,xmm1 |
| 2332 pslldq xmm1,4 |
| 2333 pxor xmm1,xmm3 |
| 2334 pxor xmm2,xmm1 |
| 2335 movdqu [16+edx],xmm2 |
| 2336 lea edx,[32+edx] |
| 2337 movdqa xmm1,xmm2 |
| 2338 jmp NEAR L$112loop_key256 |
| 2339 L$113done_key256: |
| 2340 mov ecx,13 |
| 2341 mov DWORD [16+edx],ecx |
; Success exit: clear the key material from xmm0-xmm5 and return 0.
| 2342 L$100good_key: |
| 2343 pxor xmm0,xmm0 |
| 2344 pxor xmm1,xmm1 |
| 2345 pxor xmm2,xmm2 |
| 2346 pxor xmm3,xmm3 |
| 2347 pxor xmm4,xmm4 |
| 2348 pxor xmm5,xmm5 |
| 2349 xor eax,eax |
| 2350 pop ebx |
| 2351 pop ebp |
| 2352 ret |
| 2353 align 4 |
; Error exit: null key or schedule pointer.
| 2354 L$091bad_pointer: |
| 2355 mov eax,-1 |
| 2356 pop ebx |
| 2357 pop ebp |
| 2358 ret |
| 2359 align 4 |
; Error exit: unsupported key size; xmm0 (loaded from the user key) is
; cleared first.
| 2360 L$095bad_keybits: |
| 2361 pxor xmm0,xmm0 |
| 2362 mov eax,-2 |
| 2363 pop ebx |
| 2364 pop ebp |
| 2365 ret |
; ----------------------------------------------------------------------
; _aesni_set_encrypt_key  (exported, stack arguments)
; Loads the three stack arguments into the registers the internal
; routine expects ([4+esp] -> eax key bytes, [8+esp] -> ecx bits,
; [12+esp] -> edx schedule) and returns its result in eax unchanged.
; ----------------------------------------------------------------------
| 2366 global _aesni_set_encrypt_key |
| 2367 align 16 |
| 2368 _aesni_set_encrypt_key: |
| 2369 L$_aesni_set_encrypt_key_begin: |
| 2370 mov eax,DWORD [4+esp] |
| 2371 mov ecx,DWORD [8+esp] |
| 2372 mov edx,DWORD [12+esp] |
| 2373 call __aesni_set_encrypt_key |
| 2374 ret |
; ----------------------------------------------------------------------
; _aesni_set_decrypt_key  (exported, stack arguments)
; Same arguments as _aesni_set_encrypt_key. Builds the encryption
; schedule, then converts it in place: the order of the round keys is
; reversed and AESIMC is applied to every key except the first and last.
; Returns the error code from __aesni_set_encrypt_key unchanged on
; failure, 0 on success.
;   db 102,15,56,219,192 = AESIMC xmm0,xmm0
;   db 102,15,56,219,201 = AESIMC xmm1,xmm1
; ----------------------------------------------------------------------
| 2375 global _aesni_set_decrypt_key |
| 2376 align 16 |
| 2377 _aesni_set_decrypt_key: |
| 2378 L$_aesni_set_decrypt_key_begin: |
| 2379 mov eax,DWORD [4+esp] |
| 2380 mov ecx,DWORD [8+esp] |
| 2381 mov edx,DWORD [12+esp] |
| 2382 call __aesni_set_encrypt_key |
; ecx comes back as the stored count (9/11/13); scale it to a byte offset
; so that eax = edx + 16 + 16*count addresses the last round key.
| 2383 mov edx,DWORD [12+esp] |
| 2384 shl ecx,4 |
| 2385 test eax,eax |
| 2386 jnz NEAR L$114dec_key_ret |
| 2387 lea eax,[16+ecx*1+edx] |
; Swap the first and last round keys without transforming them.
| 2388 movups xmm0,[edx] |
| 2389 movups xmm1,[eax] |
| 2390 movups [eax],xmm0 |
| 2391 movups [edx],xmm1 |
| 2392 lea edx,[16+edx] |
| 2393 lea eax,[eax-16] |
; Walk inward from both ends, applying AESIMC to each pair and swapping.
| 2394 L$115dec_key_inverse: |
| 2395 movups xmm0,[edx] |
| 2396 movups xmm1,[eax] |
| 2397 db 102,15,56,219,192 |
| 2398 db 102,15,56,219,201 |
| 2399 lea edx,[16+edx] |
| 2400 lea eax,[eax-16] |
| 2401 movups [16+eax],xmm0 |
| 2402 movups [edx-16],xmm1 |
| 2403 cmp eax,edx |
| 2404 ja NEAR L$115dec_key_inverse |
; The pointers have met: transform the middle key in place.
| 2405 movups xmm0,[edx] |
| 2406 db 102,15,56,219,192 |
| 2407 movups [edx],xmm0 |
| 2408 pxor xmm0,xmm0 |
| 2409 pxor xmm1,xmm1 |
| 2410 xor eax,eax |
| 2411 L$114dec_key_ret: |
| 2412 ret |
; Constant table addressed through ebx by __aesni_set_encrypt_key:
;   +0   0x0C0F0E0D x4  PSHUFB mask loaded by the 128- and 256-bit alt paths
;   +16  0x04070605 x4  PSHUFB mask loaded by the 192-bit alt path
;   +32  1 x4           initial round-constant vector
;   +48  27 x4          round-constant vector reloaded by the 128-bit alt path
; followed by the NUL-terminated ASCII string
;   "AES for Intel AES-NI, CRYPTOGAMS by <appro@openssl.org>".
| 2413 align 64 |
| 2414 L$key_const: |
| 2415 dd 202313229,202313229,202313229,202313229 |
| 2416 dd 67569157,67569157,67569157,67569157 |
| 2417 dd 1,1,1,1 |
| 2418 dd 27,27,27,27 |
| 2419 db 65,69,83,32,102,111,114,32,73,110,116,101,108,32,65,69 |
| 2420 db 83,45,78,73,44,32,67,82,89,80,84,79,71,65,77,83 |
| 2421 db 32,98,121,32,60,97,112,112,114,111,64,111,112,101,110,115 |
| 2422 db 115,108,46,111,114,103,62,0 |
; 16-byte common symbol for the capability vector that
; __aesni_set_encrypt_key reads at offset 4. Declared "common" here while
; the matching "extern" line near the top of the file is commented out.
| 2423 segment .bss |
| 2424 common _OPENSSL_ia32cap_P 16 |
OLD | NEW |