/external/llvm/test/MC/X86/ |
H A D | x86-32-avx.s | 3 // CHECK: vaddss %xmm4, %xmm6, %xmm2 5 vaddss %xmm4, %xmm6, %xmm2 7 // CHECK: vmulss %xmm4, %xmm6, %xmm2 9 vmulss %xmm4, %xmm6, %xmm2 11 // CHECK: vsubss %xmm4, %xmm6, %xmm2 13 vsubss %xmm4, %xmm6, %xmm2 15 // CHECK: vdivss %xmm4, %xmm6, %xmm2 17 vdivss %xmm4, %xmm6, %xmm2 19 // CHECK: vaddsd %xmm4, %xmm6, %xmm2 21 vaddsd %xmm4, %xmm6, %xmm2 [all...] |
H A D | x86_64-xop-encoding.s | 27 // CHECK: vphsubbw %xmm2, %xmm1 29 vphsubbw %xmm2, %xmm1 35 // CHECK: vphaddwq %xmm6, %xmm2 37 vphaddwq %xmm6, %xmm2 59 // CHECK: vphadduwd %xmm2, %xmm1 61 vphadduwd %xmm2, %xmm1 67 // CHECK: vphaddudq %xmm6, %xmm2 69 vphaddudq %xmm6, %xmm2 83 // CHECK: vphaddubq %xmm2, %xmm2 [all...] |
H A D | x86_64-encoding.s | 123 // CHECK: sha1rnds4 $1, %xmm1, %xmm2 125 sha1rnds4 $1, %xmm1, %xmm2 127 // CHECK: sha1rnds4 $1, (%rax), %xmm2 129 sha1rnds4 $1, (%rax), %xmm2 131 // CHECK: sha1nexte %xmm1, %xmm2 133 sha1nexte %xmm1, %xmm2 135 // CHECK: sha1msg1 %xmm1, %xmm2 137 sha1msg1 %xmm1, %xmm2 139 // CHECK: sha1msg1 (%rax), %xmm2 141 sha1msg1 (%rax), %xmm2 [all...] |
H A D | shuffle-comments.s | 18 vpalignr $8, %xmm0, %xmm1, %xmm2 19 # CHECK: xmm2 = xmm0[8,9,10,11,12,13,14,15],xmm1[0,1,2,3,4,5,6,7] 20 vpalignr $8, (%rax), %xmm1, %xmm2 21 # CHECK: xmm2 = mem[8,9,10,11,12,13,14,15],xmm1[0,1,2,3,4,5,6,7] 23 vpalignr $16, %xmm0, %xmm1, %xmm2 24 # CHECK: xmm2 = xmm1[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15] 25 vpalignr $16, (%rax), %xmm1, %xmm2 26 # CHECK: xmm2 = xmm1[0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15] 28 vpalignr $0, %xmm0, %xmm1, %xmm2 29 # CHECK: xmm2 [all...] |
H A D | x86-32-fma3.s | 3 // CHECK: vfmadd132pd %xmm2, %xmm5, %xmm1 5 vfmadd132pd %xmm2, %xmm5, %xmm1 11 // CHECK: vfmadd132ps %xmm2, %xmm5, %xmm1 13 vfmadd132ps %xmm2, %xmm5, %xmm1 19 // CHECK: vfmadd213pd %xmm2, %xmm5, %xmm1 21 vfmadd213pd %xmm2, %xmm5, %xmm1 27 // CHECK: vfmadd213ps %xmm2, %xmm5, %xmm1 29 vfmadd213ps %xmm2, %xmm5, %xmm1 35 // CHECK: vfmadd231pd %xmm2, %xmm5, %xmm1 37 vfmadd231pd %xmm2, [all...] |
H A D | intel-syntax-x86-64-avx.s | 3 // CHECK: vgatherdpd xmm2, xmmword ptr [rdi + 2*xmm1], xmm0 5 vgatherdpd xmm2, xmmword ptr [rdi + 2*xmm1], xmm0 7 // CHECK: vgatherqpd xmm2, xmmword ptr [rdi + 2*xmm1], xmm0 9 vgatherqpd xmm2, xmmword ptr [rdi + 2*xmm1], xmm0 35 // CHECK: vpgatherdq xmm2, xmmword ptr [rdi + 2*xmm1], xmm0 37 vpgatherdq xmm2, xmmword ptr [rdi + 2*xmm1], xmm0 39 // CHECK: vpgatherqq xmm2, xmmword ptr [rdi + 2*xmm1], xmm0 41 vpgatherqq xmm2, xmmword ptr [rdi + 2*xmm1], xmm0
|
/external/swiftshader/third_party/LLVM/test/MC/X86/ |
H A D | x86-32-avx.s | 3 // CHECK: vaddss %xmm4, %xmm6, %xmm2 5 vaddss %xmm4, %xmm6, %xmm2 7 // CHECK: vmulss %xmm4, %xmm6, %xmm2 9 vmulss %xmm4, %xmm6, %xmm2 11 // CHECK: vsubss %xmm4, %xmm6, %xmm2 13 vsubss %xmm4, %xmm6, %xmm2 15 // CHECK: vdivss %xmm4, %xmm6, %xmm2 17 vdivss %xmm4, %xmm6, %xmm2 19 // CHECK: vaddsd %xmm4, %xmm6, %xmm2 21 vaddsd %xmm4, %xmm6, %xmm2 [all...] |
H A D | x86-32-fma3.s | 3 // CHECK: vfmadd132pd %xmm2, %xmm5, %xmm1 5 vfmadd132pd %xmm2, %xmm5, %xmm1 11 // CHECK: vfmadd132ps %xmm2, %xmm5, %xmm1 13 vfmadd132ps %xmm2, %xmm5, %xmm1 19 // CHECK: vfmadd213pd %xmm2, %xmm5, %xmm1 21 vfmadd213pd %xmm2, %xmm5, %xmm1 27 // CHECK: vfmadd213ps %xmm2, %xmm5, %xmm1 29 vfmadd213ps %xmm2, %xmm5, %xmm1 35 // CHECK: vfmadd231pd %xmm2, %xmm5, %xmm1 37 vfmadd231pd %xmm2, [all...] |
/external/libvpx/libvpx/third_party/libyuv/source/ |
H A D | compare_win.cc | 36 movdqu xmm2, [edx] local 39 psubusb xmm1, xmm2 40 psubusb xmm2, xmm3 local 41 por xmm1, xmm2 42 movdqa xmm2, xmm1 local 44 punpckhbw xmm2, xmm5 local 46 pmaddwd xmm2, xmm2 local 48 paddd xmm0, xmm2 145 movdqa xmm2, xmm local 146 punpcklbw xmm2, xmm7 // src[0-7] local 156 movdqa xmm2, xmm1 local 157 punpcklwd xmm2, xmm7 // src[8-11] local 158 pmulld xmm2, xmm5 local 166 pshufd xmm2, xmm1, 0x0e // upper 2 dwords local 168 pshufd xmm2, xmm1, 0x01 local 193 vpmovzxbd xmm2, [eax + 8] // src[8-11] local 196 vpmulld xmm2, xmm2, xmmword ptr kHashMul2 local 202 vpshufd xmm2, xmm1, 0x0e // upper 2 dwords local 204 vpshufd xmm2, xmm1, 0x01 local [all...] |
/external/libyuv/files/source/ |
H A D | compare_win.cc | 36 movdqu xmm2, [edx] local 39 psubusb xmm1, xmm2 40 psubusb xmm2, xmm3 local 41 por xmm1, xmm2 42 movdqa xmm2, xmm1 local 44 punpckhbw xmm2, xmm5 local 46 pmaddwd xmm2, xmm2 local 48 paddd xmm0, xmm2 145 movdqa xmm2, xmm local 146 punpcklbw xmm2, xmm7 // src[0-7] local 156 movdqa xmm2, xmm1 local 157 punpcklwd xmm2, xmm7 // src[8-11] local 158 pmulld xmm2, xmm5 local 166 pshufd xmm2, xmm1, 0x0e // upper 2 dwords local 168 pshufd xmm2, xmm1, 0x01 local 193 vpmovzxbd xmm2, [eax + 8] // src[8-11] local 196 vpmulld xmm2, xmm2, xmmword ptr kHashMul2 local 202 vpshufd xmm2, xmm1, 0x0e // upper 2 dwords local 204 vpshufd xmm2, xmm1, 0x01 local [all...] |
/external/compiler-rt/lib/builtins/i386/ |
H A D | floatdidf.S | 30 movsd REL_ADDR(twop52), %xmm2 // 0x1.0p52 31 subsd %xmm2, %xmm1 // a_hi - 0x1p52 (no rounding occurs) 32 orpd %xmm2, %xmm0 // 0x1p52 + a_lo (no rounding occurs)
|
H A D | ashrdi3.S | 14 movd 12(%esp), %xmm2 // Load count 24 psrlq %xmm2, %xmm0 // unsigned shift input by count 33 pandn %xmm1, %xmm2 // 63 - count 35 psubq %xmm1, %xmm2 // 64 - count 36 psllq %xmm2, %xmm1 // -1 << (64 - count) = leading sign bits
|
/external/libvpx/libvpx/vp8/common/x86/ |
H A D | idctllm_sse2.asm | 61 movq xmm2, [rax+2*rdx] 66 punpcklbw xmm2, xmm5 73 paddw xmm2, xmm4 79 packuswb xmm2, xmm5 88 movq [rax], xmm2 126 ; note the transpose of xmm1 and xmm2, necessary for shuffle 129 movdqa xmm2, [rax+16] 141 pmullw xmm2, [rdx+16] 154 movdqa xmm4, xmm2 155 punpckldq xmm2, xmm [all...] |
/external/libjpeg-turbo/simd/ |
H A D | jfdctflt-sse-64.asm | 87 movaps xmm2, XMMWORD [XMMBLOCK(2,1,rdx,SIZEOF_FAST_FLOAT)] 90 ; xmm0=(20 21 22 23), xmm2=(24 25 26 27) 96 movaps xmm5,xmm2 ; transpose coefficients(phase 1) 97 unpcklps xmm2,xmm3 ; xmm2=(24 34 25 35) 109 movaps XMMWORD [wk(1)], xmm2 ; wk(1)=(24 34 25 35) 114 movaps xmm2,xmm1 ; transpose coefficients(phase 1) 116 unpckhps xmm2,xmm3 ; xmm2=(06 16 07 17) 121 movaps xmm3,xmm2 ; transpos [all...] |
H A D | jidctflt-sse2-64.asm | 102 movq xmm2, XMM_MMWORD [MMBLOCK(2,0,rsi,SIZEOF_JCOEF)] 108 por xmm1,xmm2 130 movaps xmm2,xmm0 135 shufps xmm2,xmm2,0xAA ; xmm2=(02 02 02 02) 142 movaps XMMWORD [XMMBLOCK(2,0,rdi,SIZEOF_FAST_FLOAT)], xmm2 143 movaps XMMWORD [XMMBLOCK(2,1,rdi,SIZEOF_FAST_FLOAT)], xmm2 154 movq xmm2, XMM_MMWORD [MMBLOCK(4,0,rsi,SIZEOF_JCOEF)] 164 punpcklwd xmm2,xmm [all...] |
H A D | jfdctfst-sse2-64.asm | 100 movdqa xmm2, XMMWORD [XMMBLOCK(2,0,rdx,SIZEOF_DCTELEM)] 103 ; xmm0=(00 01 02 03 04 05 06 07), xmm2=(20 21 22 23 24 25 26 27) 109 movdqa xmm5,xmm2 ; transpose coefficients(phase 1) 110 punpcklwd xmm2,xmm3 ; xmm2=(20 30 21 31 22 32 23 33) 121 movdqa XMMWORD [wk(0)], xmm2 ; wk(0)=(20 30 21 31 22 32 23 33) 124 movdqa xmm2,xmm6 ; transpose coefficients(phase 1) 126 punpckhwd xmm2,xmm7 ; xmm2=(44 54 45 55 46 56 47 57) 134 movdqa xmm3,xmm2 ; transpos [all...] |
H A D | jfdctfst-sse2.asm | 106 movdqa xmm2, XMMWORD [XMMBLOCK(2,0,edx,SIZEOF_DCTELEM)] 109 ; xmm0=(00 01 02 03 04 05 06 07), xmm2=(20 21 22 23 24 25 26 27) 115 movdqa xmm5,xmm2 ; transpose coefficients(phase 1) 116 punpcklwd xmm2,xmm3 ; xmm2=(20 30 21 31 22 32 23 33) 127 movdqa XMMWORD [wk(0)], xmm2 ; wk(0)=(20 30 21 31 22 32 23 33) 130 movdqa xmm2,xmm6 ; transpose coefficients(phase 1) 132 punpckhwd xmm2,xmm7 ; xmm2=(44 54 45 55 46 56 47 57) 140 movdqa xmm3,xmm2 ; transpos [all...] |
/external/boringssl/linux-x86/crypto/chacha/ |
H A D | chacha-x86.S | 409 pshufd $170,%xmm3,%xmm2 419 movdqa %xmm2,96(%ebp) 430 pshufd $170,%xmm3,%xmm2 438 movdqa %xmm2,32(%ebp) 450 movdqa -96(%ebp),%xmm2 456 movdqa %xmm2,-96(%ebx) 461 movdqa 32(%ebp),%xmm2 468 movdqa %xmm2,32(%ebx) 485 movdqa %xmm3,%xmm2 489 pxor %xmm4,%xmm2 [all...] |
/external/boringssl/mac-x86/crypto/chacha/ |
H A D | chacha-x86.S | 406 pshufd $170,%xmm3,%xmm2 416 movdqa %xmm2,96(%ebp) 427 pshufd $170,%xmm3,%xmm2 435 movdqa %xmm2,32(%ebp) 447 movdqa -96(%ebp),%xmm2 453 movdqa %xmm2,-96(%ebx) 458 movdqa 32(%ebp),%xmm2 465 movdqa %xmm2,32(%ebx) 482 movdqa %xmm3,%xmm2 486 pxor %xmm4,%xmm2 [all...] |
/external/boringssl/win-x86/crypto/aes/ |
H A D | aesni-x86.asm | 24 movups xmm2,[eax] 30 xorps xmm2,xmm0 40 movups [eax],xmm2 41 pxor xmm2,xmm2 49 movups xmm2,[eax] 55 xorps xmm2,xmm0 65 movups [eax],xmm2 66 pxor xmm2,xmm2 [all...] |
/external/libvpx/libvpx/vp8/encoder/x86/ |
H A D | fwalsh_sse2.asm | 34 movq xmm2, MMWORD PTR [rsi] 38 punpcklwd xmm2, xmm3 41 punpckldq xmm0, xmm2 ; ip[1] ip[0] 42 punpckhdq xmm1, xmm2 ; ip[3] ip[2] 44 movdqa xmm2, xmm0 46 psubw xmm2, xmm1 49 psllw xmm2, 2 ; c1 b1 52 punpcklqdq xmm0, xmm2 ; b1 a1 53 punpckhqdq xmm1, xmm2 ; c1 d1 61 movdqa xmm2, xmm [all...] |
H A D | dct_sse2.asm | 70 movq xmm2, MMWORD PTR[input+ pitch] ;13 12 11 10 75 punpcklqdq xmm0, xmm2 ;13 12 11 10 03 02 01 00 78 movdqa xmm2, xmm0 80 punpckhdq xmm2, xmm1 ;33 32 13 12 31 30 11 10 82 punpckldq xmm0, xmm2 ;31 21 30 20 11 10 01 00 84 pshufhw xmm2, xmm2, 0b1h ;32 33 12 13 xx xx xx xx 86 punpckhdq xmm1, xmm2 ;32 33 22 23 12 13 02 03 111 movdqa xmm2, xmm0 113 punpckhqdq xmm2, xmm [all...] |
H A D | encodeopt.asm | 30 movdqa xmm2, [rsi+16] 34 psubw xmm2, xmm3 37 pmaddwd xmm2, xmm2 39 paddd xmm0, xmm2 90 movdqa xmm2, [rsi+16] 94 psubw xmm2, xmm3 95 pmaddwd xmm2, xmm2 106 paddd xmm4, xmm2 [all...] |
/external/boringssl/linux-x86/crypto/aes/ |
H A D | aesni-x86.S | 12 movups (%eax),%xmm2 18 xorps %xmm0,%xmm2 28 movups %xmm2,(%eax) 29 pxor %xmm2,%xmm2 40 movups (%eax),%xmm2 46 xorps %xmm0,%xmm2 56 movups %xmm2,(%eax) 57 pxor %xmm2,%xmm2 [all...] |
/external/boringssl/mac-x86/crypto/aes/ |
H A D | aesni-x86.S | 11 movups (%eax),%xmm2 17 xorps %xmm0,%xmm2 27 movups %xmm2,(%eax) 28 pxor %xmm2,%xmm2 37 movups (%eax),%xmm2 43 xorps %xmm0,%xmm2 53 movups %xmm2,(%eax) 54 pxor %xmm2,%xmm2 [all...] |