/external/llvm/test/MC/X86/ |
H A D | x86-32-avx.s | 330 // CHECK: vshufps $8, %xmm1, %xmm2, %xmm3 332 vshufps $8, %xmm1, %xmm2, %xmm3 334 // CHECK: vshufps $8, -4(%ebx,%ecx,8), %xmm2, %xmm3 336 vshufps $8, -4(%ebx,%ecx,8), %xmm2, %xmm3 338 // CHECK: vshufpd $8, %xmm1, %xmm2, %xmm3 340 vshufpd $8, %xmm1, %xmm2, %xmm3 342 // CHECK: vshufpd $8, -4(%ebx,%ecx,8), %xmm2, %xmm3 344 vshufpd $8, -4(%ebx,%ecx,8), %xmm2, %xmm3 346 // CHECK: vcmpeqps %xmm1, %xmm2, %xmm3 348 vcmpeqps %xmm1, %xmm2, %xmm3 [all...] |
H A D | x86_64-xop-encoding.s | 43 // CHECK: vphaddwd %xmm3, %xmm4 45 vphaddwd %xmm3, %xmm4 72 // CHECK: vphaddubw (%rcx), %xmm3 74 vphaddubw (%rcx), %xmm3 123 // CHECK: vphaddbd %xmm1, %xmm3 125 vphaddbd %xmm1, %xmm3 144 // CHECK: vfrczps 4(%rax), %xmm3 146 vfrczps 4(%rax), %xmm3 200 // CHECK: vpshld %xmm7, %xmm5, %xmm3 202 vpshld %xmm7, %xmm5, %xmm3 [all...] |
/external/swiftshader/third_party/LLVM/test/MC/X86/ |
H A D | x86-32-avx.s | 330 // CHECK: vshufps $8, %xmm1, %xmm2, %xmm3 332 vshufps $8, %xmm1, %xmm2, %xmm3 334 // CHECK: vshufps $8, -4(%ebx,%ecx,8), %xmm2, %xmm3 336 vshufps $8, -4(%ebx,%ecx,8), %xmm2, %xmm3 338 // CHECK: vshufpd $8, %xmm1, %xmm2, %xmm3 340 vshufpd $8, %xmm1, %xmm2, %xmm3 342 // CHECK: vshufpd $8, -4(%ebx,%ecx,8), %xmm2, %xmm3 344 vshufpd $8, -4(%ebx,%ecx,8), %xmm2, %xmm3 346 // CHECK: vcmpps $0, %xmm1, %xmm2, %xmm3 348 vcmpeqps %xmm1, %xmm2, %xmm3 [all...] |
/external/libjpeg-turbo/simd/ |
H A D | jidctflt-sse2-64.asm | 103 movq xmm3, XMM_MMWORD [MMBLOCK(3,0,rsi,SIZEOF_JCOEF)] 109 por xmm3,xmm4 111 por xmm1,xmm3 131 movaps xmm3,xmm0 136 shufps xmm3,xmm3,0xFF ; xmm3=(03 03 03 03) 144 movaps XMMWORD [XMMBLOCK(3,0,rdi,SIZEOF_FAST_FLOAT)], xmm3 145 movaps XMMWORD [XMMBLOCK(3,1,rdi,SIZEOF_FAST_FLOAT)], xmm3 155 movq xmm3, XMM_MMWOR [all...] |
H A D | jfdctflt-sse-64.asm | 88 movaps xmm3, XMMWORD [XMMBLOCK(3,1,rdx,SIZEOF_FAST_FLOAT)] 91 ; xmm1=(30 31 32 33), xmm3=(34 35 36 37) 97 unpcklps xmm2,xmm3 ; xmm2=(24 34 25 35) 98 unpckhps xmm5,xmm3 ; xmm5=(26 36 27 37) 103 movaps xmm3, XMMWORD [XMMBLOCK(1,1,rdx,SIZEOF_FAST_FLOAT)] 106 ; xmm7=(10 11 12 13), xmm3=(14 15 16 17) 115 unpcklps xmm1,xmm3 ; xmm1=(04 14 05 15) 116 unpckhps xmm2,xmm3 ; xmm2=(06 16 07 17) 121 movaps xmm3,xmm2 ; transpose coefficients(phase 2) 123 unpckhps2 xmm3,xmm [all...] |
H A D | jidctflt-sse2.asm | 109 movq xmm3, XMM_MMWORD [MMBLOCK(3,0,esi,SIZEOF_JCOEF)] 115 por xmm3,xmm4 117 por xmm1,xmm3 137 movaps xmm3,xmm0 142 shufps xmm3,xmm3,0xFF ; xmm3=(03 03 03 03) 150 movaps XMMWORD [XMMBLOCK(3,0,edi,SIZEOF_FAST_FLOAT)], xmm3 151 movaps XMMWORD [XMMBLOCK(3,1,edi,SIZEOF_FAST_FLOAT)], xmm3 162 movq xmm3, XMM_MMWOR [all...] |
H A D | jfdctfst-sse2-64.asm | 101 movdqa xmm3, XMMWORD [XMMBLOCK(3,0,rdx,SIZEOF_DCTELEM)] 104 ; xmm1=(10 11 12 13 14 15 16 17), xmm3=(30 31 32 33 34 35 36 37) 110 punpcklwd xmm2,xmm3 ; xmm2=(20 30 21 31 22 32 23 33) 111 punpckhwd xmm5,xmm3 ; xmm5=(24 34 25 35 26 36 27 37) 116 movdqa xmm3, XMMWORD [XMMBLOCK(7,0,rdx,SIZEOF_DCTELEM)] 119 ; xmm7=( 5 13 21 29 37 45 53 61), xmm3=( 7 15 23 31 39 47 55 63) 128 punpcklwd xmm1,xmm3 ; xmm1=(60 70 61 71 62 72 63 73) 129 punpckhwd xmm5,xmm3 ; xmm5=(64 74 65 75 66 76 67 77) 134 movdqa xmm3,xmm2 ; transpose coefficients(phase 2) 136 punpckhdq xmm3,xmm [all...] |
H A D | jfdctfst-sse2.asm | 107 movdqa xmm3, XMMWORD [XMMBLOCK(3,0,edx,SIZEOF_DCTELEM)] 110 ; xmm1=(10 11 12 13 14 15 16 17), xmm3=(30 31 32 33 34 35 36 37) 116 punpcklwd xmm2,xmm3 ; xmm2=(20 30 21 31 22 32 23 33) 117 punpckhwd xmm5,xmm3 ; xmm5=(24 34 25 35 26 36 27 37) 122 movdqa xmm3, XMMWORD [XMMBLOCK(7,0,edx,SIZEOF_DCTELEM)] 125 ; xmm7=( 5 13 21 29 37 45 53 61), xmm3=( 7 15 23 31 39 47 55 63) 134 punpcklwd xmm1,xmm3 ; xmm1=(60 70 61 71 62 72 63 73) 135 punpckhwd xmm5,xmm3 ; xmm5=(64 74 65 75 66 76 67 77) 140 movdqa xmm3,xmm2 ; transpose coefficients(phase 2) 142 punpckhdq xmm3,xmm [all...] |
H A D | jfdctflt-sse.asm | 95 movaps xmm3, XMMWORD [XMMBLOCK(3,1,edx,SIZEOF_FAST_FLOAT)] 98 ; xmm1=(30 31 32 33), xmm3=(34 35 36 37) 104 unpcklps xmm2,xmm3 ; xmm2=(24 34 25 35) 105 unpckhps xmm5,xmm3 ; xmm5=(26 36 27 37) 110 movaps xmm3, XMMWORD [XMMBLOCK(1,1,edx,SIZEOF_FAST_FLOAT)] 113 ; xmm7=(10 11 12 13), xmm3=(14 15 16 17) 122 unpcklps xmm1,xmm3 ; xmm1=(04 14 05 15) 123 unpckhps xmm2,xmm3 ; xmm2=(06 16 07 17) 128 movaps xmm3,xmm2 ; transpose coefficients(phase 2) 130 unpckhps2 xmm3,xmm [all...] |
H A D | jfdctint-sse2-64.asm | 122 movdqa xmm3, XMMWORD [XMMBLOCK(3,0,rdx,SIZEOF_DCTELEM)] 125 ; xmm1=(10 11 12 13 14 15 16 17), xmm3=(30 31 32 33 34 35 36 37) 131 punpcklwd xmm2,xmm3 ; xmm2=(20 30 21 31 22 32 23 33) 132 punpckhwd xmm5,xmm3 ; xmm5=(24 34 25 35 26 36 27 37) 137 movdqa xmm3, XMMWORD [XMMBLOCK(7,0,rdx,SIZEOF_DCTELEM)] 140 ; xmm7=( 5 13 21 29 37 45 53 61), xmm3=( 7 15 23 31 39 47 55 63) 149 punpcklwd xmm1,xmm3 ; xmm1=(60 70 61 71 62 72 63 73) 150 punpckhwd xmm5,xmm3 ; xmm5=(64 74 65 75 66 76 67 77) 155 movdqa xmm3,xmm2 ; transpose coefficients(phase 2) 157 punpckhdq xmm3,xmm [all...] |
H A D | jfdctint-sse2.asm | 128 movdqa xmm3, XMMWORD [XMMBLOCK(3,0,edx,SIZEOF_DCTELEM)] 131 ; xmm1=(10 11 12 13 14 15 16 17), xmm3=(30 31 32 33 34 35 36 37) 137 punpcklwd xmm2,xmm3 ; xmm2=(20 30 21 31 22 32 23 33) 138 punpckhwd xmm5,xmm3 ; xmm5=(24 34 25 35 26 36 27 37) 143 movdqa xmm3, XMMWORD [XMMBLOCK(7,0,edx,SIZEOF_DCTELEM)] 146 ; xmm7=( 5 13 21 29 37 45 53 61), xmm3=( 7 15 23 31 39 47 55 63) 155 punpcklwd xmm1,xmm3 ; xmm1=(60 70 61 71 62 72 63 73) 156 punpckhwd xmm5,xmm3 ; xmm5=(64 74 65 75 66 76 67 77) 161 movdqa xmm3,xmm2 ; transpose coefficients(phase 2) 163 punpckhdq xmm3,xmm [all...] |
H A D | jidctfst-sse2-64.asm | 146 pshufd xmm3,xmm7,0xAA ; xmm3=col6=(06 06 06 06 06 06 06 06) 162 movdqa xmm3, XMMWORD [XMMBLOCK(6,0,rsi,SIZEOF_JCOEF)] 164 pmullw xmm3, XMMWORD [XMMBLOCK(6,0,rdx,SIZEOF_IFAST_MULT_TYPE)] 169 psubw xmm1,xmm3 171 paddw xmm5,xmm3 ; xmm5=tmp13 190 movdqa xmm3, XMMWORD [XMMBLOCK(3,0,rsi,SIZEOF_JCOEF)] 192 pmullw xmm3, XMMWORD [XMMBLOCK(3,0,rdx,SIZEOF_IFAST_MULT_TYPE)] 201 psubw xmm5,xmm3 ; xmm5=z10 203 paddw xmm0,xmm3 ; xmm [all...] |
H A D | jidctfst-sse2.asm | 152 pshufd xmm3,xmm7,0xAA ; xmm3=col6=(06 06 06 06 06 06 06 06) 169 movdqa xmm3, XMMWORD [XMMBLOCK(6,0,esi,SIZEOF_JCOEF)] 171 pmullw xmm3, XMMWORD [XMMBLOCK(6,0,edx,SIZEOF_IFAST_MULT_TYPE)] 176 psubw xmm1,xmm3 178 paddw xmm5,xmm3 ; xmm5=tmp13 197 movdqa xmm3, XMMWORD [XMMBLOCK(3,0,esi,SIZEOF_JCOEF)] 199 pmullw xmm3, XMMWORD [XMMBLOCK(3,0,edx,SIZEOF_IFAST_MULT_TYPE)] 208 psubw xmm5,xmm3 ; xmm5=z10 210 paddw xmm0,xmm3 ; xmm [all...] |
H A D | jidctflt-sse.asm | 128 cvtpi2ps xmm3,mm1 ; xmm3=(02 03 ** **) 130 movlhps xmm0,xmm3 ; xmm0=in0=(00 01 02 03) 136 movaps xmm3,xmm0 141 shufps xmm3,xmm3,0xFF ; xmm3=(03 03 03 03) 149 movaps XMMWORD [XMMBLOCK(3,0,edi,SIZEOF_FAST_FLOAT)], xmm3 150 movaps XMMWORD [XMMBLOCK(3,1,edi,SIZEOF_FAST_FLOAT)], xmm3 189 cvtpi2ps xmm3,mm [all...] |
/external/boringssl/linux-x86/crypto/chacha/ |
H A D | chacha-x86.S | 399 movdqu (%ebx),%xmm3 407 pshufd $0,%xmm3,%xmm0 408 pshufd $85,%xmm3,%xmm1 409 pshufd $170,%xmm3,%xmm2 410 pshufd $255,%xmm3,%xmm3 420 movdqa %xmm3,112(%ebp) 421 movdqu 16(%edx),%xmm3 428 pshufd $0,%xmm3,%xmm0 429 pshufd $85,%xmm3, [all...] |
/external/boringssl/mac-x86/crypto/chacha/ |
H A D | chacha-x86.S | 396 movdqu (%ebx),%xmm3 404 pshufd $0,%xmm3,%xmm0 405 pshufd $85,%xmm3,%xmm1 406 pshufd $170,%xmm3,%xmm2 407 pshufd $255,%xmm3,%xmm3 417 movdqa %xmm3,112(%ebp) 418 movdqu 16(%edx),%xmm3 425 pshufd $0,%xmm3,%xmm0 426 pshufd $85,%xmm3, [all...] |
/external/libvpx/libvpx/vp8/encoder/x86/ |
H A D | dct_sse2.asm | 73 movq xmm3, MMWORD PTR[input+ pitch] ;33 32 31 30 76 punpcklqdq xmm1, xmm3 ;33 32 31 30 23 22 21 20 87 movdqa xmm3, xmm0 89 psubw xmm3, xmm1 ;c1 d1 c1 d1 c1 d1 c1 d1 91 psllw xmm3, 3 ;c1 <<= 3 d1 <<= 3 96 movdqa xmm4, xmm3 97 pmaddwd xmm3, XMMWORD PTR[GLOBAL(_5352_2217)] ;c1*2217 + d1*5352 100 paddd xmm3, XMMWORD PTR[GLOBAL(_14500)] 102 psrad xmm3, 12 ;(c1 * 2217 + d1 * 5352 + 14500)>>12 106 packssdw xmm3, xmm [all...] |
/external/boringssl/linux-x86_64/crypto/modes/ |
H A D | ghash-x86_64.S | 678 movdqa %xmm2,%xmm3 681 psrlq $63,%xmm3 683 pslldq $8,%xmm3 684 por %xmm3,%xmm2 695 pshufd $78,%xmm0,%xmm3 696 pxor %xmm0,%xmm3 700 pxor %xmm0,%xmm3 701 pxor %xmm1,%xmm3 703 movdqa %xmm3,%xmm4 704 psrldq $8,%xmm3 [all...] |
/external/boringssl/mac-x86_64/crypto/modes/ |
H A D | ghash-x86_64.S | 677 movdqa %xmm2,%xmm3 680 psrlq $63,%xmm3 682 pslldq $8,%xmm3 683 por %xmm3,%xmm2 694 pshufd $78,%xmm0,%xmm3 695 pxor %xmm0,%xmm3 699 pxor %xmm0,%xmm3 700 pxor %xmm1,%xmm3 702 movdqa %xmm3,%xmm4 703 psrldq $8,%xmm3 [all...] |
/external/libvpx/libvpx/vp8/common/x86/ |
H A D | idctllm_sse2.asm | 62 movq xmm3, [rax+rcx] 67 punpcklbw xmm3, xmm5 74 paddw xmm3, xmm4 80 packuswb xmm3, xmm5 89 movq [rax + rdx], xmm3 131 movdqa xmm3, [rax+48] 143 pmullw xmm3, [rdx+16] 155 punpckldq xmm2, xmm3 156 punpckhdq xmm4, xmm3 159 pshufd xmm3, xmm [all...] |
H A D | subpixel_sse2.asm | 60 movq xmm3, MMWORD PTR [rsi - 2] 66 por xmm1, xmm3 74 punpcklbw xmm3, xmm0 ; xx05 xx04 xx03 xx02 xx01 xx01 xx-1 xx-2 77 pmullw xmm3, XMMWORD PTR [rdx] ; x[-2] * H[-2]; Tap 1 107 paddsw xmm4, xmm3 181 movq xmm3, MMWORD PTR [rsi - 2] 195 por xmm1, xmm3 203 punpcklbw xmm3, xmm0 ; xx05 xx04 xx03 xx02 xx01 xx01 xx-1 xx-2 206 pmullw xmm3, XMMWORD PTR [rdx] ; x[-2] * H[-2]; Tap 1 235 paddsw xmm4, xmm3 [all...] |
H A D | loopfilter_block_sse2_x86_64.asm | 202 movdqa xmm3, i3 207 LF_FILTER_HEV_MASK xmm0, xmm1, xmm2, xmm3, xmm4, xmm8, xmm9, xmm10 211 movdqa xmm3, i4 213 LF_FILTER xmm1, xmm2, xmm3, xmm8, xmm0, xmm4 218 movdqa i4, xmm3 227 LF_FILTER_HEV_MASK xmm3, xmm8, xmm0, xmm1, xmm2, xmm4, xmm10, xmm11, xmm9 233 LF_FILTER xmm0, xmm1, xmm4, xmm8, xmm3, xmm2 244 movdqa xmm3, i13 247 LF_FILTER_HEV_MASK xmm4, xmm8, xmm0, xmm1, xmm2, xmm3, xmm9, xmm11, xmm10 251 movdqa xmm3, i1 [all...] |
/external/compiler-rt/lib/builtins/i386/ |
H A D | floatundisf.S | 90 movd %edx, %xmm3 93 psrlq %xmm3, %xmm0 // (big input) ? input >> 12 : input 98 pslld $23, %xmm3 99 paddd %xmm3, %xmm0 // (float)input
|
/external/boringssl/win-x86/crypto/chacha/ |
H A D | chacha-x86.asm | 407 movdqu xmm3,[ebx] 415 pshufd xmm0,xmm3,0 416 pshufd xmm1,xmm3,85 417 pshufd xmm2,xmm3,170 418 pshufd xmm3,xmm3,255 428 movdqa [112+ebp],xmm3 429 movdqu xmm3,[16+edx] 436 pshufd xmm0,xmm3,0 437 pshufd xmm1,xmm3,8 [all...] |
/external/libvpx/libvpx/vpx_dsp/x86/ |
H A D | sad_sse4.asm | 18 movq xmm3, MMWORD PTR [rdi+8] 20 punpcklqdq xmm1, xmm3 21 punpcklqdq xmm3, xmm2 29 movdqa xmm4, xmm3 30 mpsadbw xmm3, xmm0, 0x0 34 paddw xmm1, xmm3 39 movq xmm3, MMWORD PTR [rdi+8] 41 punpcklqdq xmm5, xmm3 42 punpcklqdq xmm3, xmm2 50 movdqa xmm4, xmm3 [all...] |