/external/libjpeg-turbo/simd/ |
jquanti-sse2.asm | 69 movq xmm3, XMM_MMWORD [edx+eax*SIZEOF_JSAMPLE] ; xmm3=(OPQRSTUV) 76 punpcklbw xmm3,xmm6 ; xmm3=(OPQRSTUV) 78 paddw xmm3,xmm7 83 movdqa XMMWORD [XMMBLOCK(3,0,edi,SIZEOF_DCTELEM)], xmm3 144 movdqa xmm3,xmm7 152 pxor xmm3,xmm7 156 psubw xmm3,xmm7 ; if (xmm3 < 0) xmm3 = -xmm3 [all...] |
jidctfst-sse2-64.asm | 147 pshufd xmm3,xmm7,0xAA ; xmm3=col6=(06 06 06 06 06 06 06 06) 163 movdqa xmm3, XMMWORD [XMMBLOCK(6,0,rsi,SIZEOF_JCOEF)] 165 pmullw xmm3, XMMWORD [XMMBLOCK(6,0,rdx,SIZEOF_IFAST_MULT_TYPE)] 170 psubw xmm1,xmm3 172 paddw xmm5,xmm3 ; xmm5=tmp13 191 movdqa xmm3, XMMWORD [XMMBLOCK(3,0,rsi,SIZEOF_JCOEF)] 193 pmullw xmm3, XMMWORD [XMMBLOCK(3,0,rdx,SIZEOF_IFAST_MULT_TYPE)] 202 psubw xmm5,xmm3 ; xmm5=z10 204 paddw xmm0,xmm3 ; xmm0=z1 [all...] |
jidctfst-sse2.asm | 153 pshufd xmm3,xmm7,0xAA ; xmm3=col6=(06 06 06 06 06 06 06 06) 170 movdqa xmm3, XMMWORD [XMMBLOCK(6,0,esi,SIZEOF_JCOEF)] 172 pmullw xmm3, XMMWORD [XMMBLOCK(6,0,edx,SIZEOF_IFAST_MULT_TYPE)] 177 psubw xmm1,xmm3 179 paddw xmm5,xmm3 ; xmm5=tmp13 198 movdqa xmm3, XMMWORD [XMMBLOCK(3,0,esi,SIZEOF_JCOEF)] 200 pmullw xmm3, XMMWORD [XMMBLOCK(3,0,edx,SIZEOF_IFAST_MULT_TYPE)] 209 psubw xmm5,xmm3 ; xmm5=z10 211 paddw xmm0,xmm3 ; xmm0=z1 [all...] |
jquantf-sse2-64.asm | 71 punpcklwd xmm3,xmm1 ; xmm3=(***8***9***A***B) 78 psrad xmm3,(DWORD_BIT-BYTE_BIT) ; xmm3=(89AB) 80 cvtdq2ps xmm3,xmm3 ; xmm3=(89AB) 85 movaps XMMWORD [XMMBLOCK(1,0,rdi,SIZEOF_FAST_FLOAT)], xmm3 131 movaps xmm3, XMMWORD [XMMBLOCK(1,1,rsi,SIZEOF_FAST_FLOAT)] 133 mulps xmm3, XMMWORD [XMMBLOCK(1,1,rdx,SIZEOF_FAST_FLOAT) [all...] |
jquantf-sse2.asm | 73 punpcklwd xmm3,xmm1 ; xmm3=(***8***9***A***B) 80 psrad xmm3,(DWORD_BIT-BYTE_BIT) ; xmm3=(89AB) 82 cvtdq2ps xmm3,xmm3 ; xmm3=(89AB) 87 movaps XMMWORD [XMMBLOCK(1,0,edi,SIZEOF_FAST_FLOAT)], xmm3 140 movaps xmm3, XMMWORD [XMMBLOCK(1,1,esi,SIZEOF_FAST_FLOAT)] 142 mulps xmm3, XMMWORD [XMMBLOCK(1,1,edx,SIZEOF_FAST_FLOAT) [all...] |
/external/libvpx/libvpx/vpx_dsp/x86/ |
sad_ssse3.asm | 28 lddqu xmm3, XMMWORD PTR [rdi+2] 32 psadbw xmm3, xmm0 36 paddw xmm7, xmm3 41 lddqu xmm3, XMMWORD PTR [rdi+rdx+2] 48 psadbw xmm3, xmm0 52 paddw xmm7, xmm3 75 movdqa xmm3, XMMWORD PTR [rdi+16] 77 movdqa xmm1, xmm3 80 movdqa xmm2, xmm3 83 palignr xmm3, xmm4, (%2+2 [all...] |
vpx_high_subpixel_bilinear_sse2.asm | 19 movdqa xmm3, [rdx] ;load filters 20 pshuflw xmm4, xmm3, 11111111b ;k3 21 psrldq xmm3, 8 22 pshuflw xmm3, xmm3, 0b ;k4 23 punpcklwd xmm4, xmm3 ;k3k4 25 movq xmm3, rcx ;rounding 26 pshufd xmm3, xmm3, 0 48 paddd xmm0, xmm3 ;roundin [all...] |
vpx_subpixel_bilinear_sse2.asm | 19 movdqa xmm3, [rdx] ;load filters 20 pshuflw xmm4, xmm3, 11111111b ;k3 21 psrldq xmm3, 8 22 pshuflw xmm3, xmm3, 0b ;k4 23 punpcklqdq xmm4, xmm3 ;k3k4 25 movq xmm3, rcx ;rounding 26 pshufd xmm3, xmm3, 0 45 paddsw xmm0, xmm3 ;roundin [all...] |
/hardware/intel/common/omx-components/videocodec/libvpx_internal/libvpx/vp8/common/x86/ |
sad_ssse3.asm | 28 lddqu xmm3, XMMWORD PTR [rdi+2] 32 psadbw xmm3, xmm0 36 paddw xmm7, xmm3 41 lddqu xmm3, XMMWORD PTR [rdi+rdx+2] 48 psadbw xmm3, xmm0 52 paddw xmm7, xmm3 75 movdqa xmm3, XMMWORD PTR [rdi+16] 77 movdqa xmm1, xmm3 80 movdqa xmm2, xmm3 83 palignr xmm3, xmm4, (%2+2 [all...] |
/hardware/intel/common/omx-components/videocodec/libvpx_internal/libvpx/vp9/encoder/x86/ |
vp9_sad_ssse3.asm | 28 lddqu xmm3, XMMWORD PTR [rdi+2] 32 psadbw xmm3, xmm0 36 paddw xmm7, xmm3 41 lddqu xmm3, XMMWORD PTR [rdi+rdx+2] 48 psadbw xmm3, xmm0 52 paddw xmm7, xmm3 75 movdqa xmm3, XMMWORD PTR [rdi+16] 77 movdqa xmm1, xmm3 80 movdqa xmm2, xmm3 83 palignr xmm3, xmm4, (%2+2 [all...] |
/external/libvpx/libvpx/vp8/common/x86/ |
recon_sse2.asm | 48 movdqu xmm3, [rsi] 56 movdqa [rdi], xmm3 77 movdqu xmm3, [rsi] 86 movdqa [rdi], xmm3 106 movdqu xmm3, [rsi+rax] 109 movdqa [rdi+rcx], xmm3
|
/external/llvm/test/CodeGen/X86/ |
vector-popcnt-512.ll | 18 ; ALL-NEXT: vmovq %rax, %xmm3 22 ; ALL-NEXT: vpunpcklqdq {{.*#+}} xmm2 = xmm2[0],xmm3[0] 27 ; ALL-NEXT: vmovq %rax, %xmm3 31 ; ALL-NEXT: vpunpcklqdq {{.*#+}} xmm2 = xmm2[0],xmm3[0] 34 ; ALL-NEXT: vmovq %rax, %xmm3 38 ; ALL-NEXT: vpunpcklqdq {{.*#+}} xmm0 = xmm0[0],xmm3[0] 67 ; ALL-NEXT: vmovd %ecx, %xmm3 68 ; ALL-NEXT: vpinsrd $1, %eax, %xmm3, %xmm3 71 ; ALL-NEXT: vpinsrd $2, %eax, %xmm3, %xmm [all...] |
bswap-vector.ll | 122 ; CHECK-NOSSSE3-NEXT: movdqa %xmm0, %xmm3 123 ; CHECK-NOSSSE3-NEXT: punpckhbw {{.*#+}} xmm3 = xmm3[8],xmm2[8],xmm3[9],xmm2[9],xmm3[10],xmm2[10],xmm3[11],xmm2[11],xmm3[12],xmm2[12],xmm3[13],xmm2[13],xmm3[14],xmm2[14],xmm3[15],xmm2[15 [all...] |
vector-lzcnt-128.ll | 515 ; SSE2-NEXT: movd %ecx, %xmm3 521 ; SSE2-NEXT: punpcklwd {{.*#+}} xmm1 = xmm1[0],xmm3[0],xmm1[1],xmm3[1],xmm1[2],xmm3[2],xmm1[3],xmm3[3] 532 ; SSE2-NEXT: movd %ecx, %xmm3 533 ; SSE2-NEXT: punpcklwd {{.*#+}} xmm3 = xmm3[0],xmm2[0],xmm3[1],xmm2[1],xmm3[2],xmm2[2],xmm3[3],xmm2[3 [all...] |
vec_minmax_uint.ll | 18 ; SSE2-NEXT: movdqa %xmm1, %xmm3 19 ; SSE2-NEXT: pxor %xmm2, %xmm3 22 ; SSE2-NEXT: pcmpgtd %xmm3, %xmm4 24 ; SSE2-NEXT: pcmpeqd %xmm3, %xmm2 27 ; SSE2-NEXT: pshufd {{.*#+}} xmm3 = xmm4[1,1,3,3] 28 ; SSE2-NEXT: por %xmm2, %xmm3 29 ; SSE2-NEXT: pand %xmm3, %xmm0 30 ; SSE2-NEXT: pandn %xmm1, %xmm3 31 ; SSE2-NEXT: por %xmm3, %xmm0 38 ; SSE41-NEXT: movdqa %xmm1, %xmm3 [all...] |
fast-isel-select-sse.ll | 12 ; CHECK-NEXT: andnps %xmm3, %xmm0 16 ; AVX-NEXT: vblendvps %xmm0, %xmm2, %xmm3, %xmm0 26 ; CHECK-NEXT: andnpd %xmm3, %xmm0 30 ; AVX-NEXT: vblendvpd %xmm0, %xmm2, %xmm3, %xmm0 40 ; CHECK-NEXT: andnps %xmm3, %xmm1 44 ; AVX-NEXT: vblendvps %xmm0, %xmm2, %xmm3, %xmm0 54 ; CHECK-NEXT: andnpd %xmm3, %xmm1 58 ; AVX-NEXT: vblendvpd %xmm0, %xmm2, %xmm3, %xmm0 68 ; CHECK-NEXT: andnps %xmm3, %xmm1 72 ; AVX-NEXT: vblendvps %xmm0, %xmm2, %xmm3, %xmm [all...] |
/external/v8/test/cctest/ |
test-assembler-x64.cc | 766 __ movaps(xmm3, xmm0); 767 __ mulsd(xmm3, xmm1); 768 __ addsd(xmm3, xmm2); // Expected result in xmm3 775 __ ucomisd(xmm8, xmm3); 781 __ ucomisd(xmm8, xmm3); 787 __ ucomisd(xmm8, xmm3); 795 __ ucomisd(xmm8, xmm3); 802 __ ucomisd(xmm8, xmm3); 809 __ ucomisd(xmm8, xmm3); [all...] |
/hardware/intel/common/omx-components/videocodec/libvpx_internal/libvpx/vp9/common/x86/ |
vp9_subpixel_bilinear_sse2.asm | 19 movdqa xmm3, [rdx] ;load filters 20 pshuflw xmm4, xmm3, 11111111b ;k3 21 psrldq xmm3, 8 22 pshuflw xmm3, xmm3, 0b ;k4 23 punpcklqdq xmm4, xmm3 ;k3k4 25 movq xmm3, rcx ;rounding 26 pshufd xmm3, xmm3, 0 45 paddsw xmm0, xmm3 ;roundin [all...] |
/external/libyuv/files/source/ |
compare_win.cc | 38 movdqa xmm3, xmm1 // abs trick local 40 psubusb xmm2, xmm3 147 movdqa xmm3, xmm2 local 148 punpcklwd xmm3, xmm7 // src[0-3] local 149 pmulld xmm3, xmm5 local 162 paddd xmm3, xmm4 // add 16 results local 164 paddd xmm1, xmm3 189 vpmovzxbd xmm3, [eax] // src[0-3] local 192 vpmulld xmm3, xmm3, xmmword ptr kHashMul local 199 vpaddd xmm3, xmm3, xmm4 \/\/ add 16 results local [all...] |
/bionic/libc/arch-x86/atom/string/ |
ssse3-strcpy-atom.S | 283 movaps 16(%ecx, %esi), %xmm3 285 pcmpeqb %xmm3, %xmm0 296 movaps %xmm3, (%edx, %esi) 331 movaps 16(%ecx, %esi), %xmm3 333 pcmpeqb %xmm3, %xmm0 343 movaps %xmm3, (%edx, %esi) 356 movaps 32(%ecx), %xmm3 359 movaps %xmm3, %xmm6 362 pminub %xmm7, %xmm3 363 pminub %xmm2, %xmm3 [all...] |
/external/boringssl/win-x86_64/crypto/ec/ |
p256-x86_64-asm.asm | 722 pxor xmm3,xmm3 750 por xmm3,xmm10 763 movdqu XMMWORD[16+rcx],xmm3 806 pxor xmm3,xmm3 828 por xmm3,xmm10 838 movdqu XMMWORD[16+rcx],xmm3 1227 movdqu xmm3,XMMWORD[48+rsi] 1236 movdqa XMMWORD[(416+16)+rsp],xmm3 [all...] |
/external/libvpx/libvpx/third_party/libyuv/source/ |
rotate_gcc.cc | 38 "movq (%0,%3),%%xmm3 \n" 40 "punpcklbw %%xmm3,%%xmm2 \n" 41 "movdqa %%xmm2,%%xmm3 \n" 43 "palignr $0x8,%%xmm3,%%xmm3 \n" 60 "punpcklwd %%xmm3,%%xmm1 \n" 62 "movdqa %%xmm1,%%xmm3 \n" 64 "palignr $0x8,%%xmm3,%%xmm3 \n" 91 "punpckldq %%xmm7,%%xmm3 \n [all...] |
compare_win.cc | 37 movdqa xmm3, xmm1 // abs trick local 39 psubusb xmm2, xmm3 131 // 44: 66 0F 38 40 DD pmulld xmm3,xmm5 155 movdqa xmm3, xmm2 local 156 punpcklwd xmm3, xmm7 // src[0-3] local 157 pmulld(0xdd) // pmulld xmm3, xmm5 170 paddd xmm3, xmm4 // add 16 results local 172 paddd xmm1, xmm3 198 vpmovzxbd xmm3, dword ptr [eax] // src[0-3] local 201 pmulld xmm3, kHashMul local 208 paddd xmm3, xmm4 \/\/ add 16 results local [all...] |
/external/boringssl/linux-x86/crypto/aes/ |
aesni-x86.S | 68 pxor %xmm0,%xmm3 96 pxor %xmm0,%xmm3 124 pxor %xmm0,%xmm3 157 pxor %xmm0,%xmm3 190 pxor %xmm0,%xmm3 229 pxor %xmm0,%xmm3 268 pxor %xmm0,%xmm3 323 pxor %xmm0,%xmm3 395 movdqu 16(%esi),%xmm3 407 movups %xmm3,16(%edi [all...] |
/external/boringssl/mac-x86/crypto/aes/ |
aesni-x86.S | 63 pxor %xmm0,%xmm3 89 pxor %xmm0,%xmm3 115 pxor %xmm0,%xmm3 146 pxor %xmm0,%xmm3 177 pxor %xmm0,%xmm3 214 pxor %xmm0,%xmm3 251 pxor %xmm0,%xmm3 304 pxor %xmm0,%xmm3 374 movdqu 16(%esi),%xmm3 386 movups %xmm3,16(%edi [all...] |