Home | History | Annotate | Download | only in source

Lines Matching full:xmm2

253 movdqa xmm2, xmm3
254 palignr xmm2, xmm1, 8 // xmm2 = { xmm3[0:3] xmm1[8:15]}
255 pshufb xmm2, xmm4
256 por xmm2, xmm5
259 movdqa [edx + 32], xmm2
293 movdqa xmm2, xmm3
294 palignr xmm2, xmm1, 8 // xmm2 = { xmm3[0:3] xmm1[8:15]}
295 pshufb xmm2, xmm4
296 por xmm2, xmm5
299 movdqa [edx + 32], xmm2
351 movdqa xmm2, xmm0
353 psllw xmm2, 11 // B in upper 5 bits
355 pmulhuw xmm2, xmm5 // * (256 + 8)
357 por xmm1, xmm2 // RB
361 movdqa xmm2, xmm1
363 punpckhbw xmm2, xmm0
365 movdqa [eax * 2 + edx + 16], xmm2 // store next 4 pixels of ARGB
401 movdqa xmm2, xmm0
403 psllw xmm2, 11 // B in upper 5 bits
405 pmulhuw xmm2, xmm5 // * (256 + 8)
408 por xmm1, xmm2 // RB
409 movdqa xmm2, xmm0
411 psraw xmm2, 8 // A
413 pand xmm2, xmm7
414 por xmm0, xmm2 // AG
415 movdqa xmm2, xmm1
417 punpckhbw xmm2, xmm0
419 movdqa [eax * 2 + edx + 16], xmm2 // store next 4 pixels of ARGB
446 movdqa xmm2, xmm0
448 pand xmm2, xmm5 // mask high nibbles
450 movdqa xmm3, xmm2
454 por xmm2, xmm3
456 punpcklbw xmm0, xmm2
457 punpckhbw xmm1, xmm2
479 movdqa xmm2, [eax + 32]
484 pshufb xmm2, xmm6
489 movdqa xmm5, xmm2 // 8 bytes from 2 for 1
494 psrldq xmm2, 8 // 4 bytes from 2
496 por xmm2, xmm3 // 12 bytes from 3 for 2
498 movdqa [edx + 32], xmm2 // store 2
518 movdqa xmm2, [eax + 32]
523 pshufb xmm2, xmm6
528 movdqa xmm5, xmm2 // 8 bytes from 2 for 1
533 psrldq xmm2, 8 // 4 bytes from 2
535 por xmm2, xmm3 // 12 bytes from 3 for 2
537 movdqa [edx + 32], xmm2 // store 2
563 movdqa xmm2, xmm0 // G
566 psrld xmm2, 5 // G
569 pand xmm2, xmm4 // G
571 por xmm1, xmm2 // BG
603 movdqa xmm2, xmm0 // G
607 psrld xmm2, 6 // G
611 pand xmm2, xmm5 // G
614 por xmm2, xmm3 // GR
615 por xmm0, xmm2 // BGRA
670 movdqa xmm2, [eax + 32]
674 pmaddubsw xmm2, xmm4
678 phaddw xmm2, xmm3
680 psrlw xmm2, 7
681 packuswb xmm0, xmm2
704 movdqu xmm2, [eax + 32]
708 pmaddubsw xmm2, xmm4
712 phaddw xmm2, xmm3
714 psrlw xmm2, 7
715 packuswb xmm0, xmm2
738 movdqa xmm2, [eax + 32]
742 pmaddubsw xmm2, xmm4
746 phaddw xmm2, xmm3
748 psrlw xmm2, 7
749 packuswb xmm0, xmm2
772 movdqu xmm2, [eax + 32]
776 pmaddubsw xmm2, xmm4
780 phaddw xmm2, xmm3
782 psrlw xmm2, 7
783 packuswb xmm0, xmm2
806 movdqa xmm2, [eax + 32]
810 pmaddubsw xmm2, xmm4
814 phaddw xmm2, xmm3
816 psrlw xmm2, 7
817 packuswb xmm0, xmm2
840 movdqu xmm2, [eax + 32]
844 pmaddubsw xmm2, xmm4
848 phaddw xmm2, xmm3
850 psrlw xmm2, 7
851 packuswb xmm0, xmm2
874 movdqa xmm2, [eax + 32]
878 pmaddubsw xmm2, xmm4
882 phaddw xmm2, xmm3
884 psrlw xmm2, 7
885 packuswb xmm0, xmm2
908 movdqu xmm2, [eax + 32]
912 pmaddubsw xmm2, xmm4
916 phaddw xmm2, xmm3
918 psrlw xmm2, 7
919 packuswb xmm0, xmm2
950 movdqa xmm2, [eax + 32]
954 pavgb xmm2, [eax + esi + 32]
961 movdqa xmm4, xmm2
962 shufps xmm2, xmm3, 0x88
964 pavgb xmm2, xmm4
970 movdqa xmm3, xmm2
972 pmaddubsw xmm2, xmm7
975 phaddw xmm0, xmm2
1016 movdqu xmm2, [eax + 32]
1023 pavgb xmm2, xmm4
1031 movdqa xmm4, xmm2
1032 shufps xmm2, xmm3, 0x88
1034 pavgb xmm2, xmm4
1040 movdqa xmm3, xmm2
1042 pmaddubsw xmm2, xmm7
1045 phaddw xmm0, xmm2
1086 movdqa xmm2, [eax + 32]
1090 pavgb xmm2, [eax + esi + 32]
1097 movdqa xmm4, xmm2
1098 shufps xmm2, xmm3, 0x88
1100 pavgb xmm2, xmm4
1106 movdqa xmm3, xmm2
1108 pmaddubsw xmm2, xmm7
1111 phaddw xmm0, xmm2
1152 movdqu xmm2, [eax + 32]
1159 pavgb xmm2, xmm4
1167 movdqa xmm4, xmm2
1168 shufps xmm2, xmm3, 0x88
1170 pavgb xmm2, xmm4
1176 movdqa xmm3, xmm2
1178 pmaddubsw xmm2, xmm7
1181 phaddw xmm0, xmm2
1222 movdqa xmm2, [eax + 32]
1226 pavgb xmm2, [eax + esi + 32]
1233 movdqa xmm4, xmm2
1234 shufps xmm2, xmm3, 0x88
1236 pavgb xmm2, xmm4
1242 movdqa xmm3, xmm2
1244 pmaddubsw xmm2, xmm7
1247 phaddw xmm0, xmm2
1288 movdqu xmm2, [eax + 32]
1295 pavgb xmm2, xmm4
1303 movdqa xmm4, xmm2
1304 shufps xmm2, xmm3, 0x88
1306 pavgb xmm2, xmm4
1312 movdqa xmm3, xmm2
1314 pmaddubsw xmm2, xmm7
1317 phaddw xmm0, xmm2
1358 movdqa xmm2, [eax + 32]
1362 pavgb xmm2, [eax + esi + 32]
1369 movdqa xmm4, xmm2
1370 shufps xmm2, xmm3, 0x88
1372 pavgb xmm2, xmm4
1378 movdqa xmm3, xmm2
1380 pmaddubsw xmm2, xmm7
1383 phaddw xmm0, xmm2
1424 movdqu xmm2, [eax + 32]
1431 pavgb xmm2, xmm4
1439 movdqa xmm4, xmm2
1440 shufps xmm2, xmm3, 0x88
1442 pavgb xmm2, xmm4
1448 movdqa xmm3, xmm2
1450 pmaddubsw xmm2, xmm7
1453 phaddw xmm0, xmm2
1562 __asm movdqa xmm2, xmm0 \
1565 __asm pmaddubsw xmm2, kUVToR /* scale R UV */ \
1568 __asm psubw xmm2, kUVBiasR \
1577 __asm paddsw xmm2, xmm3 /* R += Y */ \
1580 __asm psraw xmm2, 6 \
1583 __asm packuswb xmm2, xmm2 /* R */ \
1590 __asm movdqa xmm2, xmm0 \
1593 __asm pmaddubsw xmm2, kVUToR /* scale R UV */ \
1596 __asm psubw xmm2, kUVBiasR \
1605 __asm paddsw xmm2, xmm3 /* R += Y */ \
1608 __asm psraw xmm2, 6 \
1611 __asm packuswb xmm2, xmm2 /* R */ \
1641 punpcklbw xmm2, xmm5 // RA
1643 punpcklwd xmm0, xmm2 // BGRA first 4 pixels
1644 punpckhwd xmm1, xmm2 // BGRA next 4 pixels
1684 punpcklbw xmm2, xmm5 // RA
1686 punpcklwd xmm0, xmm2 // BGRA first 4 pixels
1687 punpckhwd xmm1, xmm2 // BGRA next 4 pixels
1728 punpcklbw xmm2, xmm5 // RA
1730 punpcklwd xmm0, xmm2 // BGRA first 4 pixels
1731 punpckhwd xmm1, xmm2 // BGRA next 4 pixels
1767 punpcklbw xmm2, xmm5 // RA
1769 punpcklwd xmm0, xmm2 // BGRA first 4 pixels
1770 punpckhwd xmm1, xmm2 // BGRA next 4 pixels
1805 punpcklbw xmm2, xmm5 // RA
1807 punpcklwd xmm0, xmm2 // BGRA first 4 pixels
1808 punpckhwd xmm1, xmm2 // BGRA next 4 pixels
1847 punpcklbw xmm2, xmm5 // RA
1849 punpcklwd xmm0, xmm2 // BGRA first 4 pixels
1850 punpckhwd xmm1, xmm2 // BGRA next 4 pixels
1890 punpcklbw xmm2, xmm5 // RA
1892 punpcklwd xmm0, xmm2 // BGRA first 4 pixels
1893 punpckhwd xmm1, xmm2 // BGRA next 4 pixels
1934 punpcklbw xmm2, xmm5 // RA
1936 punpcklwd xmm0, xmm2 // BGRA first 4 pixels
1937 punpckhwd xmm1, xmm2 // BGRA next 4 pixels
1974 punpcklbw xmm2, xmm5 // RA
1976 punpcklwd xmm0, xmm2 // BGRA first 4 pixels
1977 punpckhwd xmm1, xmm2 // BGRA next 4 pixels
2012 punpcklbw xmm2, xmm5 // RA
2014 punpcklwd xmm0, xmm2 // BGRA first 4 pixels
2015 punpckhwd xmm1, xmm2 // BGRA next 4 pixels
2052 punpcklbw xmm5, xmm2 // AR
2093 punpcklbw xmm5, xmm2 // AR
2133 punpcklbw xmm2, xmm1 // RG
2135 movdqa xmm1, xmm2
2136 punpcklwd xmm2, xmm0 // RGBA first 4 pixels
2138 movdqa [edx], xmm2
2174 punpcklbw xmm2, xmm1 // RG
2176 movdqa xmm1, xmm2
2177 punpcklwd xmm2, xmm0 // RGBA first 4 pixels
2179 movdqu [edx], xmm2
2215 punpcklbw xmm1, xmm2 // GR
2256 punpcklbw xmm1, xmm2 // GR
2287 movd xmm2,eax
2288 pshufd xmm2,xmm2,0
2300 pmulhuw xmm0, xmm2
2463 movdqa xmm2, xmm0
2468 psrlw xmm2, 8 // odd bytes
2470 packuswb xmm2, xmm3
2472 movdqa [edx + edi], xmm2
2619 movdqa xmm2, [eax + esi]
2622 pavgb xmm0, xmm2
2726 movdqu xmm2, [eax + esi]
2729 pavgb xmm0, xmm2
2831 movdqa xmm2, [eax + esi]
2834 pavgb xmm0, xmm2
2936 movdqu xmm2, [eax + esi]
2939 pavgb xmm0, xmm2
3031 movd xmm2, [esi] // _r_b
3035 pand xmm2, xmm6 // _r_b
3037 pmullw xmm2, xmm3 // _r_b * alpha
3043 psrlw xmm2, 8 // _r_b convert to 8 bits again
3044 paddusb xmm0, xmm2 // + src argb
3062 movdqu xmm2, [esi] // _r_b
3066 pand xmm2, xmm6 // _r_b
3068 pmullw xmm2, xmm3 // _r_b * alpha
3074 psrlw xmm2, 8 // _r_b convert to 8 bits again
3075 paddusb xmm0, xmm2 // + src argb
3093 movd xmm2, [esi] // _r_b
3097 pand xmm2, xmm6 // _r_b
3099 pmullw xmm2, xmm3 // _r_b * alpha
3105 psrlw xmm2, 8 // _r_b convert to 8 bits again
3106 paddusb xmm0, xmm2 // + src argb
3165 movd xmm2, [esi] // _r_b
3167 pand xmm2, xmm6 // _r_b
3169 pmullw xmm2, xmm3 // _r_b * alpha
3175 psrlw xmm2, 8 // _r_b convert to 8 bits again
3176 paddusb xmm0, xmm2 // + src argb
3199 movdqa xmm2, [esi] // _r_b
3201 pand xmm2, xmm6 // _r_b
3203 pmullw xmm2, xmm3 // _r_b * alpha
3209 psrlw xmm2, 8 // _r_b convert to 8 bits again
3210 paddusb xmm0, xmm2 // + src argb
3225 movdqu xmm2, [esi] // _r_b
3227 pand xmm2, xmm6 // _r_b
3229 pmullw xmm2, xmm3 // _r_b * alpha
3235 psrlw xmm2, 8 // _r_b convert to 8 bits again
3236 paddusb xmm0, xmm2 // + src argb
3254 movd xmm2, [esi] // _r_b
3256 pand xmm2, xmm6 // _r_b
3258 pmullw xmm2, xmm3 // _r_b * alpha
3264 psrlw xmm2, 8 // _r_b convert to 8 bits again
3265 paddusb xmm0, xmm2 // + src argb
3299 pshufhw xmm2, xmm0,0FFh // 8 alpha words
3300 pshuflw xmm2, xmm2,0FFh
3301 pmulhuw xmm0, xmm2 // rgb * a
3304 pshufhw xmm2, xmm1,0FFh // 8 alpha words
3305 pshuflw xmm2, xmm2,0FFh
3306 pmulhuw xmm1, xmm2 // rgb * a
3307 movdqa xmm2, [eax] // alphas
3309 pand xmm2, xmm4
3313 por xmm0, xmm2
3354 movdqa xmm2, [eax] // read 4 pixels
3355 punpckhbw xmm2, xmm2 // next 2 pixel rgbs
3356 pmulhuw xmm1, xmm2 // rgb * a
3357 movdqa xmm2, [eax] // mask original alpha
3358 pand xmm2, xmm3
3362 por xmm0, xmm2 // copy original alpha
3395 movd xmm2, dword ptr fixed_invtbl8[esi * 4]
3397 pshuflw xmm2, xmm2,0C0h // first 4 inv_alpha words
3399 movlhps xmm2, xmm3
3400 pmulhuw xmm0, xmm2 // rgb * a
3406 movd xmm2, dword ptr fixed_invtbl8[esi * 4]
3408 pshuflw xmm2, xmm2,0C0h // first 4 inv_alpha words
3410 movlhps xmm2, xmm3
3411 pmulhuw xmm1, xmm2 // rgb * a
3413 movdqa xmm2, [eax] // alphas
3414 pand xmm2, xmm4
3416 por xmm0, xmm2
3453 movdqa xmm2, [eax] // A
3455 psrld xmm2, 24
3457 packuswb xmm2, xmm3
3458 packuswb xmm2, xmm2 // 8 A bytes
3461 punpcklbw xmm3, xmm2 // 8 GA words
3498 movdqa xmm2, kARGBToSepiaB
3506 pmaddubsw xmm0, xmm2
3507 pmaddubsw xmm6, xmm2
3558 movd xmm2, [edx]
3561 pshufd xmm2, xmm2, 0
3569 pmaddubsw xmm0, xmm2
3570 pmaddubsw xmm6, xmm2
3665 movd xmm2, [esp + 8] /* scale */
3669 pshuflw xmm2, xmm2, 040h
3670 pshufd xmm2, xmm2, 044h
3683 pmulhuw xmm0, xmm2 // pixel * scale >> 16
3686 pmulhuw xmm1, xmm2
3739 movdqa xmm2, [eax + 32]
3745 psubd xmm2, [eax + edx * 4 + 32]
3752 psubd xmm2, [esi + 32]
3758 paddd xmm2, [esi + edx * 4 + 32]
3766 cvtdq2ps xmm2, xmm2
3768 mulps xmm2, xmm4
3772 cvtps2dq xmm2, xmm2
3775 packssdw xmm2, xmm3
3776 packuswb xmm0, xmm2
3831 movdqu xmm2, [eax] // 4 argb pixels 16 bytes.
3833 movdqa xmm4, xmm2
3835 punpcklbw xmm2, xmm1
3836 movdqa xmm3, xmm2
3837 punpcklwd xmm2, xmm1
3845 paddd xmm0, xmm2
3846 movdqa xmm2, [edx + esi] // previous row above.
3847 paddd xmm2, xmm0
3861 movdqa [edx], xmm2
3877 movd xmm2, dword ptr [eax] // 1 argb pixel 4 bytes.
3879 punpcklbw xmm2, xmm1
3880 punpcklwd xmm2, xmm1
3881 paddd xmm0, xmm2
3882 movdqu xmm2, [edx + esi]
3883 paddd xmm2, xmm0
3884 movdqu [edx], xmm2
3904 movd xmm2, [esp + 16] // value
3906 punpcklbw xmm2, xmm2
3907 punpcklqdq xmm2, xmm2
3915 pmulhuw xmm0, xmm2 // argb * value
3916 pmulhuw xmm1, xmm2 // argb * value
3943 movq xmm2, qword ptr [ecx] // uv
3955 movdqa xmm0, xmm2 // x0, y0, x1, y1
3957 movlhps xmm2, xmm0
3960 movdqa xmm3, xmm2 // x2, y2, x3, y3
3967 cvttps2dq xmm0, xmm2 // x, y float to int first 2
3978 addps xmm2, xmm4 // x, y += dx, dy first 2
3999 cvttps2dq xmm0, xmm2 // x, y float to int
4002 addps xmm2, xmm7 // x, y += dx, dy
4047 movdqa xmm2, [esi + edx]
4049 punpcklbw xmm0, xmm2
4050 punpckhbw xmm1, xmm2