Home | History | Annotate | Download | only in source

Lines Matching full:xmm3

251     movdqu    xmm3, [eax + 32]
253 movdqa xmm2, xmm3
254 palignr xmm2, xmm1, 8 // xmm2 = { xmm3[0:3] xmm1[8:15]}
257 palignr xmm1, xmm0, 12 // xmm1 = { xmm3[0:7] xmm0[12:15]}
264 palignr xmm3, xmm3, 4 // xmm3 = { xmm3[4:15]}
265 pshufb xmm3, xmm4
267 por xmm3, xmm5
269 movdqa [edx + 48], xmm3
291 movdqu xmm3, [eax + 32]
293 movdqa xmm2, xmm3
294 palignr xmm2, xmm1, 8 // xmm2 = { xmm3[0:3] xmm1[8:15]}
297 palignr xmm1, xmm0, 12 // xmm1 = { xmm3[0:7] xmm0[12:15]}
304 palignr xmm3, xmm3, 4 // xmm3 = { xmm3[4:15]}
305 pshufb xmm3, xmm4
307 por xmm3, xmm5
309 movdqa [edx + 48], xmm3
333 pcmpeqb xmm3, xmm3 // generate mask 0xf800f800 for Red
334 psllw xmm3, 11
352 pand xmm1, xmm3 // R in upper 5 bits
384 pcmpeqb xmm3, xmm3 // generate mask 0xf800f800 for Red
385 psllw xmm3, 11
386 movdqa xmm4, xmm3 // generate mask 0x03e003e0 for Green
404 pand xmm1, xmm3
450 movdqa xmm3, xmm2
452 psrlw xmm3, 4
454 por xmm2, xmm3
480 movdqa xmm3, [eax + 48]
485 pshufb xmm3, xmm6
495 pslldq xmm3, 4 // 12 bytes from 3 for 2
496 por xmm2, xmm3 // 12 bytes from 3 for 2
519 movdqa xmm3, [eax + 48]
524 pshufb xmm3, xmm6
534 pslldq xmm3, 4 // 12 bytes from 3 for 2
535 por xmm2, xmm3 // 12 bytes from 3 for 2
551 pcmpeqb xmm3, xmm3 // generate mask 0x0000001f
552 psrld xmm3, 27
568 pand xmm1, xmm3 // B
604 movdqa xmm3, xmm0 // R
608 psrld xmm3, 9 // R
612 pand xmm3, xmm6 // R
614 por xmm2, xmm3 // GR
634 movdqa xmm3, xmm4 // generate mask 0x00f000f0
635 psrlw xmm3, 8
641 pand xmm0, xmm3 // low nibble
671 movdqa xmm3, [eax + 48]
675 pmaddubsw xmm3, xmm4
678 phaddw xmm2, xmm3
705 movdqu xmm3, [eax + 48]
709 pmaddubsw xmm3, xmm4
712 phaddw xmm2, xmm3
739 movdqa xmm3, [eax + 48]
743 pmaddubsw xmm3, xmm4
746 phaddw xmm2, xmm3
773 movdqu xmm3, [eax + 48]
777 pmaddubsw xmm3, xmm4
780 phaddw xmm2, xmm3
807 movdqa xmm3, [eax + 48]
811 pmaddubsw xmm3, xmm4
814 phaddw xmm2, xmm3
841 movdqu xmm3, [eax + 48]
845 pmaddubsw xmm3, xmm4
848 phaddw xmm2, xmm3
875 movdqa xmm3, [eax + 48]
879 pmaddubsw xmm3, xmm4
882 phaddw xmm2, xmm3
909 movdqu xmm3, [eax + 48]
913 pmaddubsw xmm3, xmm4
916 phaddw xmm2, xmm3
951 movdqa xmm3, [eax + 48]
955 pavgb xmm3, [eax + esi + 48]
962 shufps xmm2, xmm3, 0x88
963 shufps xmm4, xmm3, 0xdd
970 movdqa xmm3, xmm2
974 pmaddubsw xmm3, xmm6
976 phaddw xmm1, xmm3
1017 movdqu xmm3, [eax + 48]
1025 pavgb xmm3, xmm4
1032 shufps xmm2, xmm3, 0x88
1033 shufps xmm4, xmm3, 0xdd
1040 movdqa xmm3, xmm2
1044 pmaddubsw xmm3, xmm6
1046 phaddw xmm1, xmm3
1087 movdqa xmm3, [eax + 48]
1091 pavgb xmm3, [eax + esi + 48]
1098 shufps xmm2, xmm3, 0x88
1099 shufps xmm4, xmm3, 0xdd
1106 movdqa xmm3, xmm2
1110 pmaddubsw xmm3, xmm6
1112 phaddw xmm1, xmm3
1153 movdqu xmm3, [eax + 48]
1161 pavgb xmm3, xmm4
1168 shufps xmm2, xmm3, 0x88
1169 shufps xmm4, xmm3, 0xdd
1176 movdqa xmm3, xmm2
1180 pmaddubsw xmm3, xmm6
1182 phaddw xmm1, xmm3
1223 movdqa xmm3, [eax + 48]
1227 pavgb xmm3, [eax + esi + 48]
1234 shufps xmm2, xmm3, 0x88
1235 shufps xmm4, xmm3, 0xdd
1242 movdqa xmm3, xmm2
1246 pmaddubsw xmm3, xmm6
1248 phaddw xmm1, xmm3
1289 movdqu xmm3, [eax + 48]
1297 pavgb xmm3, xmm4
1304 shufps xmm2, xmm3, 0x88
1305 shufps xmm4, xmm3, 0xdd
1312 movdqa xmm3, xmm2
1316 pmaddubsw xmm3, xmm6
1318 phaddw xmm1, xmm3
1359 movdqa xmm3, [eax + 48]
1363 pavgb xmm3, [eax + esi + 48]
1370 shufps xmm2, xmm3, 0x88
1371 shufps xmm4, xmm3, 0xdd
1378 movdqa xmm3, xmm2
1382 pmaddubsw xmm3, xmm6
1384 phaddw xmm1, xmm3
1425 movdqu xmm3, [eax + 48]
1433 pavgb xmm3, xmm4
1440 shufps xmm2, xmm3, 0x88
1441 shufps xmm4, xmm3, 0xdd
1448 movdqa xmm3, xmm2
1452 pmaddubsw xmm3, xmm6
1454 phaddw xmm1, xmm3
1570 __asm movq xmm3, qword ptr [eax] /* NOLINT */ \
1572 __asm punpcklbw xmm3, xmm4 \
1573 __asm psubsw xmm3, kYSub16 \
1574 __asm pmullw xmm3, kYToRgb \
1575 __asm paddsw xmm0, xmm3 /* B += Y */ \
1576 __asm paddsw xmm1, xmm3 /* G += Y */ \
1577 __asm paddsw xmm2, xmm3 /* R += Y */ \
1598 __asm movq xmm3, qword ptr [eax] /* NOLINT */ \
1600 __asm punpcklbw xmm3, xmm4 \
1601 __asm psubsw xmm3, kYSub16 \
1602 __asm pmullw xmm3, kYToRgb \
1603 __asm paddsw xmm0, xmm3 /* B += Y */ \
1604 __asm paddsw xmm1, xmm3 /* G += Y */ \
1605 __asm paddsw xmm2, xmm3 /* R += Y */ \
2284 movd xmm3,eax
2285 pshufd xmm3,xmm3,0
2299 psubusw xmm0, xmm3
2464 movdqa xmm3, xmm1
2469 psrlw xmm3, 8
2470 packuswb xmm2, xmm3
2620 movdqa xmm3, [eax + esi + 16]
2623 pavgb xmm1, xmm3
2727 movdqu xmm3, [eax + esi + 16]
2730 pavgb xmm1, xmm3
2832 movdqa xmm3, [eax + esi + 16]
2835 pavgb xmm1, xmm3
2937 movdqu xmm3, [eax + esi + 16]
2940 pavgb xmm1, xmm3
3027 movd xmm3, [eax]
3029 movdqa xmm0, xmm3 // src argb
3030 pxor xmm3, xmm4 // ~alpha
3032 psrlw xmm3, 8 // alpha
3033 pshufhw xmm3, xmm3,0F5h // 8 alpha words
3034 pshuflw xmm3, xmm3,0F5h
3036 paddw xmm3, xmm7 // 256 - alpha
3037 pmullw xmm2, xmm3 // _r_b * alpha
3042 pmullw xmm1, xmm3 // _a_g * alpha
3058 movdqu xmm3, [eax] // src argb
3060 movdqa xmm0, xmm3 // src argb
3061 pxor xmm3, xmm4 // ~alpha
3063 psrlw xmm3, 8 // alpha
3064 pshufhw xmm3, xmm3,0F5h // 8 alpha words
3065 pshuflw xmm3, xmm3,0F5h
3067 paddw xmm3, xmm7 // 256 - alpha
3068 pmullw xmm2, xmm3 // _r_b * alpha
3073 pmullw xmm1, xmm3 // _a_g * alpha
3089 movd xmm3, [eax] // src argb
3091 movdqa xmm0, xmm3 // src argb
3092 pxor xmm3, xmm4 // ~alpha
3094 psrlw xmm3, 8 // alpha
3095 pshufhw xmm3, xmm3,0F5h // 8 alpha words
3096 pshuflw xmm3, xmm3,0F5h
3098 paddw xmm3, xmm7 // 256 - alpha
3099 pmullw xmm2, xmm3 // _r_b * alpha
3104 pmullw xmm1, xmm3 // _a_g * alpha
3128 // psrlw xmm3, 8 // alpha
3129 // pshufhw xmm3, xmm3,0F5h // 8 alpha words
3130 // pshuflw xmm3, xmm3,0F5h
3132 // pshufb xmm3, kShuffleAlpha // alpha
3161 movd xmm3, [eax]
3163 movdqa xmm0, xmm3 // src argb
3164 pxor xmm3, xmm4 // ~alpha
3166 pshufb xmm3, kShuffleAlpha // alpha
3168 paddw xmm3, xmm7 // 256 - alpha
3169 pmullw xmm2, xmm3 // _r_b * alpha
3174 pmullw xmm1, xmm3 // _a_g * alpha
3195 movdqa xmm3, [eax] // src argb
3197 movdqa xmm0, xmm3 // src argb
3198 pxor xmm3, xmm4 // ~alpha
3200 pshufb xmm3, kShuffleAlpha // alpha
3202 paddw xmm3, xmm7 // 256 - alpha
3203 pmullw xmm2, xmm3 // _r_b * alpha
3208 pmullw xmm1, xmm3 // _a_g * alpha
3221 movdqu xmm3, [eax] // src argb
3223 movdqa xmm0, xmm3 // src argb
3224 pxor xmm3, xmm4 // ~alpha
3226 pshufb xmm3, kShuffleAlpha // alpha
3228 paddw xmm3, xmm7 // 256 - alpha
3229 pmullw xmm2, xmm3 // _r_b * alpha
3234 pmullw xmm1, xmm3 // _a_g * alpha
3250 movd xmm3, [eax] // src argb
3252 movdqa xmm0, xmm3 // src argb
3253 pxor xmm3, xmm4 // ~alpha
3255 pshufb xmm3, kShuffleAlpha // alpha
3257 paddw xmm3, xmm7 // 256 - alpha
3258 pmullw xmm2, xmm3 // _r_b * alpha
3263 pmullw xmm1, xmm3 // _a_g * alpha
3340 pcmpeqb xmm3, xmm3 // generate mask 0xff000000
3341 pslld xmm3, 24
3358 pand xmm2, xmm3
3396 movd xmm3, dword ptr fixed_invtbl8[edi * 4]
3398 pshuflw xmm3, xmm3,0C0h // next 4 inv_alpha words
3399 movlhps xmm2, xmm3
3407 movd xmm3, dword ptr fixed_invtbl8[edi * 4]
3409 pshuflw xmm3, xmm3,0C0h // next 4 inv_alpha words
3410 movlhps xmm2, xmm3
3454 movdqa xmm3, [eax + 16]
3456 psrld xmm3, 24
3457 packuswb xmm2, xmm3
3459 movdqa xmm3, xmm0 // Weave into GG, GA, then GGGA
3461 punpcklbw xmm3, xmm2 // 8 GA words
3463 punpcklwd xmm0, xmm3 // GGGA first 4
3464 punpckhwd xmm1, xmm3 // GGGA next 4
3499 movdqa xmm3, kARGBToSepiaG
3513 pmaddubsw xmm5, xmm3
3514 pmaddubsw xmm1, xmm3
3559 movd xmm3, [edx + 4]
3562 pshufd xmm3, xmm3, 0
3573 pmaddubsw xmm5, xmm3
3574 pmaddubsw xmm1, xmm3
3666 movd xmm3, [esp + 12] /* interval_size */
3671 pshuflw xmm3, xmm3, 040h
3672 pshufd xmm3, xmm3, 044h
3687 pmullw xmm0, xmm3 // * interval_size
3689 pmullw xmm1, xmm3
3740 movdqa xmm3, [eax + 48]
3746 psubd xmm3, [eax + edx * 4 + 48]
3753 psubd xmm3, [esi + 48]
3759 paddd xmm3, [esi + edx * 4 + 48]
3767 cvtdq2ps xmm3, xmm3
3769 mulps xmm3, xmm4
3773 cvtps2dq xmm3, xmm3
3775 packssdw xmm2, xmm3
3836 movdqa xmm3, xmm2
3838 punpckhwd xmm3, xmm1
3849 paddd xmm0, xmm3
3850 movdqa xmm3, [edx + esi + 16]
3851 paddd xmm3, xmm0
3862 movdqa [edx + 16], xmm3
3960 movdqa xmm3, xmm2 // x2, y2, x3, y3
3961 addps xmm3, xmm4
3968 cvttps2dq xmm1, xmm3 // x, y float to int next 2
3986 addps xmm3, xmm4 // x, y += dx, dy next 2