Home | History | Annotate | Download | only in source

Lines Matching full:xmm0

214     movdqa     xmm0, [eax]
217 pand xmm0, xmm5
219 packuswb xmm0, xmm1
221 movdqa [edx], xmm0
244 movdqa xmm0, [eax]
249 pavgb xmm0, xmm2 // average rows
252 movdqa xmm2, xmm0 // average columns (32 to 16 pixels)
253 psrlw xmm0, 8
258 pavgw xmm0, xmm2
260 packuswb xmm0, xmm1
263 movdqa [edx], xmm0
288 movdqu xmm0, [eax]
291 pand xmm0, xmm5
293 packuswb xmm0, xmm1
295 movdqu [edx], xmm0
319 movdqu xmm0, [eax]
324 pavgb xmm0, xmm2 // average rows
327 movdqa xmm2, xmm0 // average columns (32 to 16 pixels)
328 psrlw xmm0, 8
333 pavgw xmm0, xmm2
335 packuswb xmm0, xmm1
338 movdqu [edx], xmm0
363 movdqa xmm0, [eax]
366 pand xmm0, xmm5
368 packuswb xmm0, xmm1
369 packuswb xmm0, xmm0
371 movq qword ptr [edx], xmm0
397 movdqa xmm0, [eax]
401 pavgb xmm0, xmm2 // average rows
410 pavgb xmm0, xmm2
413 movdqa xmm2, xmm0 // average columns (32 to 16 pixels)
414 psrlw xmm0, 8
419 pavgw xmm0, xmm2
421 packuswb xmm0, xmm1
423 movdqa xmm2, xmm0 // average columns (16 to 8 pixels)
424 psrlw xmm0, 8
426 pavgw xmm0, xmm2
427 packuswb xmm0, xmm0
430 movq qword ptr [edx], xmm0
456 movdqa xmm0, [eax]
459 pand xmm0, xmm5
461 packuswb xmm0, xmm1 // 32->16
462 packuswb xmm0, xmm0 // 16->8
463 packuswb xmm0, xmm0 // 8->4
465 movd dword ptr [edx], xmm0
491 movdqa xmm0, [eax] // average 8 rows to 1
495 pavgb xmm0, xmm2
505 pavgb xmm0, xmm2
522 pavgb xmm0, xmm2
525 psadbw xmm0, xmm7 // average 32 pixels to 4
527 pshufd xmm0, xmm0, 0xd8 // x1x0 -> xx01
529 por xmm0, xmm1 // -> 3201
530 psrlw xmm0, 3
531 packuswb xmm0, xmm0
532 packuswb xmm0, xmm0
535 movd dword ptr [edx], xmm0
567 movdqa xmm0, [eax]
571 palignr xmm1, xmm0, 8
572 pshufb xmm0, xmm3
575 movq qword ptr [edx], xmm0
591 // xmm0 src_row 0
621 movdqa xmm0, [eax] // pixels 0..7
623 pavgb xmm0, xmm1
624 pshufb xmm0, xmm2
625 pmaddubsw xmm0, xmm5
626 paddsw xmm0, xmm7
627 psrlw xmm0, 2
628 packuswb xmm0, xmm0
629 movq qword ptr [edx], xmm0
630 movdqu xmm0, [eax + 8] // pixels 8..15
632 pavgb xmm0, xmm1
633 pshufb xmm0, xmm3
634 pmaddubsw xmm0, xmm6
635 paddsw xmm0, xmm7
636 psrlw xmm0, 2
637 packuswb xmm0, xmm0
638 movq qword ptr [edx + 8], xmm0
639 movdqa xmm0, [eax + 16] // pixels 16..23
642 pavgb xmm0, xmm1
643 pshufb xmm0, xmm4
645 pmaddubsw xmm0, xmm1
646 paddsw xmm0, xmm7
647 psrlw xmm0, 2
648 packuswb xmm0, xmm0
650 movq qword ptr [edx + 16], xmm0
680 movdqa xmm0, [eax] // pixels 0..7
682 pavgb xmm1, xmm0
683 pavgb xmm0, xmm1
684 pshufb xmm0, xmm2
685 pmaddubsw xmm0, xmm5
686 paddsw xmm0, xmm7
687 psrlw xmm0, 2
688 packuswb xmm0, xmm0
689 movq qword ptr [edx], xmm0
690 movdqu xmm0, [eax + 8] // pixels 8..15
692 pavgb xmm1, xmm0
693 pavgb xmm0, xmm1
694 pshufb xmm0, xmm3
695 pmaddubsw xmm0, xmm6
696 paddsw xmm0, xmm7
697 psrlw xmm0, 2
698 packuswb xmm0, xmm0
699 movq qword ptr [edx + 8], xmm0
700 movdqa xmm0, [eax + 16] // pixels 16..23
703 pavgb xmm1, xmm0
704 pavgb xmm0, xmm1
705 pshufb xmm0, xmm4
707 pmaddubsw xmm0, xmm1
708 paddsw xmm0, xmm7
709 psrlw xmm0, 2
710 packuswb xmm0, xmm0
712 movq qword ptr [edx + 16], xmm0
738 movdqa xmm0, [eax] // 16 pixels -> 0,1,2,3,4,5
741 pshufb xmm0, xmm4
743 paddusb xmm0, xmm1
746 movq qword ptr [edx], xmm0 // write 12 pixels
747 movhlps xmm1, xmm0
774 movdqa xmm0, [eax] // sum up 3 rows into xmm0/1
776 movhlps xmm1, xmm0
778 punpcklbw xmm0, xmm5
782 paddusw xmm0, xmm6
789 paddusw xmm0, xmm6
792 movdqa xmm6, xmm0 // 8 pixels -> 0,1,2 of xmm6
793 psrldq xmm0, 2
794 paddusw xmm6, xmm0
795 psrldq xmm0, 2
796 paddusw xmm6, xmm0
840 movdqa xmm0, [eax] // average 2 rows into xmm0
841 pavgb xmm0, [eax + esi]
844 movdqa xmm1, xmm0 // 16 pixels -> 0,1,2,3,4,5 of xmm1
846 movdqa xmm6, xmm0
849 pshufb xmm0, xmm4
850 paddusw xmm1, xmm0
890 movdqa xmm0, [esi]
892 movdqa xmm1, xmm0
893 punpcklbw xmm0, xmm4
908 paddusw xmm0, xmm2 // sum 16 words
913 movdqa [edi], xmm0
961 movdqa xmm0, [esi] // row0
963 movdqa xmm1, xmm0
967 punpcklbw xmm0, xmm4
969 psubw xmm2, xmm0 // row1 - row0
973 paddw xmm0, xmm2 // sum rows
975 packuswb xmm0, xmm1
977 movdqa [esi + edi], xmm0
981 punpckhbw xmm0, xmm0 // duplicate last pixel for filtering
982 pshufhw xmm0, xmm0, 0xff
983 punpckhqdq xmm0, xmm0
984 movdqa [esi + edi], xmm0
991 movdqa xmm0, [esi]
993 movdqa [esi + edi], xmm0
997 punpckhbw xmm0, xmm0 // duplicate last pixel for filtering
998 pshufhw xmm0, xmm0, 0xff
999 punpckhqdq xmm0, xmm0
1000 movdqa [esi + edi], xmm0
1007 movdqa xmm0, [esi]
1008 pavgb xmm0, [esi + edx]
1010 movdqa [esi + edi], xmm0
1014 punpckhbw xmm0, xmm0 // duplicate last pixel for filtering
1015 pshufhw xmm0, xmm0, 0xff
1016 punpckhqdq xmm0, xmm0
1017 movdqa [esi + edi], xmm0
1044 movd xmm0, eax // high fraction 0..127
1048 punpcklbw xmm5, xmm0
1054 movdqa xmm0, [esi]
1056 movdqa xmm1, xmm0
1057 punpcklbw xmm0, xmm2
1059 pmaddubsw xmm0, xmm5
1061 psrlw xmm0, 7
1063 packuswb xmm0, xmm1
1065 movdqa [esi + edi], xmm0
1069 punpckhbw xmm0, xmm0 // duplicate last pixel for filtering
1070 pshufhw xmm0, xmm0, 0xff
1071 punpckhqdq xmm0, xmm0
1072 movdqa [esi + edi], xmm0
1080 movdqa xmm0, [esi]
1082 xmm0
1086 punpckhbw xmm0, xmm0
1087 pshufhw xmm0, xmm0, 0xff
1088 punpckhqdq xmm0, xmm0
1089 movdqa [esi + edi], xmm0
1096 movdqa xmm0, [esi]
1097 pavgb xmm0, [esi + edx]
1099 movdqa [esi + edi], xmm0
1103 punpckhbw xmm0, xmm0
1104 pshufhw xmm0, xmm0, 0xff
1105 punpckhqdq xmm0, xmm0
1106 movdqa [esi + edi], xmm0
1126 "movdqa (%0),%%xmm0 \n"
1129 "pand %%xmm5,%%xmm0 \n"
1131 "packuswb %%xmm1,%%xmm0 \n"
1132 "movdqa %%xmm0,(%1) \n"
1142 , "xmm0", "xmm1", "xmm5"
1154 "movdqa (%0),%%xmm0 \n"
1159 "pavgb %%xmm2,%%xmm0 \n"
1161 "movdqa %%xmm0,%%xmm2 \n"
1162 "psrlw $0x8,%%xmm0 \n"
1167 "pavgw %%xmm2,%%xmm0 \n"
1169 "packuswb %%xmm1,%%xmm0 \n"
1170 "movdqa %%xmm0,(%1) \n"
1180 , "xmm0", "xmm1", "xmm2", "xmm3", "xmm5"
1192 "movdqu (%0),%%xmm0 \n"
1195 "pand %%xmm5,%%xmm0 \n"
1197 "packuswb %%xmm1,%%xmm0 \n"
1198 "movdqu %%xmm0,(%1) \n"
1208 , "xmm0", "xmm1", "xmm5"
1221 "movdqu (%0),%%xmm0 \n"
1226 "pavgb %%xmm2,%%xmm0 \n"
1228 "movdqa %%xmm0,%%xmm2 \n"
1229 "psrlw $0x8,%%xmm0 \n"
1234 "pavgw %%xmm2,%%xmm0 \n"
1236 "packuswb %%xmm1,%%xmm0 \n"
1237 "movdqu %%xmm0,(%1) \n"
1247 , "xmm0", "xmm1", "xmm2", "xmm3", "xmm5"
1260 "movdqa (%0),%%xmm0 \n"
1263 "pand %%xmm5,%%xmm0 \n"
1265 "packuswb %%xmm1,%%xmm0 \n"
1266 "packuswb %%xmm0,%%xmm0 \n"
1267 "movq %%xmm0,(%1) \n"
1277 , "xmm0", "xmm1", "xmm5"
1291 "movdqa (%0),%%xmm0 \n"
1295 "pavgb %%xmm2,%%xmm0 \n"
1303 "pavgb %%xmm2,%%xmm0 \n"
1306 "movdqa %%xmm0,%%xmm2 \n"
1307 "psrlw $0x8,%%xmm0 \n"
1312 "pavgw %%xmm2,%%xmm0 \n"
1314 "packuswb %%xmm1,%%xmm0 \n"
1315 "movdqa %%xmm0,%%xmm2 \n"
1316 "psrlw $0x8,%%xmm0 \n"
1318 "pavgw %%xmm2,%%xmm0 \n"
1319 "packuswb %%xmm0,%%xmm0 \n"
1320 "movq %%xmm0,(%1) \n"
1331 , "xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm7"
1344 "movdqa (%0),%%xmm0 \n"
1347 "pand %%xmm5,%%xmm0 \n"
1349 "packuswb %%xmm1,%%xmm0 \n"
1350 "packuswb %%xmm0,%%xmm0 \n"
1351 "packuswb %%xmm0,%%xmm0 \n"
1352 "movd %%xmm0,(%1) \n"
1362 , "xmm0", "xmm1", "xmm5"
1376 "movdqa (%0),%%xmm0 \n"
1380 "pavgb %%xmm2,%%xmm0 \n"
1390 "pavgb %%xmm2,%%xmm0 \n"
1406 "pavgb %%xmm2,%%xmm0 \n"
1408 "psadbw %%xmm7,%%xmm0 \n"
1410 "pshufd $0xd8,%%xmm0,%%xmm0 \n"
1412 "por %%xmm1,%%xmm0 \n"
1413 "psrlw $0x3,%%xmm0 \n"
1414 "packuswb %%xmm0,%%xmm0 \n"
1415 "packuswb %%xmm0,%%xmm0 \n"
1416 "movd %%xmm0,(%1) \n"
1428 , "xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7"
1448 "movdqa (%0),%%xmm0 \n"
1452 "palignr $0x8,%%xmm0,%%xmm1 \n"
1453 "pshufb %%xmm3,%%xmm0 \n"
1456 "movq %%xmm0,(%1) \n"
1468 , "xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5"
1487 "movdqa %1,%%xmm0 \n" // kMadd11
1510 "pmaddubsw %%xmm0,%%xmm6 \n"
1535 , "xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7"
1554 "movdqa %1,%%xmm0 \n" // kMadd11
1580 "pmaddubsw %%xmm0,%%xmm6 \n"
1606 , "xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7"
1619 "movdqa (%0),%%xmm0 \n"
1622 "pshufb %%xmm4,%%xmm0 \n"
1624 "paddusb %%xmm1,%%xmm0 \n"
1625 "movq %%xmm0,(%1) \n"
1626 "movhlps %%xmm0,%%xmm1 \n"
1638 , "xmm0", "xmm1", "xmm4", "xmm5"
1660 "movdqa (%0),%%xmm0 \n"
1661 "pavgb (%0,%3,1),%%xmm0 \n"
1663 "movdqa %%xmm0,%%xmm1 \n"
1665 "movdqa %%xmm0,%%xmm6 \n"
1668 "pshufb %%xmm4,%%xmm0 \n"
1669 "paddusw %%xmm0,%%xmm1 \n"
1684 , "xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6"
1705 "movdqa (%0),%%xmm0 \n"
1707 "movhlps %%xmm0,%%xmm1 \n"
1709 "punpcklbw %%xmm5,%%xmm0 \n"
1713 "paddusw %%xmm6,%%xmm0 \n"
1720 "paddusw %%xmm6,%%xmm0 \n"
1722 "movdqa %%xmm0,%%xmm6 \n"
1723 "psrldq $0x2,%%xmm0 \n"
1724 "paddusw %%xmm0,%%xmm6 \n"
1725 "psrldq $0x2,%%xmm0 \n"
1726 "paddusw %%xmm0,%%xmm6 \n"
1749 , "xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5", "xmm6", "xmm7"
1764 "movdqa (%0),%%xmm0 \n"
1767 "movdqa %%xmm0,%%xmm1 \n"
1768 "punpcklbw %%xmm4,%%xmm0 \n"
1779 "paddusw %%xmm2,%%xmm0 \n"
1784 "movdqa %%xmm0,(%1) \n"
1799 , "xmm0", "xmm1", "xmm2", "xmm3", "xmm4"
1823 "movdqa (%1),%%xmm0 \n"
1825 "movdqa %%xmm0,%%xmm1 \n"
1829 "punpcklbw %%xmm4,%%xmm0 \n"
1831 "psubw %%xmm0,%%xmm2 \n"
1835 "paddw %%xmm2,%%xmm0 \n"
1837 "packuswb %%xmm1,%%xmm0 \n"
1839 "movdqa %%xmm0,(%1,%0,1) \n"
1845 "movdqa (%1),%%xmm0 \n"
1847 "movdqa %%xmm0,(%1,%0,1) \n"
1853 "movdqa (%1),%%xmm0 \n"
1854 "pavgb (%1,%4,1),%%xmm0 \n"
1856 "movdqa %%xmm0,(%1,%0,1) \n"
1861 "punpckhbw %%xmm0,%%xmm0 \n"
1862 "pshufhw $0xff,%%xmm0,%%xmm0 \n"
1863 "punpckhqdq %%xmm0,%%xmm0 \n"
1864 "movdqa %%xmm0,(%1,%0,1) \n"
1872 , "xmm0", "xmm1", "xmm2", "xmm3", "xmm4", "xmm5"
1890 "movd %3,%%xmm0 \n"
1894 "punpcklbw %%xmm0,%%xmm5 \n"
1899 "movdqa (%1),%%xmm0 \n"
1901 "movdqa %%xmm0,%%xmm1 \n"
1902 "punpcklbw %%xmm2,%%xmm0 \n"
1904 "pmaddubsw %%xmm5,%%xmm0 \n"
1906 "psrlw $0x7,%%xmm0 \n"
1908 "packuswb %%xmm1,%%xmm0 \n"
1910 "movdqa %%xmm0,(%1,%0,1) \n"
1916 "movdqa (%1),%%xmm0 \n"
1918 "movdqa %%xmm0,(%1,%0,1) \n"
1924 "movdqa (%1),%%xmm0 \n"
1925 "pavgb (%1,%4,1),%%xmm0 \n"
1927 "movdqa %%xmm0,(%1,%0,1) \n"
1932 "punpckhbw %%xmm0,%%xmm0 \n"
1933 "pshufhw $0xff,%%xmm0,%%xmm0 \n"
1934 "punpckhqdq %%xmm0,%%xmm0 \n"
1935 "movdqa %%xmm0,(%1,%0,1) \n"
1943 , "xmm0", "xmm1", "xmm2", "xmm5"