Lines Matching refs:rsi
43 push rsi
48 xor rsi, rsi
64 mov rsi, arg(0) ;src_ptr
73 movq xmm0, MMWORD PTR [rsi - 2] ; -2 -1 0 1 2 3 4 5
75 movq xmm2, MMWORD PTR [rsi + 3] ; 3 4 5 6 7 8 9 10
91 lea rsi, [rsi + rax]
108 pop rsi
121 mov rsi, arg(0) ;src_ptr
131 movq xmm0, MMWORD PTR [rsi - 2] ; -2 -1 0 1 2 3 4 5
133 movq xmm1, MMWORD PTR [rsi + 3] ; 3 4 5 6 7 8 9 10
146 lea rsi, [rsi + rax]
163 pop rsi
184 push rsi
189 xor rsi, rsi
201 mov rsi, arg(0) ;src_ptr
212 movq xmm0, MMWORD PTR [rsi - 2] ; -2 -1 0 1 2 3 4 5
214 movq xmm3, MMWORD PTR [rsi + 3] ; 3 4 5 6 7 8 9 10
225 movq xmm3, MMWORD PTR [rsi + 6]
228 movq xmm7, MMWORD PTR [rsi + 11]
251 lea rsi, [rsi + rax]
272 pop rsi
282 mov rsi, arg(0) ;src_ptr
288 movdqu xmm1, XMMWORD PTR [rsi - 2]
295 movdqu xmm3, XMMWORD PTR [rsi + 6]
310 lea rsi, [rsi + rax]
327 pop rsi
348 push rsi
353 xor rsi, rsi
367 mov rsi, arg(0) ;src_ptr
376 movdqu xmm0, XMMWORD PTR [rsi - 2]
390 lea rsi, [rsi + rax]
407 pop rsi
419 mov rsi, arg(0) ;src_ptr
427 movdqu xmm1, XMMWORD PTR [rsi - 2]
437 lea rsi, [rsi + rax]
452 pop rsi
475 push rsi
480 xor rsi, rsi
493 mov rsi, arg(0) ;src_ptr
500 mov rax, rsi
506 movq xmm1, MMWORD PTR [rsi] ;A
507 movq xmm2, MMWORD PTR [rsi + rdx] ;B
508 movq xmm3, MMWORD PTR [rsi + rdx * 2] ;C
510 movq xmm0, MMWORD PTR [rsi + rdx * 4] ;E
530 movq xmm1, MMWORD PTR [rsi + 8] ;A
531 movq xmm2, MMWORD PTR [rsi + rdx + 8] ;B
532 movq xmm3, MMWORD PTR [rsi + rdx * 2 + 8] ;C
534 movq xmm0, MMWORD PTR [rsi + rdx * 4 + 8] ;E
545 add rsi, rdx
567 pop rsi
577 mov rsi, arg(0) ;src_ptr
584 mov rax, rsi
589 movq xmm2, MMWORD PTR [rsi + rdx] ;B
590 movq xmm3, MMWORD PTR [rsi + rdx * 2] ;C
592 movq xmm0, MMWORD PTR [rsi + rdx * 4] ;E
599 movq xmm5, MMWORD PTR [rsi + rdx + 8] ;B
600 movq xmm1, MMWORD PTR [rsi + rdx * 2 + 8] ;C
602 movq xmm0, MMWORD PTR [rsi + rdx * 4 + 8] ;E
616 add rsi, rdx
639 pop rsi
660 push rsi
665 xor rsi, rsi
685 mov rsi, arg(0) ;src_ptr
687 mov rax, rsi
691 movq xmm1, MMWORD PTR [rsi] ;A
692 movq xmm2, MMWORD PTR [rsi + rdx] ;B
693 movq xmm3, MMWORD PTR [rsi + rdx * 2] ;C
695 movq xmm0, MMWORD PTR [rsi + rdx * 4] ;E
707 add rsi, rdx
729 pop rsi
740 mov rsi, arg(0) ;src_ptr
742 mov rax, rsi
746 movq xmm2, MMWORD PTR [rsi + rdx] ;B
747 movq xmm3, MMWORD PTR [rsi + rdx * 2] ;C
749 movq xmm0, MMWORD PTR [rsi + rdx * 4] ;E
756 add rsi, rdx
777 pop rsi
797 push rsi
802 xor rsi, rsi
822 mov rsi, arg(0) ;src_ptr
824 mov rax, rsi
828 movd mm1, DWORD PTR [rsi] ;A
829 movd mm2, DWORD PTR [rsi + rdx] ;B
830 movd mm3, DWORD PTR [rsi + rdx * 2] ;C
832 movd mm0, DWORD PTR [rsi + rdx * 4] ;E
845 add rsi, rdx
867 pop rsi
878 mov rsi, arg(0) ;src_ptr
880 mov rax, rsi
884 movd mm2, DWORD PTR [rsi + rdx] ;B
885 movd mm3, DWORD PTR [rsi + rdx * 2] ;C
887 movd mm0, DWORD PTR [rsi + rdx * 4] ;E
894 add rsi, rdx
915 pop rsi
937 push rsi
951 mov rsi, arg(0) ; src_ptr
973 movq xmm3, [rsi] ; 00 01 02 03 04 05 06 07
974 movq xmm5, [rsi+1] ; 01 02 03 04 05 06 07 08
977 movq xmm4, [rsi+8] ; 08 09 10 11 12 13 14 15
979 movq xmm5, [rsi+9] ; 09 10 11 12 13 14 15 16
981 lea rsi, [rsi + rdx] ; next line
998 movq xmm6, [rsi] ; 00 01 02 03 04 05 06 07
999 movq xmm5, [rsi+1] ; 01 02 03 04 05 06 07 08
1002 movq xmm4, [rsi+8] ; 08 09 10 11 12 13 14 15
1004 movq xmm5, [rsi+9] ; 09 10 11 12 13 14 15 16
1005 lea rsi, [rsi + rdx] ; next line
1054 mov rsi, arg(0) ; src_ptr
1064 movq xmm4, [rsi] ; load row 0
1065 movq xmm2, [rsi + 8] ; load row 0
1067 lea rsi, [rsi + rax] ; next line
1069 movq xmm3, [rsi] ; load row + 1
1070 movq xmm5, [rsi + 8] ; load row + 1
1076 movq xmm7, [rsi + rax] ; load row + 2
1079 movq xmm6, [rsi + rax + 8] ; load row + 2
1106 lea rsi, [rsi + 2*rax]
1122 movq xmm2, [rsi] ; 00 01 02 03 04 05 06 07
1123 movq xmm4, [rsi+1] ; 01 02 03 04 05 06 07 08
1126 movq xmm3, [rsi+8] ; 08 09 10 11 12 13 14 15
1129 movq xmm4, [rsi+9] ; 09 10 11 12 13 14 15 16
1131 lea rsi, [rsi + rax] ; next line
1135 movq xmm5, [rsi]
1138 movq xmm7, [rsi+1]
1140 movq xmm6, [rsi+8]
1144 movq xmm7, [rsi+9]
1165 lea rsi, [rsi + rax] ; next line
1177 pop rsi
1200 push rsi
1209 mov rsi, arg(0) ;src_ptr
1214 movdqu xmm0, [rsi]
1216 movdqu xmm1, [rsi+rdx]
1217 movdqu xmm2, [rsi+rdx*2]
1218 add rsi, rax
1219 movdqu xmm3, [rsi]
1220 movdqu xmm4, [rsi+rdx]
1221 movdqu xmm5, [rsi+rdx*2]
1222 add rsi, rax
1223 movdqu xmm6, [rsi]
1224 movdqu xmm7, [rsi+rdx]
1228 movdqu xmm0, [rsi+rdx*2]
1489 pop rsi