Home | History | Annotate | Download | only in simd

Lines Matching refs:movdqa

130 movdqa xmm0, XMMWORD [XMMBLOCK(1,0,rsi,SIZEOF_JCOEF)]
131 movdqa xmm1, XMMWORD [XMMBLOCK(2,0,rsi,SIZEOF_JCOEF)]
146 movdqa xmm5, XMMWORD [XMMBLOCK(0,0,rsi,SIZEOF_JCOEF)]
151 movdqa xmm4,xmm5 ; xmm5=in0=(00 01 02 03 04 05 06 07)
164 movdqa XMMWORD [wk(8)], xmm6 ; wk(8)=col1
165 movdqa XMMWORD [wk(9)], xmm5 ; wk(9)=col3
166 movdqa XMMWORD [wk(10)], xmm3 ; wk(10)=col5
167 movdqa XMMWORD [wk(11)], xmm4 ; wk(11)=col7
174 movdqa xmm0, XMMWORD [XMMBLOCK(0,0,rsi,SIZEOF_JCOEF)]
175 movdqa xmm1, XMMWORD [XMMBLOCK(2,0,rsi,SIZEOF_JCOEF)]
178 movdqa xmm2, XMMWORD [XMMBLOCK(4,0,rsi,SIZEOF_JCOEF)]
179 movdqa xmm3, XMMWORD [XMMBLOCK(6,0,rsi,SIZEOF_JCOEF)]
192 movdqa xmm4,xmm1 ; xmm1=in2=z2
193 movdqa xmm5,xmm1
196 movdqa xmm1,xmm4
197 movdqa xmm3,xmm5
203 movdqa xmm6,xmm0
214 movdqa xmm0,xmm7
217 movdqa xmm4,xmm2
221 movdqa XMMWORD [wk(0)], xmm7 ; wk(0)=tmp10L
222 movdqa XMMWORD [wk(1)], xmm2 ; wk(1)=tmp10H
223 movdqa XMMWORD [wk(2)], xmm0 ; wk(2)=tmp13L
224 movdqa XMMWORD [wk(3)], xmm4 ; wk(3)=tmp13H
233 movdqa xmm2,xmm5
236 movdqa xmm0,xmm7
240 movdqa XMMWORD [wk(4)], xmm5 ; wk(4)=tmp11L
241 movdqa XMMWORD [wk(5)], xmm7 ; wk(5)=tmp11H
242 movdqa XMMWORD [wk(6)], xmm2 ; wk(6)=tmp12L
243 movdqa XMMWORD [wk(7)], xmm0 ; wk(7)=tmp12H
247 movdqa xmm4, XMMWORD [XMMBLOCK(1,0,rsi,SIZEOF_JCOEF)]
248 movdqa xmm6, XMMWORD [XMMBLOCK(3,0,rsi,SIZEOF_JCOEF)]
251 movdqa xmm1, XMMWORD [XMMBLOCK(5,0,rsi,SIZEOF_JCOEF)]
252 movdqa xmm3, XMMWORD [XMMBLOCK(7,0,rsi,SIZEOF_JCOEF)]
256 movdqa xmm5,xmm6
257 movdqa xmm7,xmm4
270 movdqa xmm2,xmm5
271 movdqa xmm0,xmm5
274 movdqa xmm5,xmm2
275 movdqa xmm7,xmm0
281 movdqa XMMWORD [wk(10)], xmm2 ; wk(10)=z3L
282 movdqa XMMWORD [wk(11)], xmm0 ; wk(11)=z3H
300 movdqa xmm2,xmm3
301 movdqa xmm0,xmm3
304 movdqa xmm3,xmm2
305 movdqa xmm4,xmm0
316 movdqa XMMWORD [wk(8)], xmm2 ; wk(8)=tmp0L
317 movdqa XMMWORD [wk(9)], xmm0 ; wk(9)=tmp0H
319 movdqa xmm2,xmm1
320 movdqa xmm0,xmm1
323 movdqa xmm1,xmm2
324 movdqa xmm6,xmm0
335 movdqa XMMWORD [wk(10)], xmm2 ; wk(10)=tmp1L
336 movdqa XMMWORD [wk(11)], xmm0 ; wk(11)=tmp1H
340 movdqa xmm5, XMMWORD [wk(0)] ; xmm5=tmp10L
341 movdqa xmm7, XMMWORD [wk(1)] ; xmm7=tmp10H
343 movdqa xmm2,xmm5
344 movdqa xmm0,xmm7
350 movdqa xmm3,[rel PD_DESCALE_P1] ; xmm3=[rel PD_DESCALE_P1]
364 movdqa xmm4, XMMWORD [wk(4)] ; xmm4=tmp11L
365 movdqa xmm3, XMMWORD [wk(5)] ; xmm3=tmp11H
367 movdqa xmm7,xmm4
368 movdqa xmm0,xmm3
374 movdqa xmm1,[rel PD_DESCALE_P1] ; xmm1=[rel PD_DESCALE_P1]
388 movdqa xmm6,xmm5 ; transpose coefficients(phase 1)
391 movdqa xmm1,xmm7 ; transpose coefficients(phase 1)
395 movdqa xmm3, XMMWORD [wk(6)] ; xmm3=tmp12L
396 movdqa xmm0, XMMWORD [wk(7)] ; xmm0=tmp12H
397 movdqa xmm4, XMMWORD [wk(10)] ; xmm4=tmp1L
398 movdqa xmm2, XMMWORD [wk(11)] ; xmm2=tmp1H
400 movdqa XMMWORD [wk(0)], xmm5 ; wk(0)=(00 10 01 11 02 12 03 13)
401 movdqa XMMWORD [wk(1)], xmm6 ; wk(1)=(04 14 05 15 06 16 07 17)
402 movdqa XMMWORD [wk(4)], xmm7 ; wk(4)=(60 70 61 71 62 72 63 73)
403 movdqa XMMWORD [wk(5)], xmm1 ; wk(5)=(64 74 65 75 66 76 67 77)
405 movdqa xmm5,xmm3
406 movdqa xmm6,xmm0
412 movdqa xmm7,[rel PD_DESCALE_P1] ; xmm7=[rel PD_DESCALE_P1]
426 movdqa xmm1, XMMWORD [wk(2)] ; xmm1=tmp13L
427 movdqa xmm4, XMMWORD [wk(3)] ; xmm4=tmp13H
428 movdqa xmm2, XMMWORD [wk(8)] ; xmm2=tmp0L
429 movdqa xmm7, XMMWORD [wk(9)] ; xmm7=tmp0H
431 movdqa xmm0,xmm1
432 movdqa xmm6,xmm4
438 movdqa xmm2,[rel PD_DESCALE_P1] ; xmm2=[rel PD_DESCALE_P1]
452 movdqa xmm7, XMMWORD [wk(0)] ; xmm7=(00 10 01 11 02 12 03 13)
453 movdqa xmm2, XMMWORD [wk(1)] ; xmm2=(04 14 05 15 06 16 07 17)
455 movdqa xmm4,xmm3 ; transpose coefficients(phase 1)
458 movdqa xmm6,xmm0 ; transpose coefficients(phase 1)
462 movdqa xmm1,xmm7 ; transpose coefficients(phase 2)
465 movdqa xmm5,xmm2 ; transpose coefficients(phase 2)
469 movdqa xmm3, XMMWORD [wk(4)] ; xmm3=(60 70 61 71 62 72 63 73)
470 movdqa xmm4, XMMWORD [wk(5)] ; xmm4=(64 74 65 75 66 76 67 77)
472 movdqa XMMWORD [wk(6)], xmm2 ; wk(6)=(04 14 24 34 05 15 25 35)
473 movdqa XMMWORD [wk(7)], xmm5 ; wk(7)=(06 16 26 36 07 17 27 37)
475 movdqa xmm2,xmm0 ; transpose coefficients(phase 2)
478 movdqa xmm5,xmm6 ; transpose coefficients(phase 2)
482 movdqa xmm3,xmm7 ; transpose coefficients(phase 3)
485 movdqa xmm4,xmm1 ; transpose coefficients(phase 3)
489 movdqa xmm0, XMMWORD [wk(6)] ; xmm0=(04 14 24 34 05 15 25 35)
490 movdqa xmm2, XMMWORD [wk(7)] ; xmm2=(06 16 26 36 07 17 27 37)
492 movdqa XMMWORD [wk(8)], xmm3 ; wk(8)=col1
493 movdqa XMMWORD [wk(9)], xmm4 ; wk(9)=col3
495 movdqa xmm3,xmm0 ; transpose coefficients(phase 3)
498 movdqa xmm4,xmm2 ; transpose coefficients(phase 3)
502 movdqa XMMWORD [wk(10)], xmm3 ; wk(10)=col5
503 movdqa XMMWORD [wk(11)], xmm4 ; wk(11)=col7
532 movdqa xmm6,xmm1 ; xmm1=in2=z2
533 movdqa xmm5,xmm1
536 movdqa xmm1,xmm6
537 movdqa xmm2,xmm5
543 movdqa xmm3,xmm7
554 movdqa xmm7,xmm4
557 movdqa xmm6,xmm0
561 movdqa XMMWORD [wk(0)], xmm4 ; wk(0)=tmp10L
562 movdqa XMMWORD [wk(1)], xmm0 ; wk(1)=tmp10H
563 movdqa XMMWORD [wk(2)], xmm7 ; wk(2)=tmp13L
564 movdqa XMMWORD [wk(3)], xmm6 ; wk(3)=tmp13H
573 movdqa xmm0,xmm5
576 movdqa xmm7,xmm4
580 movdqa XMMWORD [wk(4)], xmm5 ; wk(4)=tmp11L
581 movdqa XMMWORD [wk(5)], xmm4 ; wk(5)=tmp11H
582 movdqa XMMWORD [wk(6)], xmm0 ; wk(6)=tmp12L
583 movdqa XMMWORD [wk(7)], xmm7 ; wk(7)=tmp12H
587 movdqa xmm6, XMMWORD [wk(9)] ; xmm6=col3
588 movdqa xmm3, XMMWORD [wk(8)] ; xmm3=col1
589 movdqa xmm1, XMMWORD [wk(11)] ; xmm1=col7
590 movdqa xmm2, XMMWORD [wk(10)] ; xmm2=col5
592 movdqa xmm5,xmm6
593 movdqa xmm4,xmm3
606 movdqa xmm0,xmm5
607 movdqa xmm7,xmm5
610 movdqa xmm5,xmm0
611 movdqa xmm4,xmm7
617 movdqa XMMWORD [wk(10)], xmm0 ; wk(10)=z3L
618 movdqa XMMWORD [wk(11)], xmm7 ; wk(11)=z3H
636 movdqa xmm0,xmm1
637 movdqa xmm7,xmm1
640 movdqa xmm1,xmm0
641 movdqa xmm3,xmm7
652 movdqa XMMWORD [wk(8)], xmm0 ; wk(8)=tmp0L
653 movdqa XMMWORD [wk(9)], xmm7 ; wk(9)=tmp0H
655 movdqa xmm0,xmm2
656 movdqa xmm7,xmm2
659 movdqa xmm2,xmm0
660 movdqa xmm6,xmm7
671 movdqa XMMWORD [wk(10)], xmm0 ; wk(10)=tmp1L
672 movdqa XMMWORD [wk(11)], xmm7 ; wk(11)=tmp1H
676 movdqa xmm5, XMMWORD [wk(0)] ; xmm5=tmp10L
677 movdqa xmm4, XMMWORD [wk(1)] ; xmm4=tmp10H
679 movdqa xmm0,xmm5
680 movdqa xmm7,xmm4
686 movdqa xmm1,[rel PD_DESCALE_P2] ; xmm1=[rel PD_DESCALE_P2]
700 movdqa xmm3, XMMWORD [wk(4)] ; xmm3=tmp11L
701 movdqa xmm1, XMMWORD [wk(5)] ; xmm1=tmp11H
703 movdqa xmm4,xmm3
704 movdqa xmm7,xmm1
710 movdqa xmm2,[rel PD_DESCALE_P2] ; xmm2=[rel PD_DESCALE_P2]
727 movdqa xmm6, XMMWORD [wk(6)] ; xmm6=tmp12L
728 movdqa xmm2, XMMWORD [wk(7)] ; xmm2=tmp12H
729 movdqa xmm1, XMMWORD [wk(10)] ; xmm1=tmp1L
730 movdqa xmm7, XMMWORD [wk(11)] ; xmm7=tmp1H
732 movdqa XMMWORD [wk(0)], xmm5 ; wk(0)=(00 10 20 30 40 50 60 70 06 16 26 36 46 56 66 76)
733 movdqa XMMWORD [wk(1)], xmm3 ; wk(1)=(01 11 21 31 41 51 61 71 07 17 27 37 47 57 67 77)
735 movdqa xmm4,xmm6
736 movdqa xmm0,xmm2
742 movdqa xmm5,[rel PD_DESCALE_P2] ; xmm5=[rel PD_DESCALE_P2]
756 movdqa xmm3, XMMWORD [wk(2)] ; xmm3=tmp13L
757 movdqa xmm1, XMMWORD [wk(3)] ; xmm1=tmp13H
758 movdqa xmm7, XMMWORD [wk(8)] ; xmm7=tmp0L
759 movdqa xmm5, XMMWORD [wk(9)] ; xmm5=tmp0H
761 movdqa xmm2,xmm3
762 movdqa xmm0,xmm1
768 movdqa xmm7,[rel PD_DESCALE_P2] ; xmm7=[rel PD_DESCALE_P2]
779 movdqa xmm5,[rel PB_CENTERJSAMP] ; xmm5=[rel PB_CENTERJSAMP]
784 movdqa xmm7, XMMWORD [wk(0)] ; xmm7=(00 10 20 30 40 50 60 70 06 16 26 36 46 56 66 76)
785 movdqa xmm1, XMMWORD [wk(1)] ; xmm1=(01 11 21 31 41 51 61 71 07 17 27 37 47 57 67 77)
795 movdqa xmm0,xmm7 ; transpose coefficients(phase 1)
798 movdqa xmm2,xmm6 ; transpose coefficients(phase 1)
802 movdqa xmm4,xmm7 ; transpose coefficients(phase 2)
805 movdqa xmm5,xmm2 ; transpose coefficients(phase 2)
809 movdqa xmm1,xmm7 ; transpose coefficients(phase 3)
812 movdqa xmm3,xmm4 ; transpose coefficients(phase 3)