Lines Matching refs:x3
806 int16x8_t x2 = vld1q_s16(src + step*3); int16x8_t x3 = vld1q_s16(src + step*4);
809 x1 = vaddq_s16(x2, x3); x2 = vsubq_s16(x2, x3);
815 x0 = vld1q_s16(src + step); x3 = vld1q_s16(src + step*6);
817 x1 = vaddq_s16(x0, x3); x0 = vsubq_s16(x0, x3);
820 x0 = vld1q_s16(src + step*2); x3 = vld1q_s16(src + step*5);
822 int16x8_t t4 = vsubq_s16(x0, x3);
824 x0 = vaddq_s16(x0, x3);
825 x3 = vaddq_s16(x0, x1); x0 = vsubq_s16(x0, x1);
826 x1 = vaddq_s16(x2, x3); x2 = vsubq_s16(x2, x3);
837 x2 = t3; x3 = t1;
838 x0 = vaddq_s16(x0, x1); x1 = vaddq_s16(x1, x2); x2 = vaddq_s16(x2, x3);
841 x4 = vaddq_s16(x1, x3); x3 = vsubq_s16(x3, x1);
846 x1 = vaddq_s16(x0, x3); x3 = vsubq_s16(x3, x0);
850 int16x8_t res3 = x3;
945 x2 = transp_res3; x3 = transp_res4;
948 x1 = vaddq_s16(x2, x3); x2 = vsubq_s16(x2, x3);
955 x3 = transp_res6;
957 x1 = vaddq_s16(x0, x3); x0 = vsubq_s16(x0, x3);
961 x0 = transp_res2; x3 = transp_res5;
963 t4 = vsubq_s16(x0, x3);
965 x0 = vaddq_s16(x0, x3);
967 x3 = vaddq_s16(x0, x1); x0 = vsubq_s16(x0, x1);
968 x1 = vaddq_s16(x2, x3); x2 = vsubq_s16(x2, x3);
981 x2 = t3; x3 = t1;
983 x0 = vaddq_s16(x0, x1); x1 = vaddq_s16(x1, x2); x2 = vaddq_s16(x2, x3);
987 x4 = vaddq_s16(x1, x3); x3 = vsubq_s16(x3, x1);
993 x1 = vaddq_s16(x0, x3); x3 = vsubq_s16(x3, x0);
999 STORE_DESCALED(dst + 3*8, x3,postscale + 3*8);
1014 int x2 = src[3], x3 = src[4];
1017 x1 = x2 + x3; x2 -= x3;
1022 x0 = src[1]; x3 = src[6];
1023 x1 = x0 + x3; x0 -= x3;
1026 x0 = src[2]; x3 = src[5];
1027 work[3] = x0 - x3; x0 += x3;
1029 x3 = x0 + x1; x0 -= x1;
1030 x1 = x2 + x3; x2 -= x3;
1039 x2 = work[5]; x3 = work[7];
1041 x0 += x1; x1 += x2; x2 += x3;
1044 x4 = x1 + x3; x3 -= x1;
1049 x1 = x0 + x3; x3 -= x0;
1053 work[7] = x4; work[3] = x3;
1061 int x2 = work[8*3], x3 = work[8*4];
1064 x1 = x2 + x3; x2 -= x3;
1069 x0 = work[8*1]; x3 = work[8*6];
1070 x1 = x0 + x3; x0 -= x3;
1073 x0 = work[8*2]; x3 = work[8*5];
1074 work[8*3] = x0 - x3; x0 += x3;
1076 x3 = x0 + x1; x0 -= x1;
1077 x1 = x2 + x3; x2 -= x3;
1089 x2 = work[8*4]; x3 = work[8*7];
1091 x0 += x1; x1 += x2; x2 += x3;
1094 x4 = x1 + x3; x3 -= x1;
1099 x1 = x0 + x3; x3 -= x0;
1105 dst[3] = (short)DCT_DESCALE(x3*postscale[3], postshift);