/external/libavc/common/x86/ |
ih264_ihadamard_scaling_ssse3.c | 97 __m128i src_r0, src_r1, src_r2, src_r3; local 114 src_r3 = _mm_unpackhi_epi16(src_r2_r3, sign_reg); 128 temp2 = _mm_unpacklo_epi32(src_r2, src_r3); //c0 d0 c1 d1 130 temp3 = _mm_unpackhi_epi32(src_r2, src_r3); //c2 d2 c3 d3 134 src_r3 = _mm_unpackhi_epi64(temp1, temp3); //a3 b3 c3 d3 136 temp0 = _mm_add_epi32(src_r0, src_r3); 139 temp3 = _mm_sub_epi32(src_r0, src_r3); 144 src_r3 = _mm_sub_epi32(temp3, temp2); 157 temp2 = _mm_unpacklo_epi32(src_r2, src_r3); //a2 a3 b2 b3 159 temp3 = _mm_unpackhi_epi32(src_r2, src_r3); //c2 c3 d2 d [all...] |
ih264_ihadamard_scaling_sse42.c | 97 __m128i src_r0, src_r1, src_r2, src_r3; local 112 src_r3 = _mm_cvtepi16_epi32(src_r2_r3); 126 temp2 = _mm_unpacklo_epi32(src_r2, src_r3); //c0 d0 c1 d1 128 temp3 = _mm_unpackhi_epi32(src_r2, src_r3); //c2 d2 c3 d3 132 src_r3 = _mm_unpackhi_epi64(temp1, temp3); //a3 b3 c3 d3 134 temp0 = _mm_add_epi32(src_r0, src_r3); 137 temp3 = _mm_sub_epi32(src_r0, src_r3); 142 src_r3 = _mm_sub_epi32(temp3, temp2); 155 temp2 = _mm_unpacklo_epi32(src_r2, src_r3); //a2 a3 b2 b3 157 temp3 = _mm_unpackhi_epi32(src_r2, src_r3); //c2 c3 d2 d [all...] |
ih264_resi_trans_quant_sse42.c | 118 __m128i src_r0, src_r1, src_r2, src_r3; local 132 src_r3 = _mm_loadl_epi64((__m128i *) (&pu1_src[3 * src_strd])); //a30 a31 a32 a33 0 0 0 0 0 0 0 0 -- all 8 bits 137 src_r3 = _mm_cvtepu8_epi16(src_r3); 152 src_r3 = _mm_sub_epi16(src_r3, pred_r3); 166 temp2 = _mm_unpacklo_epi16(src_r2, src_r3); //c0 d0 c1 d1 c2 d2 c3 d3 173 src_r3 = _mm_unpackhi_epi64(temp3, zero_8x16b); //a3 b3 c3 d3 177 temp0 = _mm_add_epi16(src_r0, src_r3); 183 temp3 = _mm_sub_epi16(src_r0, src_r3); 392 __m128i src_r0, src_r1, src_r2, src_r3; local 676 __m128i src_r0, src_r1, src_r2, src_r3; local [all...] |
ih264_iquant_itrans_recon_sse42.c | 114 __m128i src_r0, src_r1, src_r2, src_r3; local 147 src_r3 = _mm_unpackhi_epi16(src_r2_r3, zero_8x16b); // a30 0 a31 0 a32 0 a33 0 -- 16 bit long 152 temp7 = _mm_madd_epi16(src_r3, temp7); 363 __m128i src_r0, src_r1, src_r2, src_r3; local 398 src_r3 = _mm_unpackhi_epi16(src_r2_r3, zero_8x16b); // a30 0 a31 0 a32 0 a33 0 -- 16 bit long 403 temp7 = _mm_madd_epi16(src_r3, temp7);
|
ih264_iquant_itrans_recon_ssse3.c | 114 __m128i src_r0, src_r1, src_r2, src_r3; local 148 src_r3 = _mm_unpackhi_epi16(src_r2_r3, zero_8x16b); // a30 0 a31 0 a32 0 a33 0 -- 16 bit long 153 temp7 = _mm_madd_epi16(src_r3, temp7); [all...] |
/external/libmpeg2/common/x86/ |
impeg2_inter_pred_sse42_intr.c | 76 __m128i src_r0, src_r1, src_r2, src_r3; local 87 src_r3 = _mm_loadu_si128((__m128i *) (src + 3 * src_wd)); 92 _mm_storeu_si128((__m128i *) (dst + 3 * dst_wd), src_r3); 100 src_r3 = _mm_loadu_si128((__m128i *) (src + 3 * src_wd)); 105 _mm_storeu_si128((__m128i *) (dst + 3 * dst_wd), src_r3); 113 src_r3 = _mm_loadu_si128((__m128i *) (src + 3 * src_wd)); 118 _mm_storeu_si128((__m128i *) (dst + 3 * dst_wd), src_r3); 126 src_r3 = _mm_loadu_si128((__m128i *) (src + 3 * src_wd)); 131 _mm_storeu_si128((__m128i *) (dst + 3 * dst_wd), src_r3); 146 src_r3 = _mm_loadl_epi64((__m128i *)(src + 3 * src_wd)) 873 __m128i src_r0, src_r1, src_r2, src_r3; local [all...] |
/external/libavc/encoder/x86/ |
ime_distortion_metrics_sse42.c | 108 __m128i src_r0, src_r1, src_r2, src_r3; local 119 src_r3 = _mm_loadu_si128((__m128i *) (pu1_src + 3*src_strd)); 129 res_r3 = _mm_sad_epu8(src_r3, est_r3); 142 src_r3 = _mm_loadu_si128((__m128i *) (pu1_src + 3*src_strd)); 152 res_r3 = _mm_sad_epu8(src_r3, est_r3); 165 src_r3 = _mm_loadu_si128((__m128i *) (pu1_src + 3*src_strd)); 175 res_r3 = _mm_sad_epu8(src_r3, est_r3); 188 src_r3 = _mm_loadu_si128((__m128i *) (pu1_src + 3*src_strd)); 198 res_r3 = _mm_sad_epu8(src_r3, est_r3); 252 __m128i src_r0, src_r1, src_r2, src_r3; local 348 __m128i src_r0, src_r1, src_r2, src_r3; local 503 __m128i src_r0, src_r1, src_r2, src_r3; local 1728 __m128i src_r0, src_r1, src_r2, src_r3; local [all...] |