/external/libhevc/common/x86/ |
ihevc_32x32_itrans_recon_sse42_intr.c | 196 __m128i m_coeff1, m_coeff2, m_coeff3, m_coeff4; local 343 m_coeff1 = _mm_loadu_si128((__m128i *)&g_ai2_ihevc_trans_32_intr_packed[0][0]); //90 358 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); 374 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_14, m_coeff1); 599 m_coeff1 = _mm_loadu_si128((__m128i *)&g_ai2_ihevc_trans_16_even_packed[0][0]); //83 36 654 m_coeff1 = _mm_loadu_si128((__m128i *)&g_ai2_ihevc_trans_16_even_packed[4][0]); //89 75 671 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); 681 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_14, m_coeff1); 779 m_coeff1 = _mm_loadu_si128((__m128i *)&g_ai2_ihevc_trans_32_intr_packed[0][0]); //90 87 798 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); [all...] |
ihevc_itrans_recon_32x32_ssse3_intr.c | 204 __m128i m_coeff1, m_coeff2, m_coeff3, m_coeff4; local 352 m_coeff1 = _mm_load_si128((__m128i *)&g_ai2_ihevc_trans_32_intr_packed[0][0]); //90 368 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); 385 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_14, m_coeff1); 610 m_coeff1 = _mm_load_si128((__m128i *)&g_ai2_ihevc_trans_16_even_packed[0][0]); //83 36 665 m_coeff1 = _mm_load_si128((__m128i *)&g_ai2_ihevc_trans_16_even_packed[4][0]); //89 75 682 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); 692 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_14, m_coeff1); 790 m_coeff1 = _mm_load_si128((__m128i *)&g_ai2_ihevc_trans_32_intr_packed[0][0]); //90 87 808 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); [all...] |
ihevc_itrans_recon_sse42_intr.c | 144 __m128i m_coeff1, m_coeff2, m_coeff3; local 201 m_coeff1 = _mm_loadu_si128((__m128i *)&g_ai4_ihevc_trans_4_ttype1[1][0]); //29 206 m_temp_reg_30 = _mm_mullo_epi32(m_temp_reg_10, m_coeff1); //29*c0 211 m_temp_reg_32 = _mm_mullo_epi32(m_temp_reg_11, m_coeff1); //29*c1 217 m_temp_reg_35 = _mm_mullo_epi32(m_temp_reg_12, m_coeff1); //29*c2 297 m_temp_reg_30 = _mm_mullo_epi32(m_temp_reg_0, m_coeff1); //29*c0 302 m_temp_reg_32 = _mm_mullo_epi32(m_temp_reg_1, m_coeff1); //29*c1 308 m_temp_reg_35 = _mm_mullo_epi32(m_temp_reg_2, m_coeff1); //29*c2 473 __m128i m_coeff1, m_coeff3; local 499 m_coeff1 = _mm_loadu_si128((__m128i *)&g_ai4_ihevc_trans_4_ttype0[0][0]); //3 845 __m128i m_coeff1, m_coeff2, m_coeff3, m_coeff4; local [all...] |
ihevc_itrans_recon_ssse3_intr.c | 226 //m_temp_reg_30 = _mm_mullo_epi32(m_temp_reg_10, m_coeff1);//29*c0 240 //m_temp_reg_32 = _mm_mullo_epi32(m_temp_reg_11, m_coeff1);//29*c1 260 //m_temp_reg_35 = _mm_mullo_epi32(m_temp_reg_12, m_coeff1);//29*c2 364 //m_temp_reg_30 = _mm_mullo_epi32(m_temp_reg_0, m_coeff1);//29*c0 378 //m_temp_reg_32 = _mm_mullo_epi32(m_temp_reg_1, m_coeff1);//29*c1 398 //m_temp_reg_35 = _mm_mullo_epi32(m_temp_reg_2, m_coeff1);//29*c2 625 //m_temp_reg_12 = _mm_mullo_epi32(m_temp_reg_1, m_coeff1);//src[1]*36 646 //m_temp_reg_15 = _mm_mullo_epi32(m_temp_reg_3, m_coeff1);//src[3]*36 740 m_temp_reg_12 = _mm_mullo_epi32(m_temp_reg_22, m_coeff1);//src[1]*36 743 m_temp_reg_15 = _mm_mullo_epi32(m_temp_reg_23, m_coeff1);//src[3]*3 1020 __m128i m_coeff1, m_coeff2, m_coeff3, m_coeff4; local [all...] |
ihevc_16x16_itrans_recon_sse42_intr.c | 160 __m128i m_coeff1, m_coeff2, m_coeff3, m_coeff4; local 243 m_coeff1 = _mm_loadu_si128((__m128i *)&g_ai2_ihevc_trans_16_even[2][0]); //89 75 256 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); 275 m_temp_reg_31 = _mm_madd_epi16(m_temp_reg_11, m_coeff1); 325 m_coeff1 = _mm_loadu_si128((__m128i *)&g_ai2_ihevc_trans_16_even[8][0]); //50 -89 331 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); 347 m_temp_reg_31 = _mm_madd_epi16(m_temp_reg_11, m_coeff1); 400 m_coeff1 = _mm_loadu_si128((__m128i *)&g_ai2_ihevc_trans_16_even[6][0]); //83 36 406 m_temp_reg_20 = _mm_madd_epi16(m_temp_reg_0, m_coeff1); 409 m_temp_reg_21 = _mm_madd_epi16(m_temp_reg_1, m_coeff1); [all...] |
ihevc_itrans_recon_16x16_ssse3_intr.c | 164 __m128i m_coeff1, m_coeff2, m_coeff3, m_coeff4; local 249 m_coeff1 = _mm_load_si128((__m128i *)&g_ai2_ihevc_trans_16_even[2][0]); //89 75 262 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); 281 m_temp_reg_31 = _mm_madd_epi16(m_temp_reg_11, m_coeff1); 331 m_coeff1 = _mm_load_si128((__m128i *)&g_ai2_ihevc_trans_16_even[8][0]); //50 -89 337 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_10, m_coeff1); 353 m_temp_reg_31 = _mm_madd_epi16(m_temp_reg_11, m_coeff1); 406 m_coeff1 = _mm_load_si128((__m128i *)&g_ai2_ihevc_trans_16_even[6][0]); //83 36 412 m_temp_reg_20 = _mm_madd_epi16(m_temp_reg_0, m_coeff1); 415 m_temp_reg_21 = _mm_madd_epi16(m_temp_reg_1, m_coeff1); [all...] |
/external/libmpeg2/common/x86/ |
impeg2_idct_recon_sse42_intr.c | 183 __m128i m_coeff1, m_coeff2, m_coeff3, m_coeff4; local 221 m_coeff1 = _mm_loadu_si128((__m128i *)&gai2_impeg2_idct_even_8_q15[0][0]); 225 m_temp_reg_10 = _mm_madd_epi16(m_temp_reg_0, m_coeff1); 236 m_coeff1 = _mm_loadu_si128((__m128i *)&gai2_impeg2_idct_even_8_q15[1][0]); //sub 2B*36-6B*83 ,2T*36-6T*83 243 m_temp_reg_16 = _mm_madd_epi16(m_temp_reg_4, m_coeff1); 252 m_coeff1 = _mm_loadu_si128((__m128i *)&gai2_impeg2_idct_odd_8_q15[0][0]); 279 m_temp_reg_30 = _mm_madd_epi16(m_temp_reg_60, m_coeff1); 312 m_coeff1 = _mm_loadu_si128((__m128i *)&gai2_impeg2_idct_odd_8_q15[4][0]); 334 m_temp_reg_34 = _mm_madd_epi16(m_temp_reg_60, m_coeff1); 429 m_coeff1 = _mm_loadu_si128((__m128i *)&gai2_impeg2_idct_even_8_q15[0][0]) [all...] |