/external/libmpeg2/common/x86/ |
impeg2_inter_pred_sse42_intr.c | 143 src_r0 = _mm_loadl_epi64((__m128i *)src); 144 src_r1 = _mm_loadl_epi64((__m128i *)(src + src_wd)); 145 src_r2 = _mm_loadl_epi64((__m128i *)(src + 2 * src_wd)); 146 src_r3 = _mm_loadl_epi64((__m128i *)(src + 3 * src_wd)); 157 src_r0 = _mm_loadl_epi64((__m128i *)src); 158 src_r1 = _mm_loadl_epi64((__m128i *)(src + src_wd)); 159 src_r2 = _mm_loadl_epi64((__m128i *)(src + 2 * src_wd)); 160 src_r3 = _mm_loadl_epi64((__m128i *)(src + 3 * src_wd)); 173 src_r0 = _mm_loadl_epi64((__m128i *)src); 174 src_r1 = _mm_loadl_epi64((__m128i *)(src + src_wd)) [all...] |
icv_sad_ssse3.c | 108 src_r0 = (__m128)_mm_loadl_epi64((__m128i *) (pu1_src)); 111 src_r1 = (__m128)_mm_loadl_epi64((__m128i *) (pu1_src)); 122 ref_r0 = (__m128)_mm_loadl_epi64((__m128i *) (pu1_ref)); 125 ref_r1 = (__m128)_mm_loadl_epi64((__m128i *) (pu1_ref));
|
ideint_spatial_filter_ssse3.c | 119 row1_m1 = _mm_loadl_epi64((__m128i *) (pu1_src - 1)); 120 row1_0 = _mm_loadl_epi64((__m128i *) (pu1_src)); 121 row1_p1 = _mm_loadl_epi64((__m128i *) (pu1_src + 1)); 134 row2_m1 = _mm_loadl_epi64((__m128i *) (pu1_src - 1)); 135 row2_0 = _mm_loadl_epi64((__m128i *) (pu1_src)); 136 row2_p1 = _mm_loadl_epi64((__m128i *) (pu1_src + 1));
|
icv_variance_ssse3.c | 110 src_r0 = (__m128)_mm_loadl_epi64((__m128i *) (pu1_src)); 113 src_r1 = (__m128)_mm_loadl_epi64((__m128i *) (pu1_src));
|
/external/libhevc/common/x86/ |
ihevc_inter_pred_filters_sse42_intr.c | 130 src0_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src)); /* row =0 */ 131 src1_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src + 1 * src_strd)); /* row =1 */ 132 src2_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src + 2 * src_strd)); /* row =2 */ 133 src3_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src + 3 * src_strd)); /* row =3 */ 166 src0_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src)); /* row =0 */ 167 src1_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src + 1 * src_strd)); /* row =1 */ 168 src2_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src + 2 * src_strd)); /* row =2 */ 169 src3_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src + 3 * src_strd)); /* row =3 */ 288 src0_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src)); /* row =0 */ 289 src1_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src + 1 * src_strd)); /* row =1 * [all...] |
ihevc_inter_pred_filters_ssse3_intr.c | 168 src0_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src)); /* row =0 */ 169 src1_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src + 1 * src_strd)); /* row =1 */ 170 src2_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src + 2 * src_strd)); /* row =2 */ 171 src3_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src + 3 * src_strd)); /* row =3 */ 195 src0_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src)); /* row =0 */ 196 src1_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src + 1 * src_strd)); /* row =1 */ 197 src2_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src + 2 * src_strd)); /* row =2 */ 198 src3_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src + 3 * src_strd)); /* row =3 */ 292 src_temp1_16x8b = _mm_loadl_epi64((__m128i *)pi1_coeff); 453 res_temp7_8x16b = _mm_loadl_epi64((__m128i *)(pu1_dst + offset)) [all...] |
ihevc_deblk_ssse3_intr.c | 144 src_row0_8x16b = _mm_loadl_epi64((__m128i *)(pu1_src - 4)); 145 src_row3_8x16b = _mm_loadl_epi64((__m128i *)((pu1_src - 4) + 3 * src_strd)); 241 src_row1_8x16b = _mm_loadl_epi64((__m128i *)((pu1_src - 4) + src_strd)); 242 src_row2_8x16b = _mm_loadl_epi64((__m128i *)((pu1_src - 4) + 2 * src_strd)); 295 temp_str0_16x8b = _mm_loadl_epi64((__m128i *)(&mask)); 296 const2tc_8x16b = _mm_loadl_epi64((__m128i *)(&tc2)); 429 mask_pq_8x16b = _mm_loadl_epi64((__m128i *)(&mask1)); 459 tmp2_const_8x16b = _mm_loadl_epi64((__m128i *)(shuffle0)); 584 src_q0_8x16b = _mm_loadl_epi64((__m128i *)(pu1_src)); 585 src_q1_8x16b = _mm_loadl_epi64((__m128i *)(pu1_src + src_strd)) [all...] |
ihevc_mem_fns_ssse3_intr.c | 86 src_temp16x8b = _mm_loadl_epi64((__m128i *)(pu1_src));
|
/external/libavc/common/x86/ |
ih264_weighted_pred_sse42.c | 101 y0_0_16x8b = _mm_loadl_epi64((__m128i *)pu1_src1); 102 y0_1_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src1 + src_strd1)); 103 y0_2_16x8b = _mm_loadl_epi64( 105 y0_3_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src1 + src_strd1 * 3)); 107 y1_0_16x8b = _mm_loadl_epi64((__m128i *)pu1_src2); 108 y1_1_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src2 + src_strd2)); 109 y1_2_16x8b = _mm_loadl_epi64( 111 y1_3_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src2 + src_strd2 * 3)); 134 y0_0_16x8b = _mm_loadl_epi64((__m128i *)pu1_src1); 135 y0_1_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src1 + src_strd1)) [all...] |
ih264_iquant_itrans_recon_dc_ssse3.c | 136 predload_r = _mm_loadl_epi64((__m128i *) (&pu1_pred[0])); //p00 p01 p02 p03 0 0 0 0 0 0 0 0 -- all 8 bits 138 predload_r = _mm_loadl_epi64((__m128i *) (&pu1_pred[pred_strd])); //p10 p11 p12 p13 0 0 0 0 0 0 0 0 -- all 8 bits 140 predload_r = _mm_loadl_epi64((__m128i *) (&pu1_pred[2*pred_strd])); //p20 p21 p22 p23 0 0 0 0 0 0 0 0 -- all 8 bits 142 predload_r = _mm_loadl_epi64((__m128i *) (&pu1_pred[3*pred_strd])); //p30 p31 p32 p33 0 0 0 0 0 0 0 0 -- all 8 bits 258 predload_r = _mm_loadl_epi64((__m128i *)(&pu1_pred[0])); //p0 p1 p2 p3 p4 p5 p6 p7 0 0 0 0 0 0 0 0 -- all 8 bits 261 predload_r = _mm_loadl_epi64((__m128i *)(&pu1_pred[pred_strd])); //p0 p1 p2 p3 p4 p5 p6 p7 0 0 0 0 0 0 0 0 -- all 8 bits 264 predload_r = _mm_loadl_epi64( 268 predload_r = _mm_loadl_epi64( 272 predload_r = _mm_loadl_epi64( 276 predload_r = _mm_loadl_epi64( [all...] |
ih264_mem_fns_ssse3.c | 87 src_temp16x8b = _mm_loadl_epi64((__m128i *)(pu1_src));
|
ih264_iquant_itrans_recon_sse42.c | 230 pred_r0 = _mm_loadl_epi64((__m128i *) (&pu1_pred[0])); //p00 p01 p02 p03 0 0 0 0 0 0 0 0 -- all 8 bits 231 pred_r1 = _mm_loadl_epi64((__m128i *) (&pu1_pred[pred_strd])); //p10 p11 p12 p13 0 0 0 0 0 0 0 0 -- all 8 bits 232 pred_r2 = _mm_loadl_epi64((__m128i *) (&pu1_pred[2 * pred_strd])); //p20 p21 p22 p23 0 0 0 0 0 0 0 0 -- all 8 bits 233 pred_r3 = _mm_loadl_epi64((__m128i *) (&pu1_pred[3 * pred_strd])); //p30 p31 p32 p33 0 0 0 0 0 0 0 0 -- all 8 bits 480 pred_r0 = _mm_loadl_epi64((__m128i *) (&pu1_pred[0])); //p00 p01 p02 p03 0 0 0 0 0 0 0 0 -- all 8 bits 481 pred_r1 = _mm_loadl_epi64((__m128i *) (&pu1_pred[pred_strd])); //p10 p11 p12 p13 0 0 0 0 0 0 0 0 -- all 8 bits 482 pred_r2 = _mm_loadl_epi64((__m128i *) (&pu1_pred[2 * pred_strd])); //p20 p21 p22 p23 0 0 0 0 0 0 0 0 -- all 8 bits 483 pred_r3 = _mm_loadl_epi64((__m128i *) (&pu1_pred[3 * pred_strd])); //p30 p31 p32 p33 0 0 0 0 0 0 0 0 -- all 8 bits 553 out_r0 = _mm_loadl_epi64((__m128i *) (&pu1_out[0])); 554 out_r1 = _mm_loadl_epi64((__m128i *) (&pu1_out[out_strd])) [all...] |
ih264_deblk_chroma_ssse3.c | 115 linea = _mm_loadl_epi64((__m128i *)(pu1_src_uv - 4)); 116 lineb = _mm_loadl_epi64((__m128i *)(pu1_src_uv - 4 + src_strd)); 117 linec = _mm_loadl_epi64((__m128i *)(pu1_src_uv - 4 + 2 * src_strd)); 118 lined = _mm_loadl_epi64((__m128i *)(pu1_src_uv - 4 + 3 * src_strd)); 119 linee = _mm_loadl_epi64((__m128i *)(pu1_src_uv - 4 + 4 * src_strd)); 120 linef = _mm_loadl_epi64((__m128i *)(pu1_src_uv - 4 + 5 * src_strd)); 121 lineg = _mm_loadl_epi64((__m128i *)(pu1_src_uv - 4 + 6 * src_strd)); 122 lineh = _mm_loadl_epi64((__m128i *)(pu1_src_uv - 4 + 7 * src_strd)); 464 linea = _mm_loadl_epi64((__m128i *)(pu1_src_uv - 4)); 465 lineb = _mm_loadl_epi64((__m128i *)(pu1_src_uv - 4 + src_strd)) [all...] |
/external/libhevc/decoder/x86/ |
ihevcd_it_rec_dc_sse42_intr.c | 97 m_temp_reg_0 = _mm_loadl_epi64((__m128i *)(pu1_pred)); 98 m_temp_reg_1 = _mm_loadl_epi64((__m128i *)(pu1_pred + pred_strd)); 99 m_temp_reg_2 = _mm_loadl_epi64((__m128i *)(pu1_pred + 2 * pred_strd)); 100 m_temp_reg_3 = _mm_loadl_epi64((__m128i *)(pu1_pred + 3 * pred_strd)); 140 m_temp_reg_0 = _mm_loadl_epi64((__m128i *)pu1_pred); 141 m_temp_reg_1 = _mm_loadl_epi64((__m128i *)(pu1_pred + pred_strd)); 142 m_temp_reg_2 = _mm_loadl_epi64((__m128i *)(pu1_pred + 2 * pred_strd)); 143 m_temp_reg_3 = _mm_loadl_epi64((__m128i *)(pu1_pred + 3 * pred_strd)); 244 m_temp_reg_0 = _mm_loadl_epi64((__m128i *)(pu1_pred)); 245 m_temp_reg_1 = _mm_loadl_epi64((__m128i *)(pu1_pred + pred_strd)) [all...] |
ihevcd_it_rec_dc_ssse3_intr.c | 98 m_temp_reg_0 = _mm_loadl_epi64((__m128i *)(pu1_pred)); 99 m_temp_reg_1 = _mm_loadl_epi64((__m128i *)(pu1_pred + pred_strd)); 100 m_temp_reg_2 = _mm_loadl_epi64((__m128i *)(pu1_pred + 2 * pred_strd)); 101 m_temp_reg_3 = _mm_loadl_epi64((__m128i *)(pu1_pred + 3 * pred_strd)); 141 m_temp_reg_0 = _mm_loadl_epi64((__m128i *)pu1_pred); 142 m_temp_reg_1 = _mm_loadl_epi64((__m128i *)(pu1_pred + pred_strd)); 143 m_temp_reg_2 = _mm_loadl_epi64((__m128i *)(pu1_pred + 2 * pred_strd)); 144 m_temp_reg_3 = _mm_loadl_epi64((__m128i *)(pu1_pred + 3 * pred_strd)); 244 m_temp_reg_0 = _mm_loadl_epi64((__m128i *)(pu1_pred)); 245 m_temp_reg_1 = _mm_loadl_epi64((__m128i *)(pu1_pred + pred_strd)) [all...] |
/external/opencv3/3rdparty/libwebp/dsp/ |
enc_sse2.c | 133 in0 = _mm_loadl_epi64((__m128i*)&in[0]); 134 in1 = _mm_loadl_epi64((__m128i*)&in[4]); 135 in2 = _mm_loadl_epi64((__m128i*)&in[8]); 136 in3 = _mm_loadl_epi64((__m128i*)&in[12]); 142 const __m128i inB0 = _mm_loadl_epi64((__m128i*)&in[16]); 143 const __m128i inB1 = _mm_loadl_epi64((__m128i*)&in[20]); 144 const __m128i inB2 = _mm_loadl_epi64((__m128i*)&in[24]); 145 const __m128i inB3 = _mm_loadl_epi64((__m128i*)&in[28]); 282 ref0 = _mm_loadl_epi64((__m128i*)&ref[0 * BPS]); 283 ref1 = _mm_loadl_epi64((__m128i*)&ref[1 * BPS]) [all...] |
/external/libvpx/libvpx/vp9/encoder/x86/ |
vp9_avg_intrin_sse2.c | 21 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s)), u0); 22 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d)), u0); 27 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s + p)), u0); 28 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d + dp)), u0); 35 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s + 2 * p)), u0); 36 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d + 2 * dp)), u0); 43 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s + 3 * p)), u0); 44 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d + 3 * dp)), u0); 51 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s + 4 * p)), u0); 52 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d + 4 * dp)), u0) [all...] |
/external/libvpx/libvpx/vpx_dsp/x86/ |
vpx_subpixel_8t_intrin_ssse3.c | 236 srcReg1 = _mm_loadl_epi64((const __m128i *)src_ptr); 237 srcReg2 = _mm_loadl_epi64((const __m128i *)(src_ptr + src_pitch)); 238 srcReg3 = _mm_loadl_epi64((const __m128i *)(src_ptr + src_pitch * 2)); 239 srcReg4 = _mm_loadl_epi64((const __m128i *)(src_ptr + src_pitch * 3)); 240 srcReg5 = _mm_loadl_epi64((const __m128i *)(src_ptr + src_pitch * 4)); 241 srcReg6 = _mm_loadl_epi64((const __m128i *)(src_ptr + src_pitch * 5)); 242 srcReg7 = _mm_loadl_epi64((const __m128i *)(src_ptr + src_pitch * 6)); 246 srcReg8 = _mm_loadl_epi64((const __m128i *)(src_ptr + src_pitch * 7)); 382 const __m128i A = _mm_loadl_epi64((const __m128i *)src_x); 383 const __m128i B = _mm_loadl_epi64((const __m128i *)(src_x + src_pitch)) [all...] |
loopfilter_sse2.c | 35 q4p4 = _mm_loadl_epi64((__m128i *)(s - 5 * p)); 38 q3p3 = _mm_loadl_epi64((__m128i *)(s - 4 * p)); 41 q2p2 = _mm_loadl_epi64((__m128i *)(s - 3 * p)); 44 q1p1 = _mm_loadl_epi64((__m128i *)(s - 2 * p)); 48 q0p0 = _mm_loadl_epi64((__m128i *)(s - 1 * p)); 136 q5p5 = _mm_loadl_epi64((__m128i *)(s - 6 * p)); 140 q6p6 = _mm_loadl_epi64((__m128i *)(s - 7 * p)); 145 q7p7 = _mm_loadl_epi64((__m128i *)(s - 8 * p)); [all...] |
/external/neven/Embedded/common/src/b_BasicEm/ |
MathSSE2.c | 55 m_XMM0 = _mm_loadl_epi64( (__m128i *)&0[vec1L] ); 58 m_XMM1 = _mm_loadl_epi64( (__m128i *)&0[vec2L] ); 61 m_XMM2 = _mm_loadl_epi64( (__m128i *)&4[vec1L] ); 65 m_XMM3 = _mm_loadl_epi64( (__m128i *)&4[vec2L] ); 66 m_XMM4 = _mm_loadl_epi64( (__m128i *)&8[vec1L] ); 70 m_XMM5 = _mm_loadl_epi64( (__m128i *)&8[vec2L] ); 74 m_XMM6 = _mm_loadl_epi64( (__m128i *)&12[vec1L] ); 78 m_XMM8 = _mm_loadl_epi64( (__m128i *)&12[vec2L] ); 93 m_XMM0 = _mm_loadl_epi64( (__m128i *)&m_XMM7 );
|
/external/gemmlowp/internal/ |
pack_SSE.h | 101 _mm_loadl_epi64(reinterpret_cast<const __m128i*>(&src_data[0])); 102 __m128i xmm2 = _mm_loadl_epi64( 104 __m128i xmm3 = _mm_loadl_epi64( 106 __m128i xmm4 = _mm_loadl_epi64(
|
/external/webrtc/webrtc/modules/audio_processing/aec/ |
aec_rdft_sse2.c | 88 const __m128i a_00 = _mm_loadl_epi64((__m128i*)&a[j0 + 0]); 89 const __m128i a_08 = _mm_loadl_epi64((__m128i*)&a[j0 + 8]); 90 const __m128i a_32 = _mm_loadl_epi64((__m128i*)&a[j0 + 32]); 91 const __m128i a_40 = _mm_loadl_epi64((__m128i*)&a[j0 + 40]); 101 const __m128i a_16 = _mm_loadl_epi64((__m128i*)&a[j0 + 16]); 102 const __m128i a_24 = _mm_loadl_epi64((__m128i*)&a[j0 + 24]); 103 const __m128i a_48 = _mm_loadl_epi64((__m128i*)&a[j0 + 48]); 104 const __m128i a_56 = _mm_loadl_epi64((__m128i*)&a[j0 + 56]); 162 const __m128i a_00 = _mm_loadl_epi64((__m128i*)&a[j0 + 0]); 163 const __m128i a_08 = _mm_loadl_epi64((__m128i*)&a[j0 + 8]) [all...] |
/external/webp/src/dsp/ |
enc_sse2.c | 84 in0 = _mm_loadl_epi64((const __m128i*)&in[0]); 85 in1 = _mm_loadl_epi64((const __m128i*)&in[4]); 86 in2 = _mm_loadl_epi64((const __m128i*)&in[8]); 87 in3 = _mm_loadl_epi64((const __m128i*)&in[12]); 93 const __m128i inB0 = _mm_loadl_epi64((const __m128i*)&in[16]); 94 const __m128i inB1 = _mm_loadl_epi64((const __m128i*)&in[20]); 95 const __m128i inB2 = _mm_loadl_epi64((const __m128i*)&in[24]); 96 const __m128i inB3 = _mm_loadl_epi64((const __m128i*)&in[28]); 233 ref0 = _mm_loadl_epi64((const __m128i*)&ref[0 * BPS]); 234 ref1 = _mm_loadl_epi64((const __m128i*)&ref[1 * BPS]) [all...] |
enc_sse41.c | 78 const __m128i inA_0 = _mm_loadl_epi64((const __m128i*)&inA[BPS * 0]); 79 const __m128i inA_1 = _mm_loadl_epi64((const __m128i*)&inA[BPS * 1]); 80 const __m128i inA_2 = _mm_loadl_epi64((const __m128i*)&inA[BPS * 2]); 81 const __m128i inA_3 = _mm_loadl_epi64((const __m128i*)&inA[BPS * 3]); 82 const __m128i inB_0 = _mm_loadl_epi64((const __m128i*)&inB[BPS * 0]); 83 const __m128i inB_1 = _mm_loadl_epi64((const __m128i*)&inB[BPS * 1]); 84 const __m128i inB_2 = _mm_loadl_epi64((const __m128i*)&inB[BPS * 2]); 85 const __m128i inB_3 = _mm_loadl_epi64((const __m128i*)&inB[BPS * 3]);
|
/hardware/intel/common/omx-components/videocodec/libvpx_internal/libvpx/vp9/common/x86/ |
vp9_loopfilter_intrin_sse2.c | 29 q4p4 = _mm_loadl_epi64((__m128i *)(s - 5 * p)); 32 q3p3 = _mm_loadl_epi64((__m128i *)(s - 4 * p)); 35 q2p2 = _mm_loadl_epi64((__m128i *)(s - 3 * p)); 38 q1p1 = _mm_loadl_epi64((__m128i *)(s - 2 * p)); 42 q0p0 = _mm_loadl_epi64((__m128i *)(s - 1 * p)); 138 q5p5 = _mm_loadl_epi64((__m128i *)(s - 6 * p)); 142 q6p6 = _mm_loadl_epi64((__m128i *)(s - 7 * p)); 151 q7p7 = _mm_loadl_epi64((__m128i *)(s - 8 * p)); 576 p7 = _mm_unpacklo_epi8(_mm_loadl_epi64((__m128i *)(&ap[7 * 16] + off)), 578 p6 = _mm_unpacklo_epi8(_mm_loadl_epi64((__m128i *)(&ap[6 * 16] + off)) [all...] |