/external/libvpx/libvpx/vp9/common/mips/msa/ |
vp9_idct4x4_msa.c | 18 v8i16 in0, in1, in2, in3; local 21 LD4x4_SH(input, in0, in1, in2, in3); 22 TRANSPOSE4x4_SH_SH(in0, in1, in2, in3, in0, in1, in2, in3); 27 VP9_IDCT4x4(in0, in1, in2, in3, in0, in1, in2, in3); 29 TRANSPOSE4x4_SH_SH(in0, in1, in2, in3, in0, in1, in2, in3); 30 VP9_IDCT4x4(in0, in1, in2, in3, in0, in1, in2, in3) [all...] |
vp9_idct8x8_msa.c | 18 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local 21 LD_SH8(input, 8, in0, in1, in2, in3, in4, in5, in6, in7); 23 TRANSPOSE8x8_SH_SH(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3, 29 VP9_IDCT8x8_1D(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3, 32 TRANSPOSE8x8_SH_SH(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, 34 VP9_IDCT8x8_1D(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3 [all...] |
/external/libvpx/libvpx/vp9/common/x86/ |
vp9_idct_intrin_sse2.c | 121 __m128i in0[16], in1[16]; local 123 load_buffer_8x16(input, in0); 129 idct16_sse2(in0, in1); 130 idct16_sse2(in0, in1); 133 idct16_sse2(in0, in1); 134 iadst16_sse2(in0, in1); 137 iadst16_sse2(in0, in1); 138 idct16_sse2(in0, in1); 141 iadst16_sse2(in0, in1); 142 iadst16_sse2(in0, in1) [all...] |
/external/libvpx/libvpx/vp9/encoder/mips/msa/ |
vp9_fdct8x8_msa.c | 18 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local 20 LD_SH8(input, stride, in0, in1, in2, in3, in4, in5, in6, in7); 21 SLLI_4V(in0, in1, in2, in3, 2); 26 VP9_FDCT8(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3, in4, 28 TRANSPOSE8x8_SH_SH(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, 30 VP9_FDCT8(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3, in4, 34 VP9_ADST8(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3, in4 [all...] |
vp9_fdct4x4_msa.c | 18 v8i16 in0, in1, in2, in3, in4; local 20 LD_SH4(input, src_stride, in0, in1, in2, in3); 22 in0 += in1; 24 in4 = (in0 - in3) >> 1; 26 in0 -= in2; 29 TRANSPOSE4x4_SH_SH(in0, in2, in3, in1, in0, in2, in3, in1); 31 in0 += in2; 33 in4 = (in0 - in1) >> 1; 35 in0 -= in3 50 v8i16 in0, in1, in2, in3; local [all...] |
vp9_fdct16x16_msa.c | 368 v8i16 in0, in1, in2, in3, in4, in5, in6, in7, in8, in9, in10, in11; local 371 LD_SH8(temp, 16, in0, in1, in2, in3, in4, in5, in6, in7); 374 TRANSPOSE8x8_SH_SH(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3, 378 FDCT_POSTPROC_2V_NEG_H(in0, in1); 386 BUTTERFLY_16(in0, in1, in2, in3, in4, in5, in6, in7, in8, in9, in10, in11, 395 FDCT8x16_ODD(in8, in9, in10, in11, in12, in13, in14, in15, in0, in1, in2, in3, 397 TRANSPOSE8x8_SH_SH(tmp0, in0, tmp1, in1, tmp2, in2, tmp3, in3, tmp0, in0, 399 ST_SH8(tmp0, in0, tmp1, in1, tmp2, in2, tmp3, in3, out, 16) [all...] |
/external/libvpx/libvpx/vpx_dsp/mips/ |
idct4x4_msa.c | 15 v8i16 in0, in1, in2, in3; local 19 LD4x4_SH(input, in0, in2, in3, in1); 20 TRANSPOSE4x4_SH_SH(in0, in2, in3, in1, in0, in2, in3, in1); 21 UNPCK_R_SH_SW(in0, in0_r); 45 PCKEV_H4_SH(in0_r, in0_r, in1_r, in1_r, in2_r, in2_r, in3_r, in3_r, in0, in1, 47 ADDBLK_ST4x4_UB(in0, in3, in1, in2, dst, dst_stride); 53 v8i16 in1, in0 = { 0 }; local 59 in0 = __msa_insert_h(in0, 0, a1) 72 v8i16 in0, in1, in2, in3; local [all...] |
idct8x8_msa.c | 15 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local 18 LD_SH8(input, 8, in0, in1, in2, in3, in4, in5, in6, in7); 21 TRANSPOSE8x8_SH_SH(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3, 24 VP9_IDCT8x8_1D(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3, 27 TRANSPOSE8x8_SH_SH(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3, 30 VP9_IDCT8x8_1D(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3 43 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local [all...] |
fwd_txfm_msa.c | 16 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local 29 LD_SH16(input, src_stride, in0, in1, in2, in3, in4, in5, in6, in7, in8, in9, 31 SLLI_4V(in0, in1, in2, in3, 2); 35 ADD4(in0, in15, in1, in14, in2, in13, in3, in12, tmp0, tmp1, tmp2, tmp3); 40 SUB4(in0, in15, in1, in14, in2, in13, in3, in12, in15, in14, in13, in12); 135 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local 138 LD_SH8(input, 16, in0, in1, in2, in3, in4, in5, in6, in7); 140 TRANSPOSE8x8_SH_SH(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3, 144 ADD4(in0, 1, in1, 1, in2, 1, in3, 1, in0, in1, in2, in3) 171 v8i16 in0, in1, in2, in3; local 201 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local 219 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local 249 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local [all...] |
fwd_dct32x32_msa.c | 16 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local 22 LD_SH4(input, src_stride, in0, in1, in2, in3); 26 SLLI_4V(in0, in1, in2, in3, 2); 30 BUTTERFLY_8(in0, in1, in2, in3, in4, in5, in6, in7, step0, step1, step2, 40 LD_SH4(input + (8 * src_stride), src_stride, in0, in1, in2, in3); 44 SLLI_4V(in0, in1, in2, in3, 2); 48 BUTTERFLY_8(in0, in1, in2, in3, in4, in5, in6, in7, step0, step1, step2, 59 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local 65 LD_SH4(input, 8, in0, in1, in2, in3); 67 BUTTERFLY_8(in0, in1, in2, in3, in12, in13, in14, in15, vec0, vec1, vec2 255 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local 288 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local 392 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local 596 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local 695 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local 931 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local [all...] |
/external/libvpx/libvpx/vpx_dsp/x86/ |
fwd_txfm_sse2.c | 19 __m128i in0, in1; local 22 in0 = _mm_loadl_epi64((const __m128i *)(input + 0 * stride)); 26 in0 = _mm_unpacklo_epi64( 27 in0, _mm_loadl_epi64((const __m128i *)(input + 3 * stride))); 29 tmp = _mm_add_epi16(in0, in1); 30 in0 = _mm_unpacklo_epi16(zero, tmp); 32 in0 = _mm_srai_epi32(in0, 16); 35 tmp = _mm_add_epi32(in0, in1); 36 in0 = _mm_unpacklo_epi32(tmp, zero) 48 __m128i in0 = _mm_load_si128((const __m128i *)(input + 0 * stride)); local 89 __m128i in0, in1, in2, in3; local 158 __m128i in0, in1, in2, in3; local [all...] |
/external/libvpx/libvpx/vp8/encoder/mips/msa/ |
dct_msa.c | 14 #define TRANSPOSE4x4_H(in0, in1, in2, in3, out0, out1, out2, out3) \ 18 ILVR_H2_SH(in2, in0, in3, in1, s0_m, s1_m); \ 20 ILVL_H2_SH(in2, in0, in3, in1, s0_m, s1_m); \ 34 #define RET_1_IF_NZERO_H(in0) \ 39 tmp0_m = __msa_ceqi_h(in0, 0); \ 46 #define RET_1_IF_NZERO_W(in0) \ 51 tmp0_m = __msa_ceqi_w(in0, 0); \ 58 #define RET_1_IF_NEG_W(in0) \ 63 tmp0_m = __msa_clti_s_w(in0, 0); \ 70 v8i16 in0, in1, in2, in3 local 116 v8i16 in0, in1, in2, in3; local [all...] |
/system/bt/embdrv/sbc/decoder/srce/ |
synthesis-dct8.c | 97 double in0, in1, in2, in3; local 100 in0 = FLOAT_SCALE(in[0], DCTII_8_SHIFT_IN); 101 OI_ASSERT(VALID_INT32(in0)); 117 L00 = (in0 + in7); 132 L07 = (in0 - in7); 259 int32_t in0, in1, in2, in3; local 263 in0 = SCALE(in[0], DCTII_8_SHIFT_IN); 272 in0 = in[0]; 282 L00 = in0 + in7; 290 L07 = in0 - in7 [all...] |
/external/deqp/modules/gles3/functional/ |
es3fShaderPackingFunctionTests.cpp | 151 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, precision))); 154 m_spec.source = "out0 = packSnorm2x16(in0);"; 254 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP))); 257 m_spec.source = "out0 = unpackSnorm2x16(in0);"; 297 const deInt16 in0 = (deInt16)(deUint16)(inputs[valNdx] & 0xffff); local 299 const float ref0 = de::clamp(float(in0) / 32767.f, -1.0f, 1.0f); 342 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, precision))); 345 m_spec.source = "out0 = packUnorm2x16(in0);"; 445 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP))); 448 m_spec.source = "out0 = unpackUnorm2x16(in0);"; 488 const deUint16 in0 = (deUint16)(inputs[valNdx] & 0xffff); local 699 const deUint16 in0 = (deUint16)(inputs[valNdx] & 0xffff); local [all...] |
es3fShaderPrecisionTests.cpp | 99 op << "\t" << precName << " " << typeName << " in0 = " << (isVertexCase ? "a_" : "v_") << "in0;\n" 156 op << "\t" << precName << " " << typeName << " in0 = " << (isVertexCase ? "a_" : "v_") << "in0;\n" 180 typedef double (*EvalFunc) (double in0, double in1); 190 bool compare (float in0, float in1, double reference, float result); 286 bool ShaderFloatPrecisionCase::compare (float in0, float in1, double reference, float result) 299 const int in0Exp = tcu::Float32(in0).exponent(); 365 const float in0 = m_rnd.getFloat(m_rangeA.x(), m_rangeA.y()); local 367 const double refD = m_evalFunc((double)in0, (double)in1) 581 int in0 = deSignExtendTo32(((isMaxRangeA ? (int)m_rnd.getUint32() : m_rnd.getInt(m_rangeA.x(), m_rangeA.y())) & mask), m_bits); local 775 deUint32 in0 = (isMaxRangeA ? m_rnd.getUint32() : (m_rangeA.x() + m_rnd.getUint32()%(m_rangeA.y()-m_rangeA.x()+1))) & mask; local [all...] |
es3fShaderCommonFunctionTests.cpp | 425 m_spec.inputs.push_back(Symbol("in0", glu::VarType(baseType, precision))); 427 m_spec.source = "out0 = abs(in0);"; 469 const float in0 = ((const float*)inputs[0])[compNdx]; local 471 const float ref0 = de::abs(in0); 485 const int in0 = ((const int*)inputs[0])[compNdx]; local 487 const int ref0 = de::abs(in0); 507 m_spec.inputs.push_back(Symbol("in0", glu::VarType(baseType, precision))); 509 m_spec.source = "out0 = sign(in0);"; 562 const float in0 = ((const float*)inputs[0])[compNdx]; local 564 const float ref0 = in0 < 0.0f ? -1.0f 579 const int in0 = ((const int*)inputs[0])[compNdx]; local 668 const float in0 = ((const float*)inputs[0])[compNdx]; local 689 const float in0 = ((const float*)inputs[0])[compNdx]; local 758 const float in0 = ((const float*)inputs[0])[compNdx]; local 835 const float in0 = ((const float*)inputs[0])[compNdx]; local 916 const float in0 = ((const float*)inputs[0])[compNdx]; local 989 const float in0 = ((const float*)inputs[0])[compNdx]; local 1058 const float in0 = ((const float*)inputs[0])[compNdx]; local 1120 const float in0 = ((const float*)inputs[0])[compNdx]; local 1141 const float in0 = ((const float*)inputs[0])[compNdx]; local 1226 const float in0 = ((const float*)inputs[0])[compNdx]; local 1338 const float in0 = ((const float*)inputs[0])[compNdx]; local 1377 const float in0 = ((const float*)inputs[0])[compNdx]; local 1454 const float in0 = ((const float*)inputs[0])[compNdx]; local 1475 const float in0 = ((const float*)inputs[0])[compNdx]; local 1572 const float in0 = ((const float*)inputs[0])[compNdx]; local 1592 const float in0 = ((const float*)inputs[0])[compNdx]; local [all...] |
/external/icu/icu4c/source/test/intltest/ |
dtfmtrtts.cpp | 408 UBool in0; local 413 else if((in0=fmt->getTimeZone().inDaylightTime(d[0], status)) && ! failure(status, "gettingDaylightTime") && 417 else if (!in0 &&
|
/external/deqp/modules/gles31/functional/ |
es31fShaderPackingFunctionTests.cpp | 155 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, precision))); 158 m_spec.source = "out0 = packSnorm2x16(in0);"; 258 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP))); 261 m_spec.source = "out0 = unpackSnorm2x16(in0);"; 301 const deInt16 in0 = (deInt16)(deUint16)(inputs[valNdx] & 0xffff); local 303 const float ref0 = de::clamp(float(in0) / 32767.f, -1.0f, 1.0f); 346 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, precision))); 349 m_spec.source = "out0 = packUnorm2x16(in0);"; 449 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP))); 452 m_spec.source = "out0 = unpackUnorm2x16(in0);"; 492 const deUint16 in0 = (deUint16)(inputs[valNdx] & 0xffff); local 703 const deUint16 in0 = (deUint16)(inputs[valNdx] & 0xffff); local 909 const deInt8 in0 = (deInt8)(deUint8)(inputs[valNdx] & 0xff); local 1118 const deUint8 in0 = (deUint8)(inputs[valNdx] & 0xff); local [all...] |
es31fShaderCommonFunctionTests.cpp | 503 m_spec.inputs.push_back(Symbol("in0", glu::VarType(baseType, precision))); 505 m_spec.source = "out0 = abs(in0);"; 547 const float in0 = ((const float*)inputs[0])[compNdx]; local 549 const float ref0 = de::abs(in0); 563 const int in0 = ((const int*)inputs[0])[compNdx]; local 565 const int ref0 = de::abs(in0); 585 m_spec.inputs.push_back(Symbol("in0", glu::VarType(baseType, precision))); 587 m_spec.source = "out0 = sign(in0);"; 640 const float in0 = ((const float*)inputs[0])[compNdx]; local 642 const float ref0 = in0 < 0.0f ? -1.0f 657 const int in0 = ((const int*)inputs[0])[compNdx]; local 746 const float in0 = ((const float*)inputs[0])[compNdx]; local 767 const float in0 = ((const float*)inputs[0])[compNdx]; local 836 const float in0 = ((const float*)inputs[0])[compNdx]; local 913 const float in0 = ((const float*)inputs[0])[compNdx]; local 929 const float in0 = ((const float*)inputs[0])[compNdx]; local 996 const float in0 = ((const float*)inputs[0])[compNdx]; local 1012 const float in0 = ((const float*)inputs[0])[compNdx]; local 1072 const float in0 = ((const float*)inputs[0])[compNdx]; local 1141 const float in0 = ((const float*)inputs[0])[compNdx]; local 1203 const float in0 = ((const float*)inputs[0])[compNdx]; local 1224 const float in0 = ((const float*)inputs[0])[compNdx]; local 1309 const float in0 = ((const float*)inputs[0])[compNdx]; local 1421 const float in0 = ((const float*)inputs[0])[compNdx]; local 1460 const float in0 = ((const float*)inputs[0])[compNdx]; local 1537 const float in0 = ((const float*)inputs[0])[compNdx]; local 1558 const float in0 = ((const float*)inputs[0])[compNdx]; local 1655 const float in0 = ((const float*)inputs[0])[compNdx]; local 1675 const float in0 = ((const float*)inputs[0])[compNdx]; local [all...] |
es31fShaderIntegerFunctionTests.cpp | 377 deUint32* in0 = (deUint32*)values[0]; local 401 in0[easyCaseNdx*scalarSize + compNdx] = easyCases[easyCaseNdx].x & integerMask; 413 in0[easyCaseNdx*scalarSize + compNdx] = extendSignTo32(in0[easyCaseNdx*scalarSize + compNdx], integerLength); 419 generateRandomInputData(rnd, m_shaderType, type, precision, in0, numValues - DE_LENGTH_OF_ARRAY(easyCases)); 433 const deUint32 in0 = ((const deUint32*)inputs[0])[compNdx]; local 437 const deUint32 ref0 = in0+in1; 438 const deUint32 ref1 = (deUint64(in0)+deUint64(in1)) > 0xffffffffu ? 1u : 0u; 473 deUint32* in0 = (deUint32*)values[0]; local 495 in0[easyCaseNdx*scalarSize + compNdx] = easyCases[easyCaseNdx].x & integerMask 527 const deUint32 in0 = ((const deUint32*)inputs[0])[compNdx]; local 564 deUint32* in0 = (deUint32*)values[0]; local 616 const deUint32 in0 = ((const deUint32*)inputs[0])[compNdx]; local 654 deUint32* in0 = (deUint32*)values[0]; local 707 const deInt32 in0 = ((const deInt32*)inputs[0])[compNdx]; local [all...] |
/external/libjpeg-turbo/simd/ |
jquanti-altivec.c | 57 __vector unsigned char in0, in1, in2, in3, in4, in5, in6, in7; local 73 out0 = (__vector short)VEC_UNPACKHU(in0);
|
/external/deqp/external/vulkancts/modules/vulkan/shaderexecutor/ |
vktShaderPackingFunctionTests.cpp | 261 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, precision))); 264 m_spec.source = "out0 = packSnorm2x16(in0);"; 320 const deInt16 in0 = (deInt16)(deUint16)(inputs[valNdx] & 0xffff); local 322 const float ref0 = de::clamp(float(in0) / 32767.f, -1.0f, 1.0f); 365 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP))); 368 m_spec.source = "out0 = unpackSnorm2x16(in0);"; 484 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, precision))); 487 m_spec.source = "out0 = packUnorm2x16(in0);"; 543 const deUint16 in0 = (deUint16)(inputs[valNdx] & 0xffff); local 545 const float ref0 = float(in0) / 65535.0f 785 const deUint16 in0 = (deUint16)(inputs[valNdx] & 0xffff); local 1024 const deInt8 in0 = (deInt8)(deUint8)(inputs[valNdx] & 0xff); local 1267 const deUint8 in0 = (deUint8)(inputs[valNdx] & 0xff); local [all...] |
vktShaderIntegerFunctionTests.cpp | 468 deUint32* in0 = (deUint32*)values[0]; local 492 in0[easyCaseNdx*scalarSize + compNdx] = easyCases[easyCaseNdx].x & integerMask; 504 in0[easyCaseNdx*scalarSize + compNdx] = extendSignTo32(in0[easyCaseNdx*scalarSize + compNdx], integerLength); 510 generateRandomInputData(rnd, m_shaderType, type, precision, in0, numValues - DE_LENGTH_OF_ARRAY(easyCases)); 524 const deUint32 in0 = ((const deUint32*)inputs[0])[compNdx]; local 528 const deUint32 ref0 = in0+in1; 529 const deUint32 ref1 = (deUint64(in0)+deUint64(in1)) > 0xffffffffu ? 1u : 0u; 578 deUint32* in0 = (deUint32*)values[0]; local 600 in0[easyCaseNdx*scalarSize + compNdx] = easyCases[easyCaseNdx].x & integerMask 632 const deUint32 in0 = ((const deUint32*)inputs[0])[compNdx]; local 683 deUint32* in0 = (deUint32*)values[0]; local 735 const deUint32 in0 = ((const deUint32*)inputs[0])[compNdx]; local 787 deUint32* in0 = (deUint32*)values[0]; local 840 const deInt32 in0 = ((const deInt32*)inputs[0])[compNdx]; local [all...] |
/external/libvpx/libvpx/vp8/common/mips/msa/ |
idct_msa.c | 18 #define TRANSPOSE_TWO_4x4_H(in0, in1, in2, in3, out0, out1, out2, out3) \ 22 TRANSPOSE8X4_SH_SH(in0, in1, in2, in3, s4_m, s5_m, s6_m, s7_m); \ 45 #define VP8_IDCT_1D_H(in0, in1, in2, in3, out0, out1, out2, out3) \ 52 a1_m = in0 + in2; \ 53 b1_m = in0 - in2; \ 67 #define VP8_IDCT_1D_W(in0, in1, in2, in3, out0, out1, out2, out3) \ 75 a1_m = in0 + in2; \ 76 b1_m = in0 - in2; \ 90 v4i32 in0, in1, in2, in3, hz0, hz1, hz2, hz3, vt0, vt1, vt2, vt3; local 96 UNPCK_SH_SW(input0, in0, in1) 181 v8i16 in0, in1, in2, in3, hz0_h, hz1_h, hz2_h, hz3_h; local 218 v8i16 in0, in1, in2, in3, mul0, mul1, mul2, mul3, dequant_in0, dequant_in1; local [all...] |
/external/webp/src/dsp/ |
enc_sse41.c | 209 __m128i in0 = _mm_loadu_si128((__m128i*)&in[0]); local 217 __m128i coeff0 = _mm_abs_epi16(in0); 265 out0 = _mm_sign_epi16(out0, in0); 269 in0 = _mm_mullo_epi16(out0, q0); 272 _mm_storeu_si128((__m128i*)&in[0], in0);
|