HomeSort by relevance Sort by last modified time
    Searched defs:in0 (Results 1 - 25 of 49) sorted by null

1 2

  /external/libvpx/libvpx/vp9/common/mips/msa/
vp9_idct4x4_msa.c 18 v8i16 in0, in1, in2, in3; local
21 LD4x4_SH(input, in0, in1, in2, in3);
22 TRANSPOSE4x4_SH_SH(in0, in1, in2, in3, in0, in1, in2, in3);
27 VP9_IDCT4x4(in0, in1, in2, in3, in0, in1, in2, in3);
29 TRANSPOSE4x4_SH_SH(in0, in1, in2, in3, in0, in1, in2, in3);
30 VP9_IDCT4x4(in0, in1, in2, in3, in0, in1, in2, in3)
    [all...]
vp9_idct8x8_msa.c 18 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
21 LD_SH8(input, 8, in0, in1, in2, in3, in4, in5, in6, in7);
23 TRANSPOSE8x8_SH_SH(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3,
29 VP9_IDCT8x8_1D(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3,
32 TRANSPOSE8x8_SH_SH(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2,
34 VP9_IDCT8x8_1D(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3
    [all...]
  /external/libvpx/libvpx/vp9/common/x86/
vp9_idct_intrin_sse2.c 121 __m128i in0[16], in1[16]; local
123 load_buffer_8x16(input, in0);
129 idct16_sse2(in0, in1);
130 idct16_sse2(in0, in1);
133 idct16_sse2(in0, in1);
134 iadst16_sse2(in0, in1);
137 iadst16_sse2(in0, in1);
138 idct16_sse2(in0, in1);
141 iadst16_sse2(in0, in1);
142 iadst16_sse2(in0, in1)
    [all...]
  /external/libvpx/libvpx/vp9/encoder/mips/msa/
vp9_fdct8x8_msa.c 18 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
20 LD_SH8(input, stride, in0, in1, in2, in3, in4, in5, in6, in7);
21 SLLI_4V(in0, in1, in2, in3, 2);
26 VP9_FDCT8(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3, in4,
28 TRANSPOSE8x8_SH_SH(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2,
30 VP9_FDCT8(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3, in4,
34 VP9_ADST8(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3, in4
    [all...]
vp9_fdct4x4_msa.c 18 v8i16 in0, in1, in2, in3, in4; local
20 LD_SH4(input, src_stride, in0, in1, in2, in3);
22 in0 += in1;
24 in4 = (in0 - in3) >> 1;
26 in0 -= in2;
29 TRANSPOSE4x4_SH_SH(in0, in2, in3, in1, in0, in2, in3, in1);
31 in0 += in2;
33 in4 = (in0 - in1) >> 1;
35 in0 -= in3
50 v8i16 in0, in1, in2, in3; local
    [all...]
vp9_fdct16x16_msa.c 368 v8i16 in0, in1, in2, in3, in4, in5, in6, in7, in8, in9, in10, in11; local
371 LD_SH8(temp, 16, in0, in1, in2, in3, in4, in5, in6, in7);
374 TRANSPOSE8x8_SH_SH(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3,
378 FDCT_POSTPROC_2V_NEG_H(in0, in1);
386 BUTTERFLY_16(in0, in1, in2, in3, in4, in5, in6, in7, in8, in9, in10, in11,
395 FDCT8x16_ODD(in8, in9, in10, in11, in12, in13, in14, in15, in0, in1, in2, in3,
397 TRANSPOSE8x8_SH_SH(tmp0, in0, tmp1, in1, tmp2, in2, tmp3, in3, tmp0, in0,
399 ST_SH8(tmp0, in0, tmp1, in1, tmp2, in2, tmp3, in3, out, 16)
    [all...]
  /external/libvpx/libvpx/vpx_dsp/mips/
idct4x4_msa.c 15 v8i16 in0, in1, in2, in3; local
19 LD4x4_SH(input, in0, in2, in3, in1);
20 TRANSPOSE4x4_SH_SH(in0, in2, in3, in1, in0, in2, in3, in1);
21 UNPCK_R_SH_SW(in0, in0_r);
45 PCKEV_H4_SH(in0_r, in0_r, in1_r, in1_r, in2_r, in2_r, in3_r, in3_r, in0, in1,
47 ADDBLK_ST4x4_UB(in0, in3, in1, in2, dst, dst_stride);
53 v8i16 in1, in0 = { 0 }; local
59 in0 = __msa_insert_h(in0, 0, a1)
72 v8i16 in0, in1, in2, in3; local
    [all...]
idct8x8_msa.c 15 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
18 LD_SH8(input, 8, in0, in1, in2, in3, in4, in5, in6, in7);
21 TRANSPOSE8x8_SH_SH(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3,
24 VP9_IDCT8x8_1D(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3,
27 TRANSPOSE8x8_SH_SH(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3,
30 VP9_IDCT8x8_1D(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3
43 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
    [all...]
fwd_txfm_msa.c 16 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
29 LD_SH16(input, src_stride, in0, in1, in2, in3, in4, in5, in6, in7, in8, in9,
31 SLLI_4V(in0, in1, in2, in3, 2);
35 ADD4(in0, in15, in1, in14, in2, in13, in3, in12, tmp0, tmp1, tmp2, tmp3);
40 SUB4(in0, in15, in1, in14, in2, in13, in3, in12, in15, in14, in13, in12);
135 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
138 LD_SH8(input, 16, in0, in1, in2, in3, in4, in5, in6, in7);
140 TRANSPOSE8x8_SH_SH(in0, in1, in2, in3, in4, in5, in6, in7, in0, in1, in2, in3,
144 ADD4(in0, 1, in1, 1, in2, 1, in3, 1, in0, in1, in2, in3)
171 v8i16 in0, in1, in2, in3; local
201 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
219 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
249 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
    [all...]
fwd_dct32x32_msa.c 16 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
22 LD_SH4(input, src_stride, in0, in1, in2, in3);
26 SLLI_4V(in0, in1, in2, in3, 2);
30 BUTTERFLY_8(in0, in1, in2, in3, in4, in5, in6, in7, step0, step1, step2,
40 LD_SH4(input + (8 * src_stride), src_stride, in0, in1, in2, in3);
44 SLLI_4V(in0, in1, in2, in3, 2);
48 BUTTERFLY_8(in0, in1, in2, in3, in4, in5, in6, in7, step0, step1, step2,
59 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
65 LD_SH4(input, 8, in0, in1, in2, in3);
67 BUTTERFLY_8(in0, in1, in2, in3, in12, in13, in14, in15, vec0, vec1, vec2
255 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
288 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
392 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
596 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
695 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
931 v8i16 in0, in1, in2, in3, in4, in5, in6, in7; local
    [all...]
  /external/libvpx/libvpx/vpx_dsp/x86/
fwd_txfm_sse2.c 19 __m128i in0, in1; local
22 in0 = _mm_loadl_epi64((const __m128i *)(input + 0 * stride));
26 in0 = _mm_unpacklo_epi64(
27 in0, _mm_loadl_epi64((const __m128i *)(input + 3 * stride)));
29 tmp = _mm_add_epi16(in0, in1);
30 in0 = _mm_unpacklo_epi16(zero, tmp);
32 in0 = _mm_srai_epi32(in0, 16);
35 tmp = _mm_add_epi32(in0, in1);
36 in0 = _mm_unpacklo_epi32(tmp, zero)
48 __m128i in0 = _mm_load_si128((const __m128i *)(input + 0 * stride)); local
89 __m128i in0, in1, in2, in3; local
158 __m128i in0, in1, in2, in3; local
    [all...]
  /external/libvpx/libvpx/vp8/encoder/mips/msa/
dct_msa.c 14 #define TRANSPOSE4x4_H(in0, in1, in2, in3, out0, out1, out2, out3) \
18 ILVR_H2_SH(in2, in0, in3, in1, s0_m, s1_m); \
20 ILVL_H2_SH(in2, in0, in3, in1, s0_m, s1_m); \
34 #define RET_1_IF_NZERO_H(in0) \
39 tmp0_m = __msa_ceqi_h(in0, 0); \
46 #define RET_1_IF_NZERO_W(in0) \
51 tmp0_m = __msa_ceqi_w(in0, 0); \
58 #define RET_1_IF_NEG_W(in0) \
63 tmp0_m = __msa_clti_s_w(in0, 0); \
70 v8i16 in0, in1, in2, in3 local
116 v8i16 in0, in1, in2, in3; local
    [all...]
  /system/bt/embdrv/sbc/decoder/srce/
synthesis-dct8.c 97 double in0, in1, in2, in3; local
100 in0 = FLOAT_SCALE(in[0], DCTII_8_SHIFT_IN);
101 OI_ASSERT(VALID_INT32(in0));
117 L00 = (in0 + in7);
132 L07 = (in0 - in7);
259 int32_t in0, in1, in2, in3; local
263 in0 = SCALE(in[0], DCTII_8_SHIFT_IN);
272 in0 = in[0];
282 L00 = in0 + in7;
290 L07 = in0 - in7
    [all...]
  /external/deqp/modules/gles3/functional/
es3fShaderPackingFunctionTests.cpp 151 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, precision)));
154 m_spec.source = "out0 = packSnorm2x16(in0);";
254 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
257 m_spec.source = "out0 = unpackSnorm2x16(in0);";
297 const deInt16 in0 = (deInt16)(deUint16)(inputs[valNdx] & 0xffff); local
299 const float ref0 = de::clamp(float(in0) / 32767.f, -1.0f, 1.0f);
342 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, precision)));
345 m_spec.source = "out0 = packUnorm2x16(in0);";
445 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
448 m_spec.source = "out0 = unpackUnorm2x16(in0);";
488 const deUint16 in0 = (deUint16)(inputs[valNdx] & 0xffff); local
699 const deUint16 in0 = (deUint16)(inputs[valNdx] & 0xffff); local
    [all...]
es3fShaderPrecisionTests.cpp 99 op << "\t" << precName << " " << typeName << " in0 = " << (isVertexCase ? "a_" : "v_") << "in0;\n"
156 op << "\t" << precName << " " << typeName << " in0 = " << (isVertexCase ? "a_" : "v_") << "in0;\n"
180 typedef double (*EvalFunc) (double in0, double in1);
190 bool compare (float in0, float in1, double reference, float result);
286 bool ShaderFloatPrecisionCase::compare (float in0, float in1, double reference, float result)
299 const int in0Exp = tcu::Float32(in0).exponent();
365 const float in0 = m_rnd.getFloat(m_rangeA.x(), m_rangeA.y()); local
367 const double refD = m_evalFunc((double)in0, (double)in1)
581 int in0 = deSignExtendTo32(((isMaxRangeA ? (int)m_rnd.getUint32() : m_rnd.getInt(m_rangeA.x(), m_rangeA.y())) & mask), m_bits); local
775 deUint32 in0 = (isMaxRangeA ? m_rnd.getUint32() : (m_rangeA.x() + m_rnd.getUint32()%(m_rangeA.y()-m_rangeA.x()+1))) & mask; local
    [all...]
es3fShaderCommonFunctionTests.cpp 425 m_spec.inputs.push_back(Symbol("in0", glu::VarType(baseType, precision)));
427 m_spec.source = "out0 = abs(in0);";
469 const float in0 = ((const float*)inputs[0])[compNdx]; local
471 const float ref0 = de::abs(in0);
485 const int in0 = ((const int*)inputs[0])[compNdx]; local
487 const int ref0 = de::abs(in0);
507 m_spec.inputs.push_back(Symbol("in0", glu::VarType(baseType, precision)));
509 m_spec.source = "out0 = sign(in0);";
562 const float in0 = ((const float*)inputs[0])[compNdx]; local
564 const float ref0 = in0 < 0.0f ? -1.0f
579 const int in0 = ((const int*)inputs[0])[compNdx]; local
668 const float in0 = ((const float*)inputs[0])[compNdx]; local
689 const float in0 = ((const float*)inputs[0])[compNdx]; local
758 const float in0 = ((const float*)inputs[0])[compNdx]; local
835 const float in0 = ((const float*)inputs[0])[compNdx]; local
916 const float in0 = ((const float*)inputs[0])[compNdx]; local
989 const float in0 = ((const float*)inputs[0])[compNdx]; local
1058 const float in0 = ((const float*)inputs[0])[compNdx]; local
1120 const float in0 = ((const float*)inputs[0])[compNdx]; local
1141 const float in0 = ((const float*)inputs[0])[compNdx]; local
1226 const float in0 = ((const float*)inputs[0])[compNdx]; local
1338 const float in0 = ((const float*)inputs[0])[compNdx]; local
1377 const float in0 = ((const float*)inputs[0])[compNdx]; local
1454 const float in0 = ((const float*)inputs[0])[compNdx]; local
1475 const float in0 = ((const float*)inputs[0])[compNdx]; local
1572 const float in0 = ((const float*)inputs[0])[compNdx]; local
1592 const float in0 = ((const float*)inputs[0])[compNdx]; local
    [all...]
  /external/icu/icu4c/source/test/intltest/
dtfmtrtts.cpp 408 UBool in0; local
413 else if((in0=fmt->getTimeZone().inDaylightTime(d[0], status)) && ! failure(status, "gettingDaylightTime") &&
417 else if (!in0 &&
  /external/deqp/modules/gles31/functional/
es31fShaderPackingFunctionTests.cpp 155 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, precision)));
158 m_spec.source = "out0 = packSnorm2x16(in0);";
258 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
261 m_spec.source = "out0 = unpackSnorm2x16(in0);";
301 const deInt16 in0 = (deInt16)(deUint16)(inputs[valNdx] & 0xffff); local
303 const float ref0 = de::clamp(float(in0) / 32767.f, -1.0f, 1.0f);
346 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, precision)));
349 m_spec.source = "out0 = packUnorm2x16(in0);";
449 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
452 m_spec.source = "out0 = unpackUnorm2x16(in0);";
492 const deUint16 in0 = (deUint16)(inputs[valNdx] & 0xffff); local
703 const deUint16 in0 = (deUint16)(inputs[valNdx] & 0xffff); local
909 const deInt8 in0 = (deInt8)(deUint8)(inputs[valNdx] & 0xff); local
1118 const deUint8 in0 = (deUint8)(inputs[valNdx] & 0xff); local
    [all...]
es31fShaderCommonFunctionTests.cpp 503 m_spec.inputs.push_back(Symbol("in0", glu::VarType(baseType, precision)));
505 m_spec.source = "out0 = abs(in0);";
547 const float in0 = ((const float*)inputs[0])[compNdx]; local
549 const float ref0 = de::abs(in0);
563 const int in0 = ((const int*)inputs[0])[compNdx]; local
565 const int ref0 = de::abs(in0);
585 m_spec.inputs.push_back(Symbol("in0", glu::VarType(baseType, precision)));
587 m_spec.source = "out0 = sign(in0);";
640 const float in0 = ((const float*)inputs[0])[compNdx]; local
642 const float ref0 = in0 < 0.0f ? -1.0f
657 const int in0 = ((const int*)inputs[0])[compNdx]; local
746 const float in0 = ((const float*)inputs[0])[compNdx]; local
767 const float in0 = ((const float*)inputs[0])[compNdx]; local
836 const float in0 = ((const float*)inputs[0])[compNdx]; local
913 const float in0 = ((const float*)inputs[0])[compNdx]; local
929 const float in0 = ((const float*)inputs[0])[compNdx]; local
996 const float in0 = ((const float*)inputs[0])[compNdx]; local
1012 const float in0 = ((const float*)inputs[0])[compNdx]; local
1072 const float in0 = ((const float*)inputs[0])[compNdx]; local
1141 const float in0 = ((const float*)inputs[0])[compNdx]; local
1203 const float in0 = ((const float*)inputs[0])[compNdx]; local
1224 const float in0 = ((const float*)inputs[0])[compNdx]; local
1309 const float in0 = ((const float*)inputs[0])[compNdx]; local
1421 const float in0 = ((const float*)inputs[0])[compNdx]; local
1460 const float in0 = ((const float*)inputs[0])[compNdx]; local
1537 const float in0 = ((const float*)inputs[0])[compNdx]; local
1558 const float in0 = ((const float*)inputs[0])[compNdx]; local
1655 const float in0 = ((const float*)inputs[0])[compNdx]; local
1675 const float in0 = ((const float*)inputs[0])[compNdx]; local
    [all...]
es31fShaderIntegerFunctionTests.cpp 377 deUint32* in0 = (deUint32*)values[0]; local
401 in0[easyCaseNdx*scalarSize + compNdx] = easyCases[easyCaseNdx].x & integerMask;
413 in0[easyCaseNdx*scalarSize + compNdx] = extendSignTo32(in0[easyCaseNdx*scalarSize + compNdx], integerLength);
419 generateRandomInputData(rnd, m_shaderType, type, precision, in0, numValues - DE_LENGTH_OF_ARRAY(easyCases));
433 const deUint32 in0 = ((const deUint32*)inputs[0])[compNdx]; local
437 const deUint32 ref0 = in0+in1;
438 const deUint32 ref1 = (deUint64(in0)+deUint64(in1)) > 0xffffffffu ? 1u : 0u;
473 deUint32* in0 = (deUint32*)values[0]; local
495 in0[easyCaseNdx*scalarSize + compNdx] = easyCases[easyCaseNdx].x & integerMask
527 const deUint32 in0 = ((const deUint32*)inputs[0])[compNdx]; local
564 deUint32* in0 = (deUint32*)values[0]; local
616 const deUint32 in0 = ((const deUint32*)inputs[0])[compNdx]; local
654 deUint32* in0 = (deUint32*)values[0]; local
707 const deInt32 in0 = ((const deInt32*)inputs[0])[compNdx]; local
    [all...]
  /external/libjpeg-turbo/simd/
jquanti-altivec.c 57 __vector unsigned char in0, in1, in2, in3, in4, in5, in6, in7; local
73 out0 = (__vector short)VEC_UNPACKHU(in0);
  /external/deqp/external/vulkancts/modules/vulkan/shaderexecutor/
vktShaderPackingFunctionTests.cpp 261 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, precision)));
264 m_spec.source = "out0 = packSnorm2x16(in0);";
320 const deInt16 in0 = (deInt16)(deUint16)(inputs[valNdx] & 0xffff); local
322 const float ref0 = de::clamp(float(in0) / 32767.f, -1.0f, 1.0f);
365 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_UINT, glu::PRECISION_HIGHP)));
368 m_spec.source = "out0 = unpackSnorm2x16(in0);";
484 m_spec.inputs.push_back(Symbol("in0", glu::VarType(glu::TYPE_FLOAT_VEC2, precision)));
487 m_spec.source = "out0 = packUnorm2x16(in0);";
543 const deUint16 in0 = (deUint16)(inputs[valNdx] & 0xffff); local
545 const float ref0 = float(in0) / 65535.0f
785 const deUint16 in0 = (deUint16)(inputs[valNdx] & 0xffff); local
1024 const deInt8 in0 = (deInt8)(deUint8)(inputs[valNdx] & 0xff); local
1267 const deUint8 in0 = (deUint8)(inputs[valNdx] & 0xff); local
    [all...]
vktShaderIntegerFunctionTests.cpp 468 deUint32* in0 = (deUint32*)values[0]; local
492 in0[easyCaseNdx*scalarSize + compNdx] = easyCases[easyCaseNdx].x & integerMask;
504 in0[easyCaseNdx*scalarSize + compNdx] = extendSignTo32(in0[easyCaseNdx*scalarSize + compNdx], integerLength);
510 generateRandomInputData(rnd, m_shaderType, type, precision, in0, numValues - DE_LENGTH_OF_ARRAY(easyCases));
524 const deUint32 in0 = ((const deUint32*)inputs[0])[compNdx]; local
528 const deUint32 ref0 = in0+in1;
529 const deUint32 ref1 = (deUint64(in0)+deUint64(in1)) > 0xffffffffu ? 1u : 0u;
578 deUint32* in0 = (deUint32*)values[0]; local
600 in0[easyCaseNdx*scalarSize + compNdx] = easyCases[easyCaseNdx].x & integerMask
632 const deUint32 in0 = ((const deUint32*)inputs[0])[compNdx]; local
683 deUint32* in0 = (deUint32*)values[0]; local
735 const deUint32 in0 = ((const deUint32*)inputs[0])[compNdx]; local
787 deUint32* in0 = (deUint32*)values[0]; local
840 const deInt32 in0 = ((const deInt32*)inputs[0])[compNdx]; local
    [all...]
  /external/libvpx/libvpx/vp8/common/mips/msa/
idct_msa.c 18 #define TRANSPOSE_TWO_4x4_H(in0, in1, in2, in3, out0, out1, out2, out3) \
22 TRANSPOSE8X4_SH_SH(in0, in1, in2, in3, s4_m, s5_m, s6_m, s7_m); \
45 #define VP8_IDCT_1D_H(in0, in1, in2, in3, out0, out1, out2, out3) \
52 a1_m = in0 + in2; \
53 b1_m = in0 - in2; \
67 #define VP8_IDCT_1D_W(in0, in1, in2, in3, out0, out1, out2, out3) \
75 a1_m = in0 + in2; \
76 b1_m = in0 - in2; \
90 v4i32 in0, in1, in2, in3, hz0, hz1, hz2, hz3, vt0, vt1, vt2, vt3; local
96 UNPCK_SH_SW(input0, in0, in1)
181 v8i16 in0, in1, in2, in3, hz0_h, hz1_h, hz2_h, hz3_h; local
218 v8i16 in0, in1, in2, in3, mul0, mul1, mul2, mul3, dequant_in0, dequant_in1; local
    [all...]
  /external/webp/src/dsp/
enc_sse41.c 209 __m128i in0 = _mm_loadu_si128((__m128i*)&in[0]); local
217 __m128i coeff0 = _mm_abs_epi16(in0);
265 out0 = _mm_sign_epi16(out0, in0);
269 in0 = _mm_mullo_epi16(out0, q0);
272 _mm_storeu_si128((__m128i*)&in[0], in0);

Completed in 771 milliseconds

1 2