Lines Matching refs:wd
107 * @param[in] wd
128 WORD32 wd,
146 pu1_src_left[row] = pu1_src[row * src_strd + (wd - 1)];
148 pu1_src_top_left[0] = pu1_src_top[wd - 1];
149 for(col = 0; col < wd; col += 8)
254 for(col = wd; col >= 16; col -= 16)
336 wd_rem = wd & 0xF;
447 WORD32 wd,
466 pu1_src_left[2 * row] = pu1_src[row * src_strd + (wd - 2)];
467 pu1_src_left[2 * row + 1] = pu1_src[row * src_strd + (wd - 1)];
469 pu1_src_top_left[0] = pu1_src_top[wd - 2];
470 pu1_src_top_left[1] = pu1_src_top[wd - 1];
471 for(col = 0; col < wd; col += 8)
664 for(col = wd; col >= 16; col -= 16)
761 wd_rem = wd & 0xF;
886 WORD32 wd,
912 *pu1_src_top_left = pu1_src_top[wd - 1];
914 for(col = wd; col >= 16; col -= 16)
935 au1_mask[wd - 1] = u1_avail1;
943 for(col = wd; col >= 16; col -= 16)
1054 wd_rem = wd & 0xF;
1195 pu1_src += wd;
1221 WORD32 wd,
1248 pu1_src_top_left[0] = pu1_src_top[wd - 2];
1249 pu1_src_top_left[1] = pu1_src_top[wd - 1];;
1251 for(col = wd; col >= 16; col -= 16)
1274 au1_mask[wd - 1] = u1_avail1;
1275 au1_mask[wd - 2] = u1_avail1;
1284 for(col = wd; col >= 16; col -= 16)
1406 wd_rem = wd & 0xF;
1565 pu1_src += wd;
1591 WORD32 wd,
1615 pu1_src_left[row] = pu1_src[row * src_strd + (wd - 1)];
1617 *pu1_src_top_left = pu1_src_top[wd - 1];
1642 for(col = wd; col >= 16; col -= 16)
1645 src_top_16x8b = _mm_loadu_si128((__m128i *)(pu1_src_top_cpy + wd - col));
1770 _mm_storeu_si128((__m128i *)(pu1_src_top + wd - col), src_top_16x8b);
1774 wd_rem = wd & 0xF;
1778 src_top_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src_top_cpy + wd - col));
2011 _mm_storel_epi64((__m128i *)(pu1_src_top + wd - col), src_top_16x8b);
2027 WORD32 wd,
2051 pu1_src_left[2 * row] = pu1_src[row * src_strd + (wd - 2)];
2052 pu1_src_left[2 * row + 1] = pu1_src[row * src_strd + (wd - 1)];
2054 pu1_src_top_left[0] = pu1_src_top[wd - 2];
2055 pu1_src_top_left[1] = pu1_src_top[wd - 1];
2085 for(col = wd; col >= 16; col -= 16)
2088 src_top_16x8b = _mm_loadu_si128((__m128i *)(pu1_src_top_cpy + wd - col));
2221 _mm_storeu_si128((__m128i *)(pu1_src_top + wd - col), src_top_16x8b);
2225 wd_rem = wd & 0xF;
2229 src_top_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src_top_cpy + wd - col));
2470 _mm_storel_epi64((__m128i *)(pu1_src_top + wd - col), src_top_16x8b);
2486 WORD32 wd,
2566 edge_idx = 2 + SIGN(pu1_src[wd - 1 + (ht - 1) * src_strd] - pu1_src[wd - 1 + (ht - 1) * src_strd - 1 - src_strd]) +
2567 SIGN(pu1_src[wd - 1 + (ht - 1) * src_strd] - pu1_src[wd - 1 + (ht - 1) * src_strd + 1 + src_strd]);
2573 u1_pos_wd_ht_tmp = CLIP3(pu1_src[wd - 1 + (ht - 1) * src_strd] + pi1_sao_offset[edge_idx], 0, (1 << bit_depth) - 1);
2577 u1_pos_wd_ht_tmp = pu1_src[wd - 1 + (ht - 1) * src_strd];
2582 u1_pos_wd_ht_tmp = pu1_src[wd - 1 + (ht - 1) * src_strd];
2607 *pu1_src_top_left = pu1_src_top[wd - 1];
2612 au1_mask[wd - 1] = u1_avail1;
2620 for(col = wd; col >= 16; col -= 16)
2623 src_top_16x8b = _mm_loadu_si128((__m128i *)(pu1_src_top_cpy + wd - col));
2811 left_store_16x8b = _mm_loadu_si128((__m128i *)(pu1_src_top_cpy + wd - col));
2813 _mm_storeu_si128((__m128i *)(pu1_src_top + wd - col), src_top_16x8b);
2826 wd_rem = wd & 0xF;
2832 src_top_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src_top_cpy + wd - col));
3213 _mm_storel_epi64((__m128i *)(pu1_src_top + wd - col), src_top_16x8b);
3225 pu1_src_org[wd - 1 + (ht_tmp - 1) * src_strd] = u1_pos_wd_ht_tmp;
3246 WORD32 wd,
3348 edge_idx = 2 + SIGN(pu1_src[wd - 2 + (ht - 1) * src_strd] - pu1_src[wd - 2 + (ht - 1) * src_strd - 2 - src_strd]) +
3349 SIGN(pu1_src[wd - 2 + (ht - 1) * src_strd] - pu1_src[wd - 2 + (ht - 1) * src_strd + 2 + src_strd]);
3355 u1_pos_wd_ht_tmp_u = CLIP3(pu1_src[wd - 2 + (ht - 1) * src_strd] + pi1_sao_offset_u[edge_idx], 0, (1 << bit_depth) - 1);
3359 u1_pos_wd_ht_tmp_u = pu1_src[wd - 2 + (ht - 1) * src_strd];
3363 edge_idx = 2 + SIGN(pu1_src[wd - 1 + (ht - 1) * src_strd] - pu1_src[wd - 1 + (ht - 1) * src_strd - 2 - src_strd]) +
3364 SIGN(pu1_src[wd - 1 + (ht - 1) * src_strd] - pu1_src[wd - 1 + (ht - 1) * src_strd + 2 + src_strd]);
3370 u1_pos_wd_ht_tmp_v = CLIP3(pu1_src[wd - 1 + (ht - 1) * src_strd] + pi1_sao_offset_v[edge_idx], 0, (1 << bit_depth) - 1);
3374 u1_pos_wd_ht_tmp_v = pu1_src[wd - 1 + (ht - 1) * src_strd];
3379 u1_pos_wd_ht_tmp_u = pu1_src[wd - 2 + (ht - 1) * src_strd];
3380 u1_pos_wd_ht_tmp_v = pu1_src[wd - 1 + (ht - 1) * src_strd];
3411 au1_mask[wd - 1] = u1_avail1;
3412 au1_mask[wd - 2] = u1_avail1;
3415 pu1_src_top_left[0] = pu1_src_top[wd - 2];
3416 pu1_src_top_left[1] = pu1_src_top[wd - 1];
3423 for(col = wd; col >= 16; col -= 16)
3426 src_top_16x8b = _mm_loadu_si128((__m128i *)(pu1_src_top_cpy + wd - col));
3626 left_store_16x8b = _mm_loadu_si128((__m128i *)(pu1_src_top_cpy + wd - col));
3628 _mm_storeu_si128((__m128i *)(pu1_src_top + wd - col), src_top_16x8b);
3639 wd_rem = wd & 0xF;
3645 src_top_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src_top_cpy + wd - col));
4046 _mm_storel_epi64((__m128i *)(pu1_src_top + wd - col), src_top_16x8b);
4058 pu1_src_org[wd - 2 + (ht_tmp - 1) * src_strd] = u1_pos_wd_ht_tmp_u;
4059 pu1_src_org[wd - 1 + (ht_tmp - 1) * src_strd] = u1_pos_wd_ht_tmp_v;
4078 WORD32 wd,
4107 au1_src_left_tmp[0] = pu1_src[(wd - 1)];
4115 *pu1_src_top_left = pu1_src_top[wd - 1];
4134 edge_idx = 2 + SIGN(pu1_src[wd - 1] - pu1_src_top_right[0]) +
4135 SIGN(pu1_src[wd - 1] - pu1_src[wd - 1 - 1 + src_strd]);
4141 u1_pos_wd_0_tmp = CLIP3(pu1_src[wd - 1] + pi1_sao_offset[edge_idx], 0, (1 << bit_depth) - 1);
4145 u1_pos_wd_0_tmp = pu1_src[wd - 1];
4150 u1_pos_wd_0_tmp = pu1_src[wd - 1];
4202 au1_mask[wd - 1] = u1_avail1;
4209 for(col = wd; col >= 16; col -= 16)
4212 src_top_16x8b = _mm_loadu_si128((__m128i *)(pu1_src_top_cpy + wd - col + 1));
4409 left_store_16x8b = _mm_loadu_si128((__m128i *)(pu1_src_top_cpy + wd - col));
4411 _mm_storeu_si128((__m128i *)(pu1_src_top + wd - col), src_top_16x8b);
4423 wd_rem = wd & 0xF;
4429 src_top_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src_top_cpy + wd - col + 1));
4822 _mm_storel_epi64((__m128i *)(pu1_src_top + wd - col), src_top_16x8b);
4833 pu1_src_org[wd - 1] = u1_pos_wd_0_tmp;
4855 WORD32 wd,
4884 au1_src_left_tmp[0] = pu1_src[(wd - 2)];
4885 au1_src_left_tmp[1] = pu1_src[(wd - 1)];
4894 pu1_src_top_left[0] = pu1_src_top[wd - 2];
4895 pu1_src_top_left[1] = pu1_src_top[wd - 1];
4914 edge_idx = 2 + SIGN(pu1_src[wd - 2] - pu1_src_top_right[0]) +
4915 SIGN(pu1_src[wd - 2] - pu1_src[wd - 2 - 2 + src_strd]);
4921 u1_pos_wd_0_tmp_u = CLIP3(pu1_src[wd - 2] + pi1_sao_offset_u[edge_idx], 0, (1 << bit_depth) - 1);
4925 u1_pos_wd_0_tmp_u = pu1_src[wd - 2];
4929 edge_idx = 2 + SIGN(pu1_src[wd - 1] - pu1_src_top_right[1]) +
4930 SIGN(pu1_src[wd - 1] - pu1_src[wd - 1 - 2 + src_strd]);
4936 u1_pos_wd_0_tmp_v = CLIP3(pu1_src[wd - 1] + pi1_sao_offset_v[edge_idx], 0, (1 << bit_depth) - 1);
4940 u1_pos_wd_0_tmp_v = pu1_src[wd - 1];
4945 u1_pos_wd_0_tmp_u = pu1_src[wd - 2];
4946 u1_pos_wd_0_tmp_v = pu1_src[wd - 1];
5015 au1_mask[wd - 1] = u1_avail1;
5016 au1_mask[wd - 2] = u1_avail1;
5020 for(col = wd; col >= 16; col -= 16)
5023 src_top_16x8b = _mm_loadu_si128((__m128i *)(pu1_src_top_cpy + wd - col + 2));
5230 left_store_16x8b = _mm_loadu_si128((__m128i *)(pu1_src_top_cpy + wd - col));
5232 _mm_storeu_si128((__m128i *)(pu1_src_top + wd - col), src_top_16x8b);
5237 wd_rem = wd & 0xF;
5241 src_top_16x8b = _mm_loadl_epi64((__m128i *)(pu1_src_top_cpy + wd - col + 2));
5640 _mm_storel_epi64((__m128i *)(pu1_src_top + wd - col), src_top_16x8b);
5643 pu1_src_org[wd - 2] = u1_pos_wd_0_tmp_u;
5644 pu1_src_org[wd - 1] = u1_pos_wd_0_tmp_v;