/external/libhevc/common/arm/ |
ihevc_sao_edge_offset_class3_chroma.s | 355 VLD1.8 D16,[r11]! @I pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 356 VLD1.8 D17,[r11] @I pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 369 LDRB r8,[r0,#14] @I pu1_src_cpy[14] 372 LDRB r11,[r5,#16] @I load the value pu1_src_cpy[16 - src_strd] 374 LDRB r9,[r0,#15] @I pu1_src_cpy[15] 375 SUB r8,r8,r11 @I pu1_src_cpy[14] - pu1_src_cpy[16 - src_strd] 377 LDRB r10,[r5,#17] @I load the value pu1_src_cpy[17 - src_strd] 381 SUB r9,r9,r10 @I pu1_src_cpy[15] - pu1_src_cpy[17 - src_strd [all...] |
ihevc_sao_edge_offset_class2_chroma.s | 359 VLD1.8 D16,[r8]! @I pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 360 VLD1.8 D17,[r8] @I pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 365 LDRH r5,[r8] @I pu1_src_cpy[src_strd + 16] 368 VMOV.16 D18[0],r5 @I pu1_next_row_tmp = vsetq_lane_u8(pu1_src_cpy[src_strd + 16], pu1_next_row_tmp, 0) 375 LDRB r11,[r0] @I pu1_src_cpy[0] 378 LDRB r10,[r0,#1] @I pu1_src_cpy[0] 384 SUB r8,r11,r5 @I pu1_src_cpy[0] - pu1_src_left_cpy[(ht_tmp - 1 - row) * 2] 388 SUB r4,r10,r5 @I pu1_src_cpy[1] - pu1_src_left_cpy[(ht_tmp - 1 - row) * 2 + 1] 391 MOVGT r8,#1 @I SIGN(pu1_src_cpy[0] - pu1_src_left_cpy[(ht_tmp - 1 - row) * 2]) 394 VMOV.8 D14[0],r8 @I sign_up = sign_up = vsetq_lane_s8(SIGN(pu1_src_cpy[0] - pu1_src_left_cpy[(ht_tmp - 1 - row) * 2]), sign_up, 0 [all...] |
ihevc_sao_edge_offset_class0_chroma.s | 142 MOV r12,r0 @pu1_src_cpy = pu1_src 147 VLD1.8 D12,[r12]! @pu1_cur_row = vld1q_u8(pu1_src_cpy) 148 VLD1.8 D13,[r12],r1 @pu1_cur_row = vld1q_u8(pu1_src_cpy) 156 VLD1.8 D30,[r12]! @II Iteration pu1_cur_row = vld1q_u8(pu1_src_cpy) 157 VLD1.8 D31,[r12] @II Iteration pu1_cur_row = vld1q_u8(pu1_src_cpy) 173 LDRB r11,[r12,#16] @pu1_src_cpy[16] 176 VMOV.8 D14[0],r11 @pu1_cur_row_tmp = vsetq_lane_u8(pu1_src_cpy[16], pu1_cur_row_tmp, 0) 179 LDRB r11,[r12,#17] @pu1_src_cpy[17] 184 VMOV.8 D14[1],r11 @pu1_cur_row_tmp = vsetq_lane_u8(pu1_src_cpy[17], pu1_cur_row_tmp, 1) 185 LDRB r11,[r12,#16] @II pu1_src_cpy[16 [all...] |
ihevc_sao_edge_offset_class3.s | 280 VLD1.8 D16,[r8]! @I pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 281 VLD1.8 D17,[r8] @I pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 297 LDRB r8,[r0,#15] @I pu1_src_cpy[15] 298 SUB r5,r0,r1 @I pu1_src_cpy[16 - src_strd] 301 SUB r8,r8,r5 @I pu1_src_cpy[15] - pu1_src_cpy[16 - src_strd] 304 MOVGT r8,#1 @I SIGN(pu1_src_cpy[15] - pu1_src_cpy[16 - src_strd]) 305 VMOV.8 D15[7],r8 @I sign_up = vsetq_lane_s8(SIGN(pu1_src_cpy[15] - pu1_src_cpy[16 - src_strd]), sign_up, 15 [all...] |
ihevc_sao_edge_offset_class2.s | 269 VLD1.8 D16,[r8]! @I pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 270 VLD1.8 D17,[r8] @I pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 274 LDRB r5,[r8,#16] @I pu1_src_cpy[src_strd + 16] 275 VMOV.8 D18[0],r5 @I pu1_next_row_tmp = vsetq_lane_u8(pu1_src_cpy[src_strd + 16], pu1_next_row_tmp, 0) 283 LDRB r11,[r0] @I pu1_src_cpy[0] 287 SUBS r4,r11,r5 @I pu1_src_cpy[0] - pu1_src_left_cpy[ht_tmp - 1 - row] 289 MOVGT r4,#1 @I SIGN(pu1_src_cpy[0] - pu1_src_left_cpy[ht_tmp - 1 - row]) 290 VMOV.8 D14[0],r4 @I sign_up = sign_up = vsetq_lane_s8(SIGN(pu1_src_cpy[0] - pu1_src_left_cpy[ht_tmp - 1 - row]), sign_up, 0) 331 VST1.8 {Q10},[r0],r1 @I vst1q_u8(pu1_src_cpy, pu1_cur_row) 334 VLD1.8 D16,[r8]! @II pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd [all...] |
ihevc_sao_band_offset_luma.s | 186 MOV r4,r0 @pu1_src_cpy 192 VLD1.8 D13,[r4] @au1_cur_row = vld1_u8(pu1_src_cpy) 195 VLD1.8 D15,[r5] @au1_cur_row = vld1_u8(pu1_src_cpy) 197 VLD1.8 D17,[r6] @au1_cur_row = vld1_u8(pu1_src_cpy) 199 VLD1.8 D19,[r10] @au1_cur_row = vld1_u8(pu1_src_cpy) 212 VST1.8 D13,[r4],r1 @vst1_u8(pu1_src_cpy, au1_cur_row) 214 VST1.8 D15,[r5] @vst1_u8(pu1_src_cpy, au1_cur_row) 217 VST1.8 D17,[r6],r1 @vst1_u8(pu1_src_cpy, au1_cur_row) 220 VST1.8 D19,[r10] @vst1_u8(pu1_src_cpy, au1_cur_row)
|
ihevc_sao_band_offset_chroma.s | 276 MOV r4,r0 @pu1_src_cpy 280 MOV r4,r0 @pu1_src_cpy 286 VLD2.8 {D5,D6},[r4] @vld1q_u8(pu1_src_cpy) 289 VLD2.8 {D13,D14},[r5] @vld1q_u8(pu1_src_cpy) 292 VLD2.8 {D17,D18},[r6] @vld1q_u8(pu1_src_cpy) 295 VLD2.8 {D21,D22},[r7] @vld1q_u8(pu1_src_cpy) 310 VST2.8 {D5,D6},[r4] @vst1q_u8(pu1_src_cpy, au1_cur_row) 316 VST2.8 {D13,D14},[r5] @vst1q_u8(pu1_src_cpy, au1_cur_row) 322 VST2.8 {D17,D18},[r6],r1 @vst1q_u8(pu1_src_cpy, au1_cur_row) 325 VST2.8 {D21,D22},[r7] @vst1q_u8(pu1_src_cpy, au1_cur_row [all...] |
ihevc_sao_edge_offset_class1.s | 142 VLD1.8 D18,[r10]! @pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 143 VLD1.8 D19,[r10] @pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 148 VLD1.8 D30,[r6]! @II pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 149 VLD1.8 D31,[r6] @II pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 210 VST1.8 {Q10},[r10],r1 @vst1q_u8(pu1_src_cpy, pu1_cur_row) 216 VST1.8 {Q15},[r10],r1 @II vst1q_u8(pu1_src_cpy, pu1_cur_row) 223 VLD1.8 D18,[r10]! @pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 224 VLD1.8 D19,[r10] @pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 251 VST1.8 {Q15},[r10],r1 @vst1q_u8(pu1_src_cpy, pu1_cur_row) 284 VLD1.8 D18,[r10]! @pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd [all...] |
ihevc_sao_edge_offset_class1_chroma.s | 147 VLD1.8 D18,[r10]! @pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 148 VLD1.8 D19,[r10] @pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 153 VLD1.8 D30,[r6]! @II pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 154 VLD1.8 D31,[r6] @II pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 223 VST1.8 {Q10},[r10],r1 @vst1q_u8(pu1_src_cpy, pu1_cur_row) 229 VST1.8 {Q15},[r10],r1 @II vst1q_u8(pu1_src_cpy, pu1_cur_row) 236 VLD1.8 D18,[r10]! @pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 237 VLD1.8 D19,[r10] @pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd) 269 VST1.8 {Q15},[r10],r1 @vst1q_u8(pu1_src_cpy, pu1_cur_row) 302 VLD1.8 D18,[r10]! @pu1_next_row = vld1q_u8(pu1_src_cpy + src_strd [all...] |
ihevc_sao_edge_offset_class0.s | 136 MOV r12,r0 @pu1_src_cpy = pu1_src 141 VLD1.8 D12,[r12]! @pu1_cur_row = vld1q_u8(pu1_src_cpy) 142 VLD1.8 D13,[r12], r1 @pu1_cur_row = vld1q_u8(pu1_src_cpy) 150 VLD1.8 D26,[r12]! @II Iteration pu1_cur_row = vld1q_u8(pu1_src_cpy) 151 VLD1.8 D27,[r12] @II Iteration pu1_cur_row = vld1q_u8(pu1_src_cpy) 168 LDRB r11,[r12,#16] @pu1_src_cpy[16] 173 VMOV.8 D14[0],r11 @pu1_cur_row_tmp = vsetq_lane_u8(pu1_src_cpy[16], pu1_cur_row_tmp, 0) 176 LDRB r11,[r12,#16] @II pu1_src_cpy[16] 181 VMOV.8 D28[0],r11 @II pu1_cur_row_tmp = vsetq_lane_u8(pu1_src_cpy[16], pu1_cur_row_tmp, 0) 247 VST1.8 {D18,D19},[r12],r1 @vst1q_u8(pu1_src_cpy, pu1_cur_row [all...] |
/external/libhevc/common/x86/ |
ihevc_sao_ssse3_intr.c | 132 UWORD8 *pu1_src_cpy; local 256 pu1_src_cpy = pu1_src; 262 src_temp0_8x16b = _mm_loadu_si128((__m128i *)(pu1_src_cpy)); 264 src_temp2_8x16b = _mm_loadu_si128((__m128i *)(pu1_src_cpy + src_strd)); 328 _mm_storeu_si128((__m128i *)(pu1_src_cpy), src_temp0_8x16b); 330 _mm_storeu_si128((__m128i *)(pu1_src_cpy + src_strd), src_temp2_8x16b); 332 pu1_src_cpy += (src_strd << 1); 338 {pu1_src_cpy = pu1_src; 344 src_temp0_8x16b = _mm_loadl_epi64((__m128i *)(pu1_src_cpy)); 346 src_temp1_8x16b = _mm_loadl_epi64((__m128i *)(pu1_src_cpy + src_strd)) 646 UWORD8 *pu1_src_cpy; local 890 UWORD8 *pu1_src_cpy, *pu1_src_left_cpy, *pu1_src_left_str, *pu1_left_tmp; local 1225 UWORD8 *pu1_src_cpy, *pu1_src_left_cpy, *pu1_src_left_str, *pu1_left_tmp; local 1596 UWORD8 *pu1_src_cpy; local 2032 UWORD8 *pu1_src_cpy; local 2493 UWORD8 *pu1_src_cpy, *pu1_src_org; local 3253 UWORD8 *pu1_src_cpy, *pu1_src_org; local 4084 UWORD8 *pu1_src_cpy, *pu1_src_org; local 4860 UWORD8 *pu1_src_cpy, *pu1_src_org; local [all...] |