Home | History | Annotate | Download | only in x86_64
      1 #ifndef VP9_RTCD_H_
      2 #define VP9_RTCD_H_
      3 
      /* RTCD_EXTERN expands to nothing when RTCD_C is defined and to `extern`
       * otherwise. No declaration visible in this header uses it. */
      4 #ifdef RTCD_C
      5 #define RTCD_EXTERN
      6 #else
      7 #define RTCD_EXTERN extern
      8 #endif
      9 
     10 /*
     11  * VP9
     12  */
     13 
     14 #include "vpx/vpx_integer.h"
     15 #include "vp9/common/vp9_common.h"
     16 #include "vp9/common/vp9_enums.h"
     17 
     18 struct macroblockd;
     19 
     20 /* Encoder forward decls */
     21 struct macroblock;
     22 struct vp9_variance_vtable;
     23 struct search_site_config;
     24 struct mv;
     25 union int_mv;
     26 struct yv12_buffer_config;
     27 
     28 #ifdef __cplusplus
     29 extern "C" {
     30 #endif
     31 
     /* Two variants with the same signature; the macro makes every use of
      * vp9_avg_4x4 resolve to vp9_avg_4x4_sse2 at preprocessing time.
      * The first parameter is left unnamed in both prototypes.
      * NOTE(review): _c / _sse2 presumably mean plain-C and SSE2 builds, and
      * p presumably is the row pitch -- confirm against the definitions. */
     32 unsigned int vp9_avg_4x4_c(const uint8_t *, int p);
     33 unsigned int vp9_avg_4x4_sse2(const uint8_t *, int p);
     34 #define vp9_avg_4x4 vp9_avg_4x4_sse2
     35 
     /* Two variants with the same signature; vp9_avg_8x8 is bound to
      * vp9_avg_8x8_sse2 by the macro. The first parameter is unnamed.
      * NOTE(review): p presumably is the row pitch -- confirm. */
     36 unsigned int vp9_avg_8x8_c(const uint8_t *, int p);
     37 unsigned int vp9_avg_8x8_sse2(const uint8_t *, int p);
     38 #define vp9_avg_8x8 vp9_avg_8x8_sse2
     39 
     /* Two variants with the same signature; vp9_block_error is bound to
      * vp9_block_error_sse2. coeff and dqcoeff are read-only (const); ssz is
      * a non-const int64_t pointer.
      * NOTE(review): ssz looks like an output parameter -- confirm. */
     40 int64_t vp9_block_error_c(const tran_low_t *coeff, const tran_low_t *dqcoeff, intptr_t block_size, int64_t *ssz);
     41 int64_t vp9_block_error_sse2(const tran_low_t *coeff, const tran_low_t *dqcoeff, intptr_t block_size, int64_t *ssz);
     42 #define vp9_block_error vp9_block_error_sse2
     43 
     /* Two variants with the same signature; vp9_block_error_fp is bound to
      * vp9_block_error_fp_sse2. Unlike vp9_block_error, these take int16_t
      * coefficients, an int block_size, and no ssz pointer. */
     44 int64_t vp9_block_error_fp_c(const int16_t *coeff, const int16_t *dqcoeff, int block_size);
     45 int64_t vp9_block_error_fp_sse2(const int16_t *coeff, const int16_t *dqcoeff, int block_size);
     46 #define vp9_block_error_fp vp9_block_error_fp_sse2
     47 
     /* Only a _c variant is declared in this header, and the macro binds
      * vp9_diamond_search_sad to it. ref_mv, best_mv and num00 are non-const
      * pointers; x, cfg, fn_ptr and center_mv are const.
      * NOTE(review): best_mv and num00 look like outputs -- confirm. */
     48 int vp9_diamond_search_sad_c(const struct macroblock *x, const struct search_site_config *cfg,  struct mv *ref_mv, struct mv *best_mv, int search_param, int sad_per_bit, int *num00, const struct vp9_variance_vtable *fn_ptr, const struct mv *center_mv);
     49 #define vp9_diamond_search_sad vp9_diamond_search_sad_c
     50 
     /* Three variants (_c, _sse2, _ssse3) with the same signature; the macro
      * binds vp9_fdct8x8_quant to vp9_fdct8x8_quant_ssse3. The non-const
      * pointer parameters are coeff_ptr, qcoeff_ptr, dqcoeff_ptr and eob_ptr;
      * every other pointer parameter is const. */
     51 void vp9_fdct8x8_quant_c(const int16_t *input, int stride, tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan);
     52 void vp9_fdct8x8_quant_sse2(const int16_t *input, int stride, tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan);
     53 void vp9_fdct8x8_quant_ssse3(const int16_t *input, int stride, tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan);
     54 #define vp9_fdct8x8_quant vp9_fdct8x8_quant_ssse3
     55 
     /* Two variants with the same signature; vp9_fht16x16 is bound to
      * vp9_fht16x16_sse2. input is const, output is written through a
      * non-const tran_low_t pointer. */
     56 void vp9_fht16x16_c(const int16_t *input, tran_low_t *output, int stride, int tx_type);
     57 void vp9_fht16x16_sse2(const int16_t *input, tran_low_t *output, int stride, int tx_type);
     58 #define vp9_fht16x16 vp9_fht16x16_sse2
     59 
     /* Two variants with the same signature; vp9_fht4x4 is bound to
      * vp9_fht4x4_sse2. Same parameter list as the other vp9_fht* entries. */
     60 void vp9_fht4x4_c(const int16_t *input, tran_low_t *output, int stride, int tx_type);
     61 void vp9_fht4x4_sse2(const int16_t *input, tran_low_t *output, int stride, int tx_type);
     62 #define vp9_fht4x4 vp9_fht4x4_sse2
     63 
     /* Two variants with the same signature; vp9_fht8x8 is bound to
      * vp9_fht8x8_sse2. Same parameter list as the other vp9_fht* entries. */
     64 void vp9_fht8x8_c(const int16_t *input, tran_low_t *output, int stride, int tx_type);
     65 void vp9_fht8x8_sse2(const int16_t *input, tran_low_t *output, int stride, int tx_type);
     66 #define vp9_fht8x8 vp9_fht8x8_sse2
     67 
     /* Only a _c variant is declared in this header, and the macro binds
      * vp9_full_range_search to it. The parameter list matches
      * vp9_diamond_search_sad_c. */
     68 int vp9_full_range_search_c(const struct macroblock *x, const struct search_site_config *cfg, struct mv *ref_mv, struct mv *best_mv, int search_param, int sad_per_bit, int *num00, const struct vp9_variance_vtable *fn_ptr, const struct mv *center_mv);
     69 #define vp9_full_range_search vp9_full_range_search_c
     70 
     /* vp9_full_search_sad is bound to vp9_full_search_sadx3, which has the
      * same signature as vp9_full_search_sad_c. best_mv is the only non-const
      * pointer parameter.
      * NOTE(review): the "x3" suffix is not explained in this header --
      * confirm its meaning against the definition. */
     71 int vp9_full_search_sad_c(const struct macroblock *x, const struct mv *ref_mv, int sad_per_bit, int distance, const struct vp9_variance_vtable *fn_ptr, const struct mv *center_mv, struct mv *best_mv);
     72 int vp9_full_search_sadx3(const struct macroblock *x, const struct mv *ref_mv, int sad_per_bit, int distance, const struct vp9_variance_vtable *fn_ptr, const struct mv *center_mv, struct mv *best_mv);
     73 #define vp9_full_search_sad vp9_full_search_sadx3
     74 
     /* Two variants with the same signature; vp9_fwht4x4 is bound to
      * vp9_fwht4x4_mmx. Takes no tx_type, unlike the vp9_fht* entries. */
     75 void vp9_fwht4x4_c(const int16_t *input, tran_low_t *output, int stride);
     76 void vp9_fwht4x4_mmx(const int16_t *input, tran_low_t *output, int stride);
     77 #define vp9_fwht4x4 vp9_fwht4x4_mmx
     78 
     /* Two variants with the same signature; vp9_hadamard_16x16 is bound to
      * vp9_hadamard_16x16_sse2. src_diff is const; coeff is a non-const
      * int16_t pointer. */
     79 void vp9_hadamard_16x16_c(int16_t const *src_diff, int src_stride, int16_t *coeff);
     80 void vp9_hadamard_16x16_sse2(int16_t const *src_diff, int src_stride, int16_t *coeff);
     81 #define vp9_hadamard_16x16 vp9_hadamard_16x16_sse2
     82 
     /* Three variants (_c, _sse2, _ssse3) with the same signature; the macro
      * binds vp9_hadamard_8x8 to vp9_hadamard_8x8_ssse3. */
     83 void vp9_hadamard_8x8_c(int16_t const *src_diff, int src_stride, int16_t *coeff);
     84 void vp9_hadamard_8x8_sse2(int16_t const *src_diff, int src_stride, int16_t *coeff);
     85 void vp9_hadamard_8x8_ssse3(int16_t const *src_diff, int src_stride, int16_t *coeff);
     86 #define vp9_hadamard_8x8 vp9_hadamard_8x8_ssse3
     87 
     /* Two variants with the same signature; vp9_iht16x16_256_add is bound to
      * vp9_iht16x16_256_add_sse2. Note the parameter names here are
      * output/pitch, whereas the 4x4 and 8x8 entries use dest/dest_stride. */
     88 void vp9_iht16x16_256_add_c(const tran_low_t *input, uint8_t *output, int pitch, int tx_type);
     89 void vp9_iht16x16_256_add_sse2(const tran_low_t *input, uint8_t *output, int pitch, int tx_type);
     90 #define vp9_iht16x16_256_add vp9_iht16x16_256_add_sse2
     91 
     /* Two variants with the same signature; vp9_iht4x4_16_add is bound to
      * vp9_iht4x4_16_add_sse2. input is const; dest is a non-const uint8_t
      * pointer. */
     92 void vp9_iht4x4_16_add_c(const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type);
     93 void vp9_iht4x4_16_add_sse2(const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type);
     94 #define vp9_iht4x4_16_add vp9_iht4x4_16_add_sse2
     95 
     /* Two variants with the same signature; vp9_iht8x8_64_add is bound to
      * vp9_iht8x8_64_add_sse2. input is const; dest is a non-const uint8_t
      * pointer. */
     96 void vp9_iht8x8_64_add_c(const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type);
     97 void vp9_iht8x8_64_add_sse2(const tran_low_t *input, uint8_t *dest, int dest_stride, int tx_type);
     98 #define vp9_iht8x8_64_add vp9_iht8x8_64_add_sse2
     99 
    /* Two variants with the same signature; vp9_int_pro_col is bound to
     * vp9_int_pro_col_sse2. Returns an int16_t computed from ref and width;
     * what is computed is not visible in this header. */
    100 int16_t vp9_int_pro_col_c(uint8_t const *ref, const int width);
    101 int16_t vp9_int_pro_col_sse2(uint8_t const *ref, const int width);
    102 #define vp9_int_pro_col vp9_int_pro_col_sse2
    103 
    /* Two variants with the same signature; vp9_int_pro_row is bound to
     * vp9_int_pro_row_sse2. hbuf is the only non-const pointer parameter.
     * NOTE(review): hbuf looks like the output buffer -- confirm. */
    104 void vp9_int_pro_row_c(int16_t *hbuf, uint8_t const *ref, const int ref_stride, const int height);
    105 void vp9_int_pro_row_sse2(int16_t *hbuf, uint8_t const *ref, const int ref_stride, const int height);
    106 #define vp9_int_pro_row vp9_int_pro_row_sse2
    107 
    /* Two variants with the same signature; vp9_minmax_8x8 is bound to
     * vp9_minmax_8x8_sse2. s and d are const; min and max are non-const int
     * pointers.
     * NOTE(review): min/max look like outputs and p/dp like the pitches of
     * s/d -- confirm against the definitions. */
    108 void vp9_minmax_8x8_c(const uint8_t *s, int p, const uint8_t *d, int dp, int *min, int *max);
    109 void vp9_minmax_8x8_sse2(const uint8_t *s, int p, const uint8_t *d, int dp, int *min, int *max);
    110 #define vp9_minmax_8x8 vp9_minmax_8x8_sse2
    111 
    /* Three variants (_c, _sse2, _ssse3) with the same signature; the macro
     * binds vp9_quantize_fp to vp9_quantize_fp_ssse3. coeff_ptr is const
     * here; the non-const pointer parameters are qcoeff_ptr, dqcoeff_ptr and
     * eob_ptr. */
    112 void vp9_quantize_fp_c(const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan);
    113 void vp9_quantize_fp_sse2(const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan);
    114 void vp9_quantize_fp_ssse3(const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan);
    115 #define vp9_quantize_fp vp9_quantize_fp_ssse3
    116 
    /* Only _c and _ssse3 variants are declared here (no _sse2); the macro
     * binds vp9_quantize_fp_32x32 to vp9_quantize_fp_32x32_ssse3. The
     * parameter list is identical to vp9_quantize_fp. */
    117 void vp9_quantize_fp_32x32_c(const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan);
    118 void vp9_quantize_fp_32x32_ssse3(const tran_low_t *coeff_ptr, intptr_t n_coeffs, int skip_block, const int16_t *zbin_ptr, const int16_t *round_ptr, const int16_t *quant_ptr, const int16_t *quant_shift_ptr, tran_low_t *qcoeff_ptr, tran_low_t *dqcoeff_ptr, const int16_t *dequant_ptr, uint16_t *eob_ptr, const int16_t *scan, const int16_t *iscan);
    119 #define vp9_quantize_fp_32x32 vp9_quantize_fp_32x32_ssse3
    120 
    /* Two variants with the same signature; vp9_satd is bound to
     * vp9_satd_sse2. The return type is int16_t.
     * NOTE(review): length presumably counts coefficients in coeff --
     * confirm against the definition. */
    121 int16_t vp9_satd_c(const int16_t *coeff, int length);
    122 int16_t vp9_satd_sse2(const int16_t *coeff, int length);
    123 #define vp9_satd vp9_satd_sse2
    124 
    /* Two variants with the same signature; vp9_temporal_filter_apply is
     * bound to vp9_temporal_filter_apply_sse2. No pointer parameter is
     * const-qualified, so the prototype alone does not show which buffers
     * are inputs and which are outputs.
     * NOTE(review): accumulator and count look like the outputs -- confirm. */
    125 void vp9_temporal_filter_apply_c(uint8_t *frame1, unsigned int stride, uint8_t *frame2, unsigned int block_width, unsigned int block_height, int strength, int filter_weight, unsigned int *accumulator, uint16_t *count);
    126 void vp9_temporal_filter_apply_sse2(uint8_t *frame1, unsigned int stride, uint8_t *frame2, unsigned int block_width, unsigned int block_height, int strength, int filter_weight, unsigned int *accumulator, uint16_t *count);
    127 #define vp9_temporal_filter_apply vp9_temporal_filter_apply_sse2
    128 
    /* Two variants with the same signature; vp9_vector_var is bound to
     * vp9_vector_var_sse2. Both ref and src are const.
     * NOTE(review): the meaning of bwl is not visible in this header --
     * confirm against the definition. */
    129 int vp9_vector_var_c(int16_t const *ref, int16_t const *src, const int bwl);
    130 int vp9_vector_var_sse2(int16_t const *ref, int16_t const *src, const int bwl);
    131 #define vp9_vector_var vp9_vector_var_sse2
    132 
    /* Prototype only; the definition is not part of this header.
     * NOTE(review): presumably the one-time entry point that invokes
     * setup_rtcd_internal() -- confirm in the file that defines RTCD_C. */
    133 void vp9_rtcd(void);
    134 
    135 #ifdef RTCD_C
    136 #include "vpx_ports/x86.h"
    /*
     * Compiled only when RTCD_C is defined (see the enclosing #ifdef).
     *
     * Reads the CPU capability flags via x86_simd_caps() and then discards
     * them: the body assigns no function pointers. Every dispatch name
     * visible above is a #define to one fixed symbol, so in this
     * configuration there is nothing left to select at run time.
     */
    137 static void setup_rtcd_internal(void)
    138 {
    139     int flags = x86_simd_caps();
    140 
    /* The cast to void marks flags as deliberately unused. */
    141     (void)flags;
    142 
    143 }
    144 #endif
    145 
    146 #ifdef __cplusplus
    147 }  // extern "C"
    148 #endif
    149 
    150 #endif
    151