diff options
author | Allan Sandfeld Jensen <allan.jensen@qt.io> | 2018-08-28 15:28:34 +0200 |
---|---|---|
committer | Allan Sandfeld Jensen <allan.jensen@qt.io> | 2018-08-28 13:54:51 +0000 |
commit | 2a19c63448c84c1805fb1a585c3651318bb86ca7 (patch) | |
tree | eb17888e8531aa6ee5e85721bd553b832a7e5156 /chromium/third_party/libaom/source/config/linux/ia32/config/av1_rtcd.h | |
parent | b014812705fc80bff0a5c120dfcef88f349816dc (diff) | |
download | qtwebengine-chromium-2a19c63448c84c1805fb1a585c3651318bb86ca7.tar.gz |
BASELINE: Update Chromium to 69.0.3497.70
Change-Id: I2b7b56e4e7a8b26656930def0d4575dc32b900a0
Reviewed-by: Allan Sandfeld Jensen <allan.jensen@qt.io>
Diffstat (limited to 'chromium/third_party/libaom/source/config/linux/ia32/config/av1_rtcd.h')
-rw-r--r-- | chromium/third_party/libaom/source/config/linux/ia32/config/av1_rtcd.h | 2225 |
1 files changed, 2225 insertions, 0 deletions
diff --git a/chromium/third_party/libaom/source/config/linux/ia32/config/av1_rtcd.h b/chromium/third_party/libaom/source/config/linux/ia32/config/av1_rtcd.h new file mode 100644 index 00000000000..724cd0b6808 --- /dev/null +++ b/chromium/third_party/libaom/source/config/linux/ia32/config/av1_rtcd.h @@ -0,0 +1,2225 @@ +// This file is generated. Do not edit. +#ifndef AV1_RTCD_H_ +#define AV1_RTCD_H_ + +#ifdef RTCD_C +#define RTCD_EXTERN +#else +#define RTCD_EXTERN extern +#endif + +/* + * AV1 + */ + +#include "aom/aom_integer.h" +#include "aom_dsp/txfm_common.h" +#include "av1/common/av1_txfm.h" +#include "av1/common/common.h" +#include "av1/common/convolve.h" +#include "av1/common/enums.h" +#include "av1/common/filter.h" +#include "av1/common/odintrin.h" +#include "av1/common/quant_common.h" +#include "av1/common/restoration.h" + +struct macroblockd; + +/* Encoder forward decls */ +struct macroblock; +struct txfm_param; +struct aom_variance_vtable; +struct search_site_config; +struct yv12_buffer_config; + +/* Function pointers return by CfL functions */ +typedef void (*cfl_subsample_lbd_fn)(const uint8_t* input, + int input_stride, + uint16_t* output_q3); + +typedef void (*cfl_subsample_hbd_fn)(const uint16_t* input, + int input_stride, + uint16_t* output_q3); + +typedef void (*cfl_subtract_average_fn)(const uint16_t* src, int16_t* dst); + +typedef void (*cfl_predict_lbd_fn)(const int16_t* src, + uint8_t* dst, + int dst_stride, + int alpha_q3); + +typedef void (*cfl_predict_hbd_fn)(const int16_t* src, + uint16_t* dst, + int dst_stride, + int alpha_q3, + int bd); + +#ifdef __cplusplus +extern "C" { +#endif + +void apply_selfguided_restoration_c(const uint8_t* dat, + int width, + int height, + int stride, + int eps, + const int* xqd, + uint8_t* dst, + int dst_stride, + int32_t* tmpbuf, + int bit_depth, + int highbd); +void apply_selfguided_restoration_sse4_1(const uint8_t* dat, + int width, + int height, + int stride, + int eps, + const int* xqd, + uint8_t* dst, + int dst_stride, + int32_t* tmpbuf, + int bit_depth, + int highbd); +void apply_selfguided_restoration_avx2(const uint8_t* dat, + int width, + int height, + int stride, + int eps, + const int* xqd, + uint8_t* dst, + int dst_stride, + int32_t* tmpbuf, + int bit_depth, + int highbd); +RTCD_EXTERN void (*apply_selfguided_restoration)(const uint8_t* dat, + int width, + int height, + int stride, + int eps, + const int* xqd, + uint8_t* dst, + int dst_stride, + int32_t* tmpbuf, + int bit_depth, + int highbd); + +void av1_build_compound_diffwtd_mask_c(uint8_t* mask, + DIFFWTD_MASK_TYPE mask_type, + const uint8_t* src0, + int src0_stride, + const uint8_t* src1, + int src1_stride, + int h, + int w); +void av1_build_compound_diffwtd_mask_sse4_1(uint8_t* mask, + DIFFWTD_MASK_TYPE mask_type, + const uint8_t* src0, + int src0_stride, + const uint8_t* src1, + int src1_stride, + int h, + int w); +RTCD_EXTERN void (*av1_build_compound_diffwtd_mask)(uint8_t* mask, + DIFFWTD_MASK_TYPE mask_type, + const uint8_t* src0, + int src0_stride, + const uint8_t* src1, + int src1_stride, + int h, + int w); + +void av1_build_compound_diffwtd_mask_d16_c(uint8_t* mask, + DIFFWTD_MASK_TYPE mask_type, + const CONV_BUF_TYPE* src0, + int src0_stride, + const CONV_BUF_TYPE* src1, + int src1_stride, + int h, + int w, + ConvolveParams* conv_params, + int bd); +void av1_build_compound_diffwtd_mask_d16_sse4_1(uint8_t* mask, + DIFFWTD_MASK_TYPE mask_type, + const CONV_BUF_TYPE* src0, + int src0_stride, + const CONV_BUF_TYPE* src1, + int src1_stride, + int h, + int w, + ConvolveParams* conv_params, + int bd); +RTCD_EXTERN void (*av1_build_compound_diffwtd_mask_d16)( + uint8_t* mask, + DIFFWTD_MASK_TYPE mask_type, + const CONV_BUF_TYPE* src0, + int src0_stride, + const CONV_BUF_TYPE* src1, + int src1_stride, + int h, + int w, + ConvolveParams* conv_params, + int bd); + +void av1_build_compound_diffwtd_mask_highbd_c(uint8_t* mask, + DIFFWTD_MASK_TYPE mask_type, + const uint8_t* src0, + int src0_stride, + const uint8_t* src1, + int src1_stride, + int h, + int w, + int bd); +void av1_build_compound_diffwtd_mask_highbd_ssse3(uint8_t* mask, + DIFFWTD_MASK_TYPE mask_type, + const uint8_t* src0, + int src0_stride, + const uint8_t* src1, + int src1_stride, + int h, + int w, + int bd); +void av1_build_compound_diffwtd_mask_highbd_avx2(uint8_t* mask, + DIFFWTD_MASK_TYPE mask_type, + const uint8_t* src0, + int src0_stride, + const uint8_t* src1, + int src1_stride, + int h, + int w, + int bd); +RTCD_EXTERN void (*av1_build_compound_diffwtd_mask_highbd)( + uint8_t* mask, + DIFFWTD_MASK_TYPE mask_type, + const uint8_t* src0, + int src0_stride, + const uint8_t* src1, + int src1_stride, + int h, + int w, + int bd); + +void av1_convolve_2d_copy_sr_c(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_convolve_2d_copy_sr_sse2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_convolve_2d_copy_sr_avx2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +RTCD_EXTERN void (*av1_convolve_2d_copy_sr)(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); + +void av1_convolve_2d_scale_c(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_qn, + const int x_step_qn, + const int subpel_y_q4, + const int y_step_qn, + ConvolveParams* conv_params); +void av1_convolve_2d_scale_sse4_1(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_qn, + const int x_step_qn, + const int subpel_y_q4, + const int y_step_qn, + ConvolveParams* conv_params); +RTCD_EXTERN void (*av1_convolve_2d_scale)(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_qn, + const int x_step_qn, + const int subpel_y_q4, + const int y_step_qn, + ConvolveParams* conv_params); + +void av1_convolve_2d_sr_c(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_convolve_2d_sr_sse2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_convolve_2d_sr_avx2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +RTCD_EXTERN void (*av1_convolve_2d_sr)(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); + +void av1_convolve_horiz_rs_c(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + const int16_t* x_filters, + int x0_qn, + int x_step_qn); +void av1_convolve_horiz_rs_sse4_1(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + const int16_t* x_filters, + int x0_qn, + int x_step_qn); +RTCD_EXTERN void (*av1_convolve_horiz_rs)(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + const int16_t* x_filters, + int x0_qn, + int x_step_qn); + +void av1_convolve_x_sr_c(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_convolve_x_sr_sse2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_convolve_x_sr_avx2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +RTCD_EXTERN void (*av1_convolve_x_sr)(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); + +void av1_convolve_y_sr_c(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_convolve_y_sr_sse2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_convolve_y_sr_avx2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +RTCD_EXTERN void (*av1_convolve_y_sr)(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); + +void av1_dr_prediction_z1_c(uint8_t* dst, + ptrdiff_t stride, + int bw, + int bh, + const uint8_t* above, + const uint8_t* left, + int upsample_above, + int dx, + int dy); +#define av1_dr_prediction_z1 av1_dr_prediction_z1_c + +void av1_dr_prediction_z2_c(uint8_t* dst, + ptrdiff_t stride, + int bw, + int bh, + const uint8_t* above, + const uint8_t* left, + int upsample_above, + int upsample_left, + int dx, + int dy); +#define av1_dr_prediction_z2 av1_dr_prediction_z2_c + +void av1_dr_prediction_z3_c(uint8_t* dst, + ptrdiff_t stride, + int bw, + int bh, + const uint8_t* above, + const uint8_t* left, + int upsample_left, + int dx, + int dy); +#define av1_dr_prediction_z3 av1_dr_prediction_z3_c + +void av1_filter_intra_edge_c(uint8_t* p, int sz, int strength); +void av1_filter_intra_edge_sse4_1(uint8_t* p, int sz, int strength); +RTCD_EXTERN void (*av1_filter_intra_edge)(uint8_t* p, int sz, int strength); + +void av1_filter_intra_edge_high_c(uint16_t* p, int sz, int strength); +void av1_filter_intra_edge_high_sse4_1(uint16_t* p, int sz, int strength); +RTCD_EXTERN void (*av1_filter_intra_edge_high)(uint16_t* p, + int sz, + int strength); + +void av1_filter_intra_predictor_c(uint8_t* dst, + ptrdiff_t stride, + TX_SIZE tx_size, + const uint8_t* above, + const uint8_t* left, + int mode); +void av1_filter_intra_predictor_sse4_1(uint8_t* dst, + ptrdiff_t stride, + TX_SIZE tx_size, + const uint8_t* above, + const uint8_t* left, + int mode); +RTCD_EXTERN void (*av1_filter_intra_predictor)(uint8_t* dst, + ptrdiff_t stride, + TX_SIZE tx_size, + const uint8_t* above, + const uint8_t* left, + int mode); + +void av1_highbd_convolve8_c(const uint8_t* src, + ptrdiff_t src_stride, + uint8_t* dst, + ptrdiff_t dst_stride, + const int16_t* filter_x, + int x_step_q4, + const int16_t* filter_y, + int y_step_q4, + int w, + int h, + int bps); +#define av1_highbd_convolve8 av1_highbd_convolve8_c + +void av1_highbd_convolve8_horiz_c(const uint8_t* src, + ptrdiff_t src_stride, + uint8_t* dst, + ptrdiff_t dst_stride, + const int16_t* filter_x, + int x_step_q4, + const int16_t* filter_y, + int y_step_q4, + int w, + int h, + int bps); +#define av1_highbd_convolve8_horiz av1_highbd_convolve8_horiz_c + +void av1_highbd_convolve8_vert_c(const uint8_t* src, + ptrdiff_t src_stride, + uint8_t* dst, + ptrdiff_t dst_stride, + const int16_t* filter_x, + int x_step_q4, + const int16_t* filter_y, + int y_step_q4, + int w, + int h, + int bps); +#define av1_highbd_convolve8_vert av1_highbd_convolve8_vert_c + +void av1_highbd_convolve_2d_copy_sr_c(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_convolve_2d_copy_sr_sse2(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_convolve_2d_copy_sr_avx2(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +RTCD_EXTERN void (*av1_highbd_convolve_2d_copy_sr)( + const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); + +void av1_highbd_convolve_2d_scale_c(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int x_step_qn, + const int subpel_y_q4, + const int y_step_qn, + ConvolveParams* conv_params, + int bd); +void av1_highbd_convolve_2d_scale_sse4_1(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int x_step_qn, + const int subpel_y_q4, + const int y_step_qn, + ConvolveParams* conv_params, + int bd); +RTCD_EXTERN void (*av1_highbd_convolve_2d_scale)( + const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int x_step_qn, + const int subpel_y_q4, + const int y_step_qn, + ConvolveParams* conv_params, + int bd); + +void av1_highbd_convolve_2d_sr_c(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_convolve_2d_sr_ssse3(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_convolve_2d_sr_avx2(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +RTCD_EXTERN void (*av1_highbd_convolve_2d_sr)( + const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); + +void av1_highbd_convolve_avg_c(const uint8_t* src, + ptrdiff_t src_stride, + uint8_t* dst, + ptrdiff_t dst_stride, + const int16_t* filter_x, + int x_step_q4, + const int16_t* filter_y, + int y_step_q4, + int w, + int h, + int bps); +#define av1_highbd_convolve_avg av1_highbd_convolve_avg_c + +void av1_highbd_convolve_copy_c(const uint8_t* src, + ptrdiff_t src_stride, + uint8_t* dst, + ptrdiff_t dst_stride, + const int16_t* filter_x, + int x_step_q4, + const int16_t* filter_y, + int y_step_q4, + int w, + int h, + int bps); +#define av1_highbd_convolve_copy av1_highbd_convolve_copy_c + +void av1_highbd_convolve_horiz_rs_c(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + const int16_t* x_filters, + int x0_qn, + int x_step_qn, + int bd); +void av1_highbd_convolve_horiz_rs_sse4_1(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + const int16_t* x_filters, + int x0_qn, + int x_step_qn, + int bd); +RTCD_EXTERN void (*av1_highbd_convolve_horiz_rs)(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + const int16_t* x_filters, + int x0_qn, + int x_step_qn, + int bd); + +void av1_highbd_convolve_x_sr_c(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_convolve_x_sr_ssse3(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_convolve_x_sr_avx2(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +RTCD_EXTERN void (*av1_highbd_convolve_x_sr)( + const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); + +void av1_highbd_convolve_y_sr_c(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_convolve_y_sr_ssse3(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_convolve_y_sr_avx2(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +RTCD_EXTERN void (*av1_highbd_convolve_y_sr)( + const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); + +void av1_highbd_dr_prediction_z1_c(uint16_t* dst, + ptrdiff_t stride, + int bw, + int bh, + const uint16_t* above, + const uint16_t* left, + int upsample_above, + int dx, + int dy, + int bd); +#define av1_highbd_dr_prediction_z1 av1_highbd_dr_prediction_z1_c + +void av1_highbd_dr_prediction_z2_c(uint16_t* dst, + ptrdiff_t stride, + int bw, + int bh, + const uint16_t* above, + const uint16_t* left, + int upsample_above, + int upsample_left, + int dx, + int dy, + int bd); +#define av1_highbd_dr_prediction_z2 av1_highbd_dr_prediction_z2_c + +void av1_highbd_dr_prediction_z3_c(uint16_t* dst, + ptrdiff_t stride, + int bw, + int bh, + const uint16_t* above, + const uint16_t* left, + int upsample_left, + int dx, + int dy, + int bd); +#define av1_highbd_dr_prediction_z3 av1_highbd_dr_prediction_z3_c + +void av1_highbd_iwht4x4_16_add_c(const tran_low_t* input, + uint8_t* dest, + int dest_stride, + int bd); +#define av1_highbd_iwht4x4_16_add av1_highbd_iwht4x4_16_add_c + +void av1_highbd_iwht4x4_1_add_c(const tran_low_t* input, + uint8_t* dest, + int dest_stride, + int bd); +#define av1_highbd_iwht4x4_1_add av1_highbd_iwht4x4_1_add_c + +void av1_highbd_jnt_convolve_2d_c(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_jnt_convolve_2d_sse4_1(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_jnt_convolve_2d_avx2(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +RTCD_EXTERN void (*av1_highbd_jnt_convolve_2d)( + const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); + +void av1_highbd_jnt_convolve_2d_copy_c(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_jnt_convolve_2d_copy_sse4_1(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_jnt_convolve_2d_copy_avx2(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +RTCD_EXTERN void (*av1_highbd_jnt_convolve_2d_copy)( + const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); + +void av1_highbd_jnt_convolve_x_c(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_jnt_convolve_x_sse4_1(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_jnt_convolve_x_avx2(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +RTCD_EXTERN void (*av1_highbd_jnt_convolve_x)( + const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); + +void av1_highbd_jnt_convolve_y_c(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_jnt_convolve_y_sse4_1(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +void av1_highbd_jnt_convolve_y_avx2(const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); +RTCD_EXTERN void (*av1_highbd_jnt_convolve_y)( + const uint16_t* src, + int src_stride, + uint16_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params, + int bd); + +void av1_highbd_warp_affine_c(const int32_t* mat, + const uint16_t* ref, + int width, + int height, + int stride, + uint16_t* pred, + int p_col, + int p_row, + int p_width, + int p_height, + int p_stride, + int subsampling_x, + int subsampling_y, + int bd, + ConvolveParams* conv_params, + int16_t alpha, + int16_t beta, + int16_t gamma, + int16_t delta); +void av1_highbd_warp_affine_sse4_1(const int32_t* mat, + const uint16_t* ref, + int width, + int height, + int stride, + uint16_t* pred, + int p_col, + int p_row, + int p_width, + int p_height, + int p_stride, + int subsampling_x, + int subsampling_y, + int bd, + ConvolveParams* conv_params, + int16_t alpha, + int16_t beta, + int16_t gamma, + int16_t delta); +RTCD_EXTERN void (*av1_highbd_warp_affine)(const int32_t* mat, + const uint16_t* ref, + int width, + int height, + int stride, + uint16_t* pred, + int p_col, + int p_row, + int p_width, + int p_height, + int p_stride, + int subsampling_x, + int subsampling_y, + int bd, + ConvolveParams* conv_params, + int16_t alpha, + int16_t beta, + int16_t gamma, + int16_t delta); + +void av1_highbd_wiener_convolve_add_src_c(const uint8_t* src, + ptrdiff_t src_stride, + uint8_t* dst, + ptrdiff_t dst_stride, + const int16_t* filter_x, + int x_step_q4, + const int16_t* filter_y, + int y_step_q4, + int w, + int h, + const ConvolveParams* conv_params, + int bps); +void av1_highbd_wiener_convolve_add_src_ssse3(const uint8_t* src, + ptrdiff_t src_stride, + uint8_t* dst, + ptrdiff_t dst_stride, + const int16_t* filter_x, + int x_step_q4, + const int16_t* filter_y, + int y_step_q4, + int w, + int h, + const ConvolveParams* conv_params, + int bps); +void av1_highbd_wiener_convolve_add_src_avx2(const uint8_t* src, + ptrdiff_t src_stride, + uint8_t* dst, + ptrdiff_t dst_stride, + const int16_t* filter_x, + int x_step_q4, + const int16_t* filter_y, + int y_step_q4, + int w, + int h, + const ConvolveParams* conv_params, + int bps); +RTCD_EXTERN void (*av1_highbd_wiener_convolve_add_src)( + const uint8_t* src, + ptrdiff_t src_stride, + uint8_t* dst, + ptrdiff_t dst_stride, + const int16_t* filter_x, + int x_step_q4, + const int16_t* filter_y, + int y_step_q4, + int w, + int h, + const ConvolveParams* conv_params, + int bps); + +void av1_inv_txfm2d_add_16x16_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +void av1_inv_txfm2d_add_16x16_sse4_1(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +RTCD_EXTERN void (*av1_inv_txfm2d_add_16x16)(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); + +void av1_inv_txfm2d_add_16x32_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +#define av1_inv_txfm2d_add_16x32 av1_inv_txfm2d_add_16x32_c + +void av1_inv_txfm2d_add_16x4_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +#define av1_inv_txfm2d_add_16x4 av1_inv_txfm2d_add_16x4_c + +void av1_inv_txfm2d_add_16x64_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +#define av1_inv_txfm2d_add_16x64 av1_inv_txfm2d_add_16x64_c + +void av1_inv_txfm2d_add_16x8_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +#define av1_inv_txfm2d_add_16x8 av1_inv_txfm2d_add_16x8_c + +void av1_inv_txfm2d_add_32x16_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +#define av1_inv_txfm2d_add_32x16 av1_inv_txfm2d_add_32x16_c + +void av1_inv_txfm2d_add_32x32_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +void av1_inv_txfm2d_add_32x32_avx2(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +RTCD_EXTERN void (*av1_inv_txfm2d_add_32x32)(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); + +void av1_inv_txfm2d_add_32x64_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +#define av1_inv_txfm2d_add_32x64 av1_inv_txfm2d_add_32x64_c + +void av1_inv_txfm2d_add_32x8_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +#define av1_inv_txfm2d_add_32x8 av1_inv_txfm2d_add_32x8_c + +void av1_inv_txfm2d_add_4x16_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +#define av1_inv_txfm2d_add_4x16 av1_inv_txfm2d_add_4x16_c + +void av1_inv_txfm2d_add_4x4_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +void av1_inv_txfm2d_add_4x4_sse4_1(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +RTCD_EXTERN void (*av1_inv_txfm2d_add_4x4)(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); + +void av1_inv_txfm2d_add_4x8_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +#define av1_inv_txfm2d_add_4x8 av1_inv_txfm2d_add_4x8_c + +void av1_inv_txfm2d_add_64x16_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +#define av1_inv_txfm2d_add_64x16 av1_inv_txfm2d_add_64x16_c + +void av1_inv_txfm2d_add_64x32_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +#define av1_inv_txfm2d_add_64x32 av1_inv_txfm2d_add_64x32_c + +void av1_inv_txfm2d_add_64x64_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +void av1_inv_txfm2d_add_64x64_sse4_1(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +RTCD_EXTERN void (*av1_inv_txfm2d_add_64x64)(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); + +void av1_inv_txfm2d_add_8x16_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +#define av1_inv_txfm2d_add_8x16 av1_inv_txfm2d_add_8x16_c + +void av1_inv_txfm2d_add_8x32_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +#define av1_inv_txfm2d_add_8x32 av1_inv_txfm2d_add_8x32_c + +void av1_inv_txfm2d_add_8x4_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +#define av1_inv_txfm2d_add_8x4 av1_inv_txfm2d_add_8x4_c + +void av1_inv_txfm2d_add_8x8_c(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +void av1_inv_txfm2d_add_8x8_sse4_1(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); +RTCD_EXTERN void (*av1_inv_txfm2d_add_8x8)(const int32_t* input, + uint16_t* output, + int stride, + TX_TYPE tx_type, + int bd); + +void av1_inv_txfm_add_c(const tran_low_t* dqcoeff, + uint8_t* dst, + int stride, + const TxfmParam* txfm_param); +void av1_inv_txfm_add_ssse3(const tran_low_t* dqcoeff, + uint8_t* dst, + int stride, + const TxfmParam* txfm_param); +void av1_inv_txfm_add_avx2(const tran_low_t* dqcoeff, + uint8_t* dst, + int stride, + const TxfmParam* txfm_param); +RTCD_EXTERN void (*av1_inv_txfm_add)(const tran_low_t* dqcoeff, + uint8_t* dst, + int stride, + const TxfmParam* txfm_param); + +void av1_jnt_convolve_2d_c(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_jnt_convolve_2d_ssse3(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_jnt_convolve_2d_avx2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +RTCD_EXTERN void (*av1_jnt_convolve_2d)(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); + +void av1_jnt_convolve_2d_copy_c(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_jnt_convolve_2d_copy_sse2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_jnt_convolve_2d_copy_avx2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +RTCD_EXTERN void (*av1_jnt_convolve_2d_copy)( + const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); + +void av1_jnt_convolve_x_c(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_jnt_convolve_x_sse2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_jnt_convolve_x_avx2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +RTCD_EXTERN void (*av1_jnt_convolve_x)(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); + +void av1_jnt_convolve_y_c(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_jnt_convolve_y_sse2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +void av1_jnt_convolve_y_avx2(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); +RTCD_EXTERN void (*av1_jnt_convolve_y)(const uint8_t* src, + int src_stride, + uint8_t* dst, + int dst_stride, + int w, + int h, + InterpFilterParams* filter_params_x, + InterpFilterParams* filter_params_y, + const int subpel_x_q4, + const int subpel_y_q4, + ConvolveParams* conv_params); + +void av1_selfguided_restoration_c(const uint8_t* dgd8, + int width, + int height, + int dgd_stride, + int32_t* flt0, + int32_t* flt1, + int flt_stride, + int sgr_params_idx, + int bit_depth, + int highbd); +void av1_selfguided_restoration_sse4_1(const uint8_t* dgd8, + int width, + int height, + int dgd_stride, + int32_t* flt0, + int32_t* flt1, + int flt_stride, + int sgr_params_idx, + int bit_depth, + int highbd); +void av1_selfguided_restoration_avx2(const uint8_t* dgd8, + int width, + int height, + int dgd_stride, + int32_t* flt0, + int32_t* flt1, + int flt_stride, + int sgr_params_idx, + int bit_depth, + int highbd); +RTCD_EXTERN void (*av1_selfguided_restoration)(const uint8_t* dgd8, + int width, + int height, + int dgd_stride, + int32_t* flt0, + int32_t* flt1, + int flt_stride, + int sgr_params_idx, + int bit_depth, + int highbd); + +void av1_upsample_intra_edge_c(uint8_t* p, int sz); +void av1_upsample_intra_edge_sse4_1(uint8_t* p, int sz); +RTCD_EXTERN void (*av1_upsample_intra_edge)(uint8_t* p, int sz); + +void av1_upsample_intra_edge_high_c(uint16_t* p, int sz, int bd); +void av1_upsample_intra_edge_high_sse4_1(uint16_t* p, int sz, int bd); +RTCD_EXTERN void (*av1_upsample_intra_edge_high)(uint16_t* p, int sz, int bd); + +void av1_warp_affine_c(const int32_t* mat, + const uint8_t* ref, + int width, + int height, + int stride, + uint8_t* pred, + int p_col, + int p_row, + int p_width, + int p_height, + int p_stride, + int subsampling_x, + int subsampling_y, + ConvolveParams* conv_params, + int16_t alpha, + int16_t beta, + int16_t gamma, + int16_t delta); +void av1_warp_affine_sse4_1(const int32_t* mat, + const uint8_t* ref, + int width, + int height, + int stride, + uint8_t* pred, + int p_col, + int p_row, + int p_width, + int p_height, + int p_stride, + int subsampling_x, + int subsampling_y, + ConvolveParams* conv_params, + int16_t alpha, + int16_t beta, + int16_t gamma, + int16_t delta); +RTCD_EXTERN void (*av1_warp_affine)(const int32_t* mat, + const uint8_t* ref, + int width, + int height, + int stride, + uint8_t* pred, + int p_col, + int p_row, + int p_width, + int p_height, + int p_stride, + int subsampling_x, + int subsampling_y, + ConvolveParams* conv_params, + int16_t alpha, + int16_t beta, + int16_t gamma, + int16_t delta); + +void av1_wiener_convolve_add_src_c(const uint8_t* src, + ptrdiff_t src_stride, + uint8_t* dst, + ptrdiff_t dst_stride, + const int16_t* filter_x, + int x_step_q4, + const int16_t* filter_y, + int y_step_q4, + int w, + int h, + const ConvolveParams* conv_params); +void av1_wiener_convolve_add_src_sse2(const uint8_t* src, + ptrdiff_t src_stride, + uint8_t* dst, + ptrdiff_t dst_stride, + const int16_t* filter_x, + int x_step_q4, + const int16_t* filter_y, + int y_step_q4, + int w, + int h, + const ConvolveParams* conv_params); +void av1_wiener_convolve_add_src_avx2(const uint8_t* src, + ptrdiff_t src_stride, + uint8_t* dst, + ptrdiff_t dst_stride, + const int16_t* filter_x, + int x_step_q4, + const int16_t* filter_y, + int y_step_q4, + int w, + int h, + const ConvolveParams* conv_params); +RTCD_EXTERN void (*av1_wiener_convolve_add_src)( + const uint8_t* src, + ptrdiff_t src_stride, + uint8_t* dst, + ptrdiff_t dst_stride, + const int16_t* filter_x, + int x_step_q4, + const int16_t* filter_y, + int y_step_q4, + int w, + int h, + const ConvolveParams* conv_params); + +void cdef_filter_block_c(uint8_t* dst8, + uint16_t* dst16, + int dstride, + const uint16_t* in, + int pri_strength, + int sec_strength, + int dir, + int pri_damping, + int sec_damping, + int bsize, + int max, + int coeff_shift); +void cdef_filter_block_sse2(uint8_t* dst8, + uint16_t* dst16, + int dstride, + const uint16_t* in, + int pri_strength, + int sec_strength, + int dir, + int pri_damping, + int sec_damping, + int bsize, + int max, + int coeff_shift); +void cdef_filter_block_ssse3(uint8_t* dst8, + uint16_t* dst16, + int dstride, + const uint16_t* in, + int pri_strength, + int sec_strength, + int dir, + int pri_damping, + int sec_damping, + int bsize, + int max, + int coeff_shift); +void cdef_filter_block_sse4_1(uint8_t* dst8, + uint16_t* dst16, + int dstride, + const uint16_t* in, + int pri_strength, + int sec_strength, + int dir, + int pri_damping, + int sec_damping, + int bsize, + int max, + int coeff_shift); +void cdef_filter_block_avx2(uint8_t* dst8, + uint16_t* dst16, + int dstride, + const uint16_t* in, + int pri_strength, + int sec_strength, + int dir, + int pri_damping, + int sec_damping, + int bsize, + int max, + int coeff_shift); +RTCD_EXTERN void (*cdef_filter_block)(uint8_t* dst8, + uint16_t* dst16, + int dstride, + const uint16_t* in, + int pri_strength, + int sec_strength, + int dir, + int pri_damping, + int sec_damping, + int bsize, + int max, + int coeff_shift); + +int cdef_find_dir_c(const uint16_t* img, + int stride, + int32_t* var, + int coeff_shift); +int cdef_find_dir_sse2(const uint16_t* img, + int stride, + int32_t* var, + int coeff_shift); +int cdef_find_dir_ssse3(const uint16_t* img, + int stride, + int32_t* var, + int coeff_shift); +int cdef_find_dir_sse4_1(const uint16_t* img, + int stride, + int32_t* var, + int coeff_shift); +int cdef_find_dir_avx2(const uint16_t* img, + int stride, + int32_t* var, + int coeff_shift); +RTCD_EXTERN int (*cdef_find_dir)(const uint16_t* img, + int stride, + int32_t* var, + int coeff_shift); + +cfl_subsample_hbd_fn cfl_get_luma_subsampling_420_hbd_c(TX_SIZE tx_size); +cfl_subsample_hbd_fn cfl_get_luma_subsampling_420_hbd_ssse3(TX_SIZE tx_size); +cfl_subsample_hbd_fn cfl_get_luma_subsampling_420_hbd_avx2(TX_SIZE tx_size); +RTCD_EXTERN cfl_subsample_hbd_fn (*cfl_get_luma_subsampling_420_hbd)( + TX_SIZE tx_size); + +cfl_subsample_lbd_fn cfl_get_luma_subsampling_420_lbd_c(TX_SIZE tx_size); +cfl_subsample_lbd_fn cfl_get_luma_subsampling_420_lbd_ssse3(TX_SIZE tx_size); +cfl_subsample_lbd_fn cfl_get_luma_subsampling_420_lbd_avx2(TX_SIZE tx_size); +RTCD_EXTERN cfl_subsample_lbd_fn (*cfl_get_luma_subsampling_420_lbd)( + TX_SIZE tx_size); + +cfl_subsample_hbd_fn cfl_get_luma_subsampling_422_hbd_c(TX_SIZE tx_size); +cfl_subsample_hbd_fn cfl_get_luma_subsampling_422_hbd_ssse3(TX_SIZE tx_size); +cfl_subsample_hbd_fn cfl_get_luma_subsampling_422_hbd_avx2(TX_SIZE tx_size); +RTCD_EXTERN cfl_subsample_hbd_fn (*cfl_get_luma_subsampling_422_hbd)( + TX_SIZE tx_size); + +cfl_subsample_lbd_fn cfl_get_luma_subsampling_422_lbd_c(TX_SIZE tx_size); +cfl_subsample_lbd_fn cfl_get_luma_subsampling_422_lbd_ssse3(TX_SIZE tx_size); +cfl_subsample_lbd_fn cfl_get_luma_subsampling_422_lbd_avx2(TX_SIZE tx_size); +RTCD_EXTERN cfl_subsample_lbd_fn (*cfl_get_luma_subsampling_422_lbd)( + TX_SIZE tx_size); + +cfl_subsample_hbd_fn cfl_get_luma_subsampling_444_hbd_c(TX_SIZE tx_size); +cfl_subsample_hbd_fn cfl_get_luma_subsampling_444_hbd_ssse3(TX_SIZE tx_size); +cfl_subsample_hbd_fn cfl_get_luma_subsampling_444_hbd_avx2(TX_SIZE tx_size); +RTCD_EXTERN cfl_subsample_hbd_fn (*cfl_get_luma_subsampling_444_hbd)( + TX_SIZE tx_size); + +cfl_subsample_lbd_fn cfl_get_luma_subsampling_444_lbd_c(TX_SIZE tx_size); +cfl_subsample_lbd_fn cfl_get_luma_subsampling_444_lbd_ssse3(TX_SIZE tx_size); +cfl_subsample_lbd_fn cfl_get_luma_subsampling_444_lbd_avx2(TX_SIZE tx_size); +RTCD_EXTERN cfl_subsample_lbd_fn (*cfl_get_luma_subsampling_444_lbd)( + TX_SIZE tx_size); + +void copy_rect8_16bit_to_16bit_c(uint16_t* dst, + int dstride, + const uint16_t* src, + int sstride, + int v, + int h); +void copy_rect8_16bit_to_16bit_sse2(uint16_t* dst, + int dstride, + const uint16_t* src, + int sstride, + int v, + int h); +void copy_rect8_16bit_to_16bit_ssse3(uint16_t* dst, + int dstride, + const uint16_t* src, + int sstride, + int v, + int h); +void copy_rect8_16bit_to_16bit_sse4_1(uint16_t* dst, + int dstride, + const uint16_t* src, + int sstride, + int v, + int h); +void copy_rect8_16bit_to_16bit_avx2(uint16_t* dst, + int dstride, + const uint16_t* src, + int sstride, + int v, + int h); +RTCD_EXTERN void (*copy_rect8_16bit_to_16bit)(uint16_t* dst, + int dstride, + const uint16_t* src, + int sstride, + int v, + int h); + +void copy_rect8_8bit_to_16bit_c(uint16_t* dst, + int dstride, + const uint8_t* src, + int sstride, + int v, + int h); +void copy_rect8_8bit_to_16bit_sse2(uint16_t* dst, + int dstride, + const uint8_t* src, + int sstride, + int v, + int h); +void copy_rect8_8bit_to_16bit_ssse3(uint16_t* dst, + int dstride, + const uint8_t* src, + int sstride, + int v, + int h); +void copy_rect8_8bit_to_16bit_sse4_1(uint16_t* dst, + int dstride, + const uint8_t* src, + int sstride, + int v, + int h); +void copy_rect8_8bit_to_16bit_avx2(uint16_t* dst, + int dstride, + const uint8_t* src, + int sstride, + int v, + int h); +RTCD_EXTERN void (*copy_rect8_8bit_to_16bit)(uint16_t* dst, + int dstride, + const uint8_t* src, + int sstride, + int v, + int h); + +cfl_predict_hbd_fn get_predict_hbd_fn_c(TX_SIZE tx_size); +cfl_predict_hbd_fn get_predict_hbd_fn_ssse3(TX_SIZE tx_size); +cfl_predict_hbd_fn get_predict_hbd_fn_avx2(TX_SIZE tx_size); +RTCD_EXTERN cfl_predict_hbd_fn (*get_predict_hbd_fn)(TX_SIZE tx_size); + +cfl_predict_lbd_fn get_predict_lbd_fn_c(TX_SIZE tx_size); +cfl_predict_lbd_fn get_predict_lbd_fn_ssse3(TX_SIZE tx_size); +cfl_predict_lbd_fn get_predict_lbd_fn_avx2(TX_SIZE tx_size); +RTCD_EXTERN cfl_predict_lbd_fn (*get_predict_lbd_fn)(TX_SIZE tx_size); + +cfl_subtract_average_fn get_subtract_average_fn_c(TX_SIZE tx_size); +cfl_subtract_average_fn get_subtract_average_fn_sse2(TX_SIZE tx_size); +cfl_subtract_average_fn get_subtract_average_fn_avx2(TX_SIZE tx_size); +RTCD_EXTERN cfl_subtract_average_fn (*get_subtract_average_fn)(TX_SIZE tx_size); + +void av1_rtcd(void); + +#ifdef RTCD_C +#include "aom_ports/x86.h" +static void setup_rtcd_internal(void) { + int flags = x86_simd_caps(); + + (void)flags; + + apply_selfguided_restoration = apply_selfguided_restoration_c; + if (flags & HAS_SSE4_1) + apply_selfguided_restoration = apply_selfguided_restoration_sse4_1; + if (flags & HAS_AVX2) + apply_selfguided_restoration = apply_selfguided_restoration_avx2; + av1_build_compound_diffwtd_mask = av1_build_compound_diffwtd_mask_c; + if (flags & HAS_SSE4_1) + av1_build_compound_diffwtd_mask = av1_build_compound_diffwtd_mask_sse4_1; + av1_build_compound_diffwtd_mask_d16 = av1_build_compound_diffwtd_mask_d16_c; + if (flags & HAS_SSE4_1) + av1_build_compound_diffwtd_mask_d16 = + av1_build_compound_diffwtd_mask_d16_sse4_1; + av1_build_compound_diffwtd_mask_highbd = + av1_build_compound_diffwtd_mask_highbd_c; + if (flags & HAS_SSSE3) + av1_build_compound_diffwtd_mask_highbd = + av1_build_compound_diffwtd_mask_highbd_ssse3; + if (flags & HAS_AVX2) + av1_build_compound_diffwtd_mask_highbd = + av1_build_compound_diffwtd_mask_highbd_avx2; + av1_convolve_2d_copy_sr = av1_convolve_2d_copy_sr_c; + if (flags & HAS_SSE2) + av1_convolve_2d_copy_sr = av1_convolve_2d_copy_sr_sse2; + if (flags & HAS_AVX2) + av1_convolve_2d_copy_sr = av1_convolve_2d_copy_sr_avx2; + av1_convolve_2d_scale = av1_convolve_2d_scale_c; + if (flags & HAS_SSE4_1) + av1_convolve_2d_scale = av1_convolve_2d_scale_sse4_1; + av1_convolve_2d_sr = av1_convolve_2d_sr_c; + if (flags & HAS_SSE2) + av1_convolve_2d_sr = av1_convolve_2d_sr_sse2; + if (flags & HAS_AVX2) + av1_convolve_2d_sr = av1_convolve_2d_sr_avx2; + av1_convolve_horiz_rs = av1_convolve_horiz_rs_c; + if (flags & HAS_SSE4_1) + av1_convolve_horiz_rs = av1_convolve_horiz_rs_sse4_1; + av1_convolve_x_sr = av1_convolve_x_sr_c; + if (flags & HAS_SSE2) + av1_convolve_x_sr = av1_convolve_x_sr_sse2; + if (flags & HAS_AVX2) + av1_convolve_x_sr = av1_convolve_x_sr_avx2; + av1_convolve_y_sr = av1_convolve_y_sr_c; + if (flags & HAS_SSE2) + av1_convolve_y_sr = av1_convolve_y_sr_sse2; + if (flags & HAS_AVX2) + av1_convolve_y_sr = av1_convolve_y_sr_avx2; + av1_filter_intra_edge = av1_filter_intra_edge_c; + if (flags & HAS_SSE4_1) + av1_filter_intra_edge = av1_filter_intra_edge_sse4_1; + av1_filter_intra_edge_high = av1_filter_intra_edge_high_c; + if (flags & HAS_SSE4_1) + av1_filter_intra_edge_high = av1_filter_intra_edge_high_sse4_1; + av1_filter_intra_predictor = av1_filter_intra_predictor_c; + if (flags & HAS_SSE4_1) + av1_filter_intra_predictor = av1_filter_intra_predictor_sse4_1; + av1_highbd_convolve_2d_copy_sr = av1_highbd_convolve_2d_copy_sr_c; + if (flags & HAS_SSE2) + av1_highbd_convolve_2d_copy_sr = av1_highbd_convolve_2d_copy_sr_sse2; + if (flags & HAS_AVX2) + av1_highbd_convolve_2d_copy_sr = av1_highbd_convolve_2d_copy_sr_avx2; + av1_highbd_convolve_2d_scale = av1_highbd_convolve_2d_scale_c; + if (flags & HAS_SSE4_1) + av1_highbd_convolve_2d_scale = av1_highbd_convolve_2d_scale_sse4_1; + av1_highbd_convolve_2d_sr = av1_highbd_convolve_2d_sr_c; + if (flags & HAS_SSSE3) + av1_highbd_convolve_2d_sr = av1_highbd_convolve_2d_sr_ssse3; + if (flags & HAS_AVX2) + av1_highbd_convolve_2d_sr = av1_highbd_convolve_2d_sr_avx2; + av1_highbd_convolve_horiz_rs = av1_highbd_convolve_horiz_rs_c; + if (flags & HAS_SSE4_1) + av1_highbd_convolve_horiz_rs = av1_highbd_convolve_horiz_rs_sse4_1; + av1_highbd_convolve_x_sr = av1_highbd_convolve_x_sr_c; + if (flags & HAS_SSSE3) + av1_highbd_convolve_x_sr = av1_highbd_convolve_x_sr_ssse3; + if (flags & HAS_AVX2) + av1_highbd_convolve_x_sr = av1_highbd_convolve_x_sr_avx2; + av1_highbd_convolve_y_sr = av1_highbd_convolve_y_sr_c; + if (flags & HAS_SSSE3) + av1_highbd_convolve_y_sr = av1_highbd_convolve_y_sr_ssse3; + if (flags & HAS_AVX2) + av1_highbd_convolve_y_sr = av1_highbd_convolve_y_sr_avx2; + av1_highbd_jnt_convolve_2d = av1_highbd_jnt_convolve_2d_c; + if (flags & HAS_SSE4_1) + av1_highbd_jnt_convolve_2d = av1_highbd_jnt_convolve_2d_sse4_1; + if (flags & HAS_AVX2) + av1_highbd_jnt_convolve_2d = av1_highbd_jnt_convolve_2d_avx2; + av1_highbd_jnt_convolve_2d_copy = av1_highbd_jnt_convolve_2d_copy_c; + if (flags & HAS_SSE4_1) + av1_highbd_jnt_convolve_2d_copy = av1_highbd_jnt_convolve_2d_copy_sse4_1; + if (flags & HAS_AVX2) + av1_highbd_jnt_convolve_2d_copy = av1_highbd_jnt_convolve_2d_copy_avx2; + av1_highbd_jnt_convolve_x = av1_highbd_jnt_convolve_x_c; + if (flags & HAS_SSE4_1) + av1_highbd_jnt_convolve_x = av1_highbd_jnt_convolve_x_sse4_1; + if (flags & HAS_AVX2) + av1_highbd_jnt_convolve_x = av1_highbd_jnt_convolve_x_avx2; + av1_highbd_jnt_convolve_y = av1_highbd_jnt_convolve_y_c; + if (flags & HAS_SSE4_1) + av1_highbd_jnt_convolve_y = av1_highbd_jnt_convolve_y_sse4_1; + if (flags & HAS_AVX2) + av1_highbd_jnt_convolve_y = av1_highbd_jnt_convolve_y_avx2; + av1_highbd_warp_affine = av1_highbd_warp_affine_c; + if (flags & HAS_SSE4_1) + av1_highbd_warp_affine = av1_highbd_warp_affine_sse4_1; + av1_highbd_wiener_convolve_add_src = av1_highbd_wiener_convolve_add_src_c; + if (flags & HAS_SSSE3) + av1_highbd_wiener_convolve_add_src = + av1_highbd_wiener_convolve_add_src_ssse3; + if (flags & HAS_AVX2) + av1_highbd_wiener_convolve_add_src = + av1_highbd_wiener_convolve_add_src_avx2; + av1_inv_txfm2d_add_16x16 = av1_inv_txfm2d_add_16x16_c; + if (flags & HAS_SSE4_1) + av1_inv_txfm2d_add_16x16 = av1_inv_txfm2d_add_16x16_sse4_1; + av1_inv_txfm2d_add_32x32 = av1_inv_txfm2d_add_32x32_c; + if (flags & HAS_AVX2) + av1_inv_txfm2d_add_32x32 = av1_inv_txfm2d_add_32x32_avx2; + av1_inv_txfm2d_add_4x4 = av1_inv_txfm2d_add_4x4_c; + if (flags & HAS_SSE4_1) + av1_inv_txfm2d_add_4x4 = av1_inv_txfm2d_add_4x4_sse4_1; + av1_inv_txfm2d_add_64x64 = av1_inv_txfm2d_add_64x64_c; + if (flags & HAS_SSE4_1) + av1_inv_txfm2d_add_64x64 = av1_inv_txfm2d_add_64x64_sse4_1; + av1_inv_txfm2d_add_8x8 = av1_inv_txfm2d_add_8x8_c; + if (flags & HAS_SSE4_1) + av1_inv_txfm2d_add_8x8 = av1_inv_txfm2d_add_8x8_sse4_1; + av1_inv_txfm_add = av1_inv_txfm_add_c; + if (flags & HAS_SSSE3) + av1_inv_txfm_add = av1_inv_txfm_add_ssse3; + if (flags & HAS_AVX2) + av1_inv_txfm_add = av1_inv_txfm_add_avx2; + av1_jnt_convolve_2d = av1_jnt_convolve_2d_c; + if (flags & HAS_SSSE3) + av1_jnt_convolve_2d = av1_jnt_convolve_2d_ssse3; + if (flags & HAS_AVX2) + av1_jnt_convolve_2d = av1_jnt_convolve_2d_avx2; + av1_jnt_convolve_2d_copy = av1_jnt_convolve_2d_copy_c; + if (flags & HAS_SSE2) + av1_jnt_convolve_2d_copy = av1_jnt_convolve_2d_copy_sse2; + if (flags & HAS_AVX2) + av1_jnt_convolve_2d_copy = av1_jnt_convolve_2d_copy_avx2; + av1_jnt_convolve_x = av1_jnt_convolve_x_c; + if (flags & HAS_SSE2) + av1_jnt_convolve_x = av1_jnt_convolve_x_sse2; + if (flags & HAS_AVX2) + av1_jnt_convolve_x = av1_jnt_convolve_x_avx2; + av1_jnt_convolve_y = av1_jnt_convolve_y_c; + if (flags & HAS_SSE2) + av1_jnt_convolve_y = av1_jnt_convolve_y_sse2; + if (flags & HAS_AVX2) + av1_jnt_convolve_y = av1_jnt_convolve_y_avx2; + av1_selfguided_restoration = av1_selfguided_restoration_c; + if (flags & HAS_SSE4_1) + av1_selfguided_restoration = av1_selfguided_restoration_sse4_1; + if (flags & HAS_AVX2) + av1_selfguided_restoration = av1_selfguided_restoration_avx2; + av1_upsample_intra_edge = av1_upsample_intra_edge_c; + if (flags & HAS_SSE4_1) + av1_upsample_intra_edge = av1_upsample_intra_edge_sse4_1; + av1_upsample_intra_edge_high = av1_upsample_intra_edge_high_c; + if (flags & HAS_SSE4_1) + av1_upsample_intra_edge_high = av1_upsample_intra_edge_high_sse4_1; + av1_warp_affine = av1_warp_affine_c; + if (flags & HAS_SSE4_1) + av1_warp_affine = av1_warp_affine_sse4_1; + av1_wiener_convolve_add_src = av1_wiener_convolve_add_src_c; + if (flags & HAS_SSE2) + av1_wiener_convolve_add_src = av1_wiener_convolve_add_src_sse2; + if (flags & HAS_AVX2) + av1_wiener_convolve_add_src = av1_wiener_convolve_add_src_avx2; + cdef_filter_block = cdef_filter_block_c; + if (flags & HAS_SSE2) + cdef_filter_block = cdef_filter_block_sse2; + if (flags & HAS_SSSE3) + cdef_filter_block = cdef_filter_block_ssse3; + if (flags & HAS_SSE4_1) + cdef_filter_block = cdef_filter_block_sse4_1; + if (flags & HAS_AVX2) + cdef_filter_block = cdef_filter_block_avx2; + cdef_find_dir = cdef_find_dir_c; + if (flags & HAS_SSE2) + cdef_find_dir = cdef_find_dir_sse2; + if (flags & HAS_SSSE3) + cdef_find_dir = cdef_find_dir_ssse3; + if (flags & HAS_SSE4_1) + cdef_find_dir = cdef_find_dir_sse4_1; + if (flags & HAS_AVX2) + cdef_find_dir = cdef_find_dir_avx2; + cfl_get_luma_subsampling_420_hbd = cfl_get_luma_subsampling_420_hbd_c; + if (flags & HAS_SSSE3) + cfl_get_luma_subsampling_420_hbd = cfl_get_luma_subsampling_420_hbd_ssse3; + if (flags & HAS_AVX2) + cfl_get_luma_subsampling_420_hbd = cfl_get_luma_subsampling_420_hbd_avx2; + cfl_get_luma_subsampling_420_lbd = cfl_get_luma_subsampling_420_lbd_c; + if (flags & HAS_SSSE3) + cfl_get_luma_subsampling_420_lbd = cfl_get_luma_subsampling_420_lbd_ssse3; + if (flags & HAS_AVX2) + cfl_get_luma_subsampling_420_lbd = cfl_get_luma_subsampling_420_lbd_avx2; + cfl_get_luma_subsampling_422_hbd = cfl_get_luma_subsampling_422_hbd_c; + if (flags & HAS_SSSE3) + cfl_get_luma_subsampling_422_hbd = cfl_get_luma_subsampling_422_hbd_ssse3; + if (flags & HAS_AVX2) + cfl_get_luma_subsampling_422_hbd = cfl_get_luma_subsampling_422_hbd_avx2; + cfl_get_luma_subsampling_422_lbd = cfl_get_luma_subsampling_422_lbd_c; + if (flags & HAS_SSSE3) + cfl_get_luma_subsampling_422_lbd = cfl_get_luma_subsampling_422_lbd_ssse3; + if (flags & HAS_AVX2) + cfl_get_luma_subsampling_422_lbd = cfl_get_luma_subsampling_422_lbd_avx2; + cfl_get_luma_subsampling_444_hbd = cfl_get_luma_subsampling_444_hbd_c; + if (flags & HAS_SSSE3) + cfl_get_luma_subsampling_444_hbd = cfl_get_luma_subsampling_444_hbd_ssse3; + if (flags & HAS_AVX2) + cfl_get_luma_subsampling_444_hbd = cfl_get_luma_subsampling_444_hbd_avx2; + cfl_get_luma_subsampling_444_lbd = cfl_get_luma_subsampling_444_lbd_c; + if (flags & HAS_SSSE3) + cfl_get_luma_subsampling_444_lbd = cfl_get_luma_subsampling_444_lbd_ssse3; + if (flags & HAS_AVX2) + cfl_get_luma_subsampling_444_lbd = cfl_get_luma_subsampling_444_lbd_avx2; + copy_rect8_16bit_to_16bit = copy_rect8_16bit_to_16bit_c; + if (flags & HAS_SSE2) + copy_rect8_16bit_to_16bit = copy_rect8_16bit_to_16bit_sse2; + if (flags & HAS_SSSE3) + copy_rect8_16bit_to_16bit = copy_rect8_16bit_to_16bit_ssse3; + if (flags & HAS_SSE4_1) + copy_rect8_16bit_to_16bit = copy_rect8_16bit_to_16bit_sse4_1; + if (flags & HAS_AVX2) + copy_rect8_16bit_to_16bit = copy_rect8_16bit_to_16bit_avx2; + copy_rect8_8bit_to_16bit = copy_rect8_8bit_to_16bit_c; + if (flags & HAS_SSE2) + copy_rect8_8bit_to_16bit = copy_rect8_8bit_to_16bit_sse2; + if (flags & HAS_SSSE3) + copy_rect8_8bit_to_16bit = copy_rect8_8bit_to_16bit_ssse3; + if (flags & HAS_SSE4_1) + copy_rect8_8bit_to_16bit = copy_rect8_8bit_to_16bit_sse4_1; + if (flags & HAS_AVX2) + copy_rect8_8bit_to_16bit = copy_rect8_8bit_to_16bit_avx2; + get_predict_hbd_fn = get_predict_hbd_fn_c; + if (flags & HAS_SSSE3) + get_predict_hbd_fn = get_predict_hbd_fn_ssse3; + if (flags & HAS_AVX2) + get_predict_hbd_fn = get_predict_hbd_fn_avx2; + get_predict_lbd_fn = get_predict_lbd_fn_c; + if (flags & HAS_SSSE3) + get_predict_lbd_fn = get_predict_lbd_fn_ssse3; + if (flags & HAS_AVX2) + get_predict_lbd_fn = get_predict_lbd_fn_avx2; + get_subtract_average_fn = get_subtract_average_fn_c; + if (flags & HAS_SSE2) + get_subtract_average_fn = get_subtract_average_fn_sse2; + if (flags & HAS_AVX2) + get_subtract_average_fn = get_subtract_average_fn_avx2; +} +#endif + +#ifdef __cplusplus +} // extern "C" +#endif + +#endif |