summaryrefslogtreecommitdiff
path: root/chromium/third_party/libaom/source/config/linux/ia32/config/av1_rtcd.h
diff options
context:
space:
mode:
authorAllan Sandfeld Jensen <allan.jensen@qt.io>2018-08-28 15:28:34 +0200
committerAllan Sandfeld Jensen <allan.jensen@qt.io>2018-08-28 13:54:51 +0000
commit2a19c63448c84c1805fb1a585c3651318bb86ca7 (patch)
treeeb17888e8531aa6ee5e85721bd553b832a7e5156 /chromium/third_party/libaom/source/config/linux/ia32/config/av1_rtcd.h
parentb014812705fc80bff0a5c120dfcef88f349816dc (diff)
downloadqtwebengine-chromium-2a19c63448c84c1805fb1a585c3651318bb86ca7.tar.gz
BASELINE: Update Chromium to 69.0.3497.70
Change-Id: I2b7b56e4e7a8b26656930def0d4575dc32b900a0 Reviewed-by: Allan Sandfeld Jensen <allan.jensen@qt.io>
Diffstat (limited to 'chromium/third_party/libaom/source/config/linux/ia32/config/av1_rtcd.h')
-rw-r--r--chromium/third_party/libaom/source/config/linux/ia32/config/av1_rtcd.h2225
1 files changed, 2225 insertions, 0 deletions
diff --git a/chromium/third_party/libaom/source/config/linux/ia32/config/av1_rtcd.h b/chromium/third_party/libaom/source/config/linux/ia32/config/av1_rtcd.h
new file mode 100644
index 00000000000..724cd0b6808
--- /dev/null
+++ b/chromium/third_party/libaom/source/config/linux/ia32/config/av1_rtcd.h
@@ -0,0 +1,2225 @@
+// This file is generated. Do not edit.
+#ifndef AV1_RTCD_H_
+#define AV1_RTCD_H_
+
+#ifdef RTCD_C
+#define RTCD_EXTERN
+#else
+#define RTCD_EXTERN extern
+#endif
+
+/*
+ * AV1
+ */
+
+#include "aom/aom_integer.h"
+#include "aom_dsp/txfm_common.h"
+#include "av1/common/av1_txfm.h"
+#include "av1/common/common.h"
+#include "av1/common/convolve.h"
+#include "av1/common/enums.h"
+#include "av1/common/filter.h"
+#include "av1/common/odintrin.h"
+#include "av1/common/quant_common.h"
+#include "av1/common/restoration.h"
+
+struct macroblockd;
+
+/* Encoder forward decls */
+struct macroblock;
+struct txfm_param;
+struct aom_variance_vtable;
+struct search_site_config;
+struct yv12_buffer_config;
+
+/* Function pointers return by CfL functions */
+typedef void (*cfl_subsample_lbd_fn)(const uint8_t* input,
+ int input_stride,
+ uint16_t* output_q3);
+
+typedef void (*cfl_subsample_hbd_fn)(const uint16_t* input,
+ int input_stride,
+ uint16_t* output_q3);
+
+typedef void (*cfl_subtract_average_fn)(const uint16_t* src, int16_t* dst);
+
+typedef void (*cfl_predict_lbd_fn)(const int16_t* src,
+ uint8_t* dst,
+ int dst_stride,
+ int alpha_q3);
+
+typedef void (*cfl_predict_hbd_fn)(const int16_t* src,
+ uint16_t* dst,
+ int dst_stride,
+ int alpha_q3,
+ int bd);
+
+#ifdef __cplusplus
+extern "C" {
+#endif
+
+void apply_selfguided_restoration_c(const uint8_t* dat,
+ int width,
+ int height,
+ int stride,
+ int eps,
+ const int* xqd,
+ uint8_t* dst,
+ int dst_stride,
+ int32_t* tmpbuf,
+ int bit_depth,
+ int highbd);
+void apply_selfguided_restoration_sse4_1(const uint8_t* dat,
+ int width,
+ int height,
+ int stride,
+ int eps,
+ const int* xqd,
+ uint8_t* dst,
+ int dst_stride,
+ int32_t* tmpbuf,
+ int bit_depth,
+ int highbd);
+void apply_selfguided_restoration_avx2(const uint8_t* dat,
+ int width,
+ int height,
+ int stride,
+ int eps,
+ const int* xqd,
+ uint8_t* dst,
+ int dst_stride,
+ int32_t* tmpbuf,
+ int bit_depth,
+ int highbd);
+RTCD_EXTERN void (*apply_selfguided_restoration)(const uint8_t* dat,
+ int width,
+ int height,
+ int stride,
+ int eps,
+ const int* xqd,
+ uint8_t* dst,
+ int dst_stride,
+ int32_t* tmpbuf,
+ int bit_depth,
+ int highbd);
+
+void av1_build_compound_diffwtd_mask_c(uint8_t* mask,
+ DIFFWTD_MASK_TYPE mask_type,
+ const uint8_t* src0,
+ int src0_stride,
+ const uint8_t* src1,
+ int src1_stride,
+ int h,
+ int w);
+void av1_build_compound_diffwtd_mask_sse4_1(uint8_t* mask,
+ DIFFWTD_MASK_TYPE mask_type,
+ const uint8_t* src0,
+ int src0_stride,
+ const uint8_t* src1,
+ int src1_stride,
+ int h,
+ int w);
+RTCD_EXTERN void (*av1_build_compound_diffwtd_mask)(uint8_t* mask,
+ DIFFWTD_MASK_TYPE mask_type,
+ const uint8_t* src0,
+ int src0_stride,
+ const uint8_t* src1,
+ int src1_stride,
+ int h,
+ int w);
+
+void av1_build_compound_diffwtd_mask_d16_c(uint8_t* mask,
+ DIFFWTD_MASK_TYPE mask_type,
+ const CONV_BUF_TYPE* src0,
+ int src0_stride,
+ const CONV_BUF_TYPE* src1,
+ int src1_stride,
+ int h,
+ int w,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_build_compound_diffwtd_mask_d16_sse4_1(uint8_t* mask,
+ DIFFWTD_MASK_TYPE mask_type,
+ const CONV_BUF_TYPE* src0,
+ int src0_stride,
+ const CONV_BUF_TYPE* src1,
+ int src1_stride,
+ int h,
+ int w,
+ ConvolveParams* conv_params,
+ int bd);
+RTCD_EXTERN void (*av1_build_compound_diffwtd_mask_d16)(
+ uint8_t* mask,
+ DIFFWTD_MASK_TYPE mask_type,
+ const CONV_BUF_TYPE* src0,
+ int src0_stride,
+ const CONV_BUF_TYPE* src1,
+ int src1_stride,
+ int h,
+ int w,
+ ConvolveParams* conv_params,
+ int bd);
+
+void av1_build_compound_diffwtd_mask_highbd_c(uint8_t* mask,
+ DIFFWTD_MASK_TYPE mask_type,
+ const uint8_t* src0,
+ int src0_stride,
+ const uint8_t* src1,
+ int src1_stride,
+ int h,
+ int w,
+ int bd);
+void av1_build_compound_diffwtd_mask_highbd_ssse3(uint8_t* mask,
+ DIFFWTD_MASK_TYPE mask_type,
+ const uint8_t* src0,
+ int src0_stride,
+ const uint8_t* src1,
+ int src1_stride,
+ int h,
+ int w,
+ int bd);
+void av1_build_compound_diffwtd_mask_highbd_avx2(uint8_t* mask,
+ DIFFWTD_MASK_TYPE mask_type,
+ const uint8_t* src0,
+ int src0_stride,
+ const uint8_t* src1,
+ int src1_stride,
+ int h,
+ int w,
+ int bd);
+RTCD_EXTERN void (*av1_build_compound_diffwtd_mask_highbd)(
+ uint8_t* mask,
+ DIFFWTD_MASK_TYPE mask_type,
+ const uint8_t* src0,
+ int src0_stride,
+ const uint8_t* src1,
+ int src1_stride,
+ int h,
+ int w,
+ int bd);
+
+void av1_convolve_2d_copy_sr_c(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_convolve_2d_copy_sr_sse2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_convolve_2d_copy_sr_avx2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+RTCD_EXTERN void (*av1_convolve_2d_copy_sr)(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+
+void av1_convolve_2d_scale_c(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_qn,
+ const int x_step_qn,
+ const int subpel_y_q4,
+ const int y_step_qn,
+ ConvolveParams* conv_params);
+void av1_convolve_2d_scale_sse4_1(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_qn,
+ const int x_step_qn,
+ const int subpel_y_q4,
+ const int y_step_qn,
+ ConvolveParams* conv_params);
+RTCD_EXTERN void (*av1_convolve_2d_scale)(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_qn,
+ const int x_step_qn,
+ const int subpel_y_q4,
+ const int y_step_qn,
+ ConvolveParams* conv_params);
+
+void av1_convolve_2d_sr_c(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_convolve_2d_sr_sse2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_convolve_2d_sr_avx2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+RTCD_EXTERN void (*av1_convolve_2d_sr)(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+
+void av1_convolve_horiz_rs_c(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ const int16_t* x_filters,
+ int x0_qn,
+ int x_step_qn);
+void av1_convolve_horiz_rs_sse4_1(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ const int16_t* x_filters,
+ int x0_qn,
+ int x_step_qn);
+RTCD_EXTERN void (*av1_convolve_horiz_rs)(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ const int16_t* x_filters,
+ int x0_qn,
+ int x_step_qn);
+
+void av1_convolve_x_sr_c(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_convolve_x_sr_sse2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_convolve_x_sr_avx2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+RTCD_EXTERN void (*av1_convolve_x_sr)(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+
+void av1_convolve_y_sr_c(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_convolve_y_sr_sse2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_convolve_y_sr_avx2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+RTCD_EXTERN void (*av1_convolve_y_sr)(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+
+void av1_dr_prediction_z1_c(uint8_t* dst,
+ ptrdiff_t stride,
+ int bw,
+ int bh,
+ const uint8_t* above,
+ const uint8_t* left,
+ int upsample_above,
+ int dx,
+ int dy);
+#define av1_dr_prediction_z1 av1_dr_prediction_z1_c
+
+void av1_dr_prediction_z2_c(uint8_t* dst,
+ ptrdiff_t stride,
+ int bw,
+ int bh,
+ const uint8_t* above,
+ const uint8_t* left,
+ int upsample_above,
+ int upsample_left,
+ int dx,
+ int dy);
+#define av1_dr_prediction_z2 av1_dr_prediction_z2_c
+
+void av1_dr_prediction_z3_c(uint8_t* dst,
+ ptrdiff_t stride,
+ int bw,
+ int bh,
+ const uint8_t* above,
+ const uint8_t* left,
+ int upsample_left,
+ int dx,
+ int dy);
+#define av1_dr_prediction_z3 av1_dr_prediction_z3_c
+
+void av1_filter_intra_edge_c(uint8_t* p, int sz, int strength);
+void av1_filter_intra_edge_sse4_1(uint8_t* p, int sz, int strength);
+RTCD_EXTERN void (*av1_filter_intra_edge)(uint8_t* p, int sz, int strength);
+
+void av1_filter_intra_edge_high_c(uint16_t* p, int sz, int strength);
+void av1_filter_intra_edge_high_sse4_1(uint16_t* p, int sz, int strength);
+RTCD_EXTERN void (*av1_filter_intra_edge_high)(uint16_t* p,
+ int sz,
+ int strength);
+
+void av1_filter_intra_predictor_c(uint8_t* dst,
+ ptrdiff_t stride,
+ TX_SIZE tx_size,
+ const uint8_t* above,
+ const uint8_t* left,
+ int mode);
+void av1_filter_intra_predictor_sse4_1(uint8_t* dst,
+ ptrdiff_t stride,
+ TX_SIZE tx_size,
+ const uint8_t* above,
+ const uint8_t* left,
+ int mode);
+RTCD_EXTERN void (*av1_filter_intra_predictor)(uint8_t* dst,
+ ptrdiff_t stride,
+ TX_SIZE tx_size,
+ const uint8_t* above,
+ const uint8_t* left,
+ int mode);
+
+void av1_highbd_convolve8_c(const uint8_t* src,
+ ptrdiff_t src_stride,
+ uint8_t* dst,
+ ptrdiff_t dst_stride,
+ const int16_t* filter_x,
+ int x_step_q4,
+ const int16_t* filter_y,
+ int y_step_q4,
+ int w,
+ int h,
+ int bps);
+#define av1_highbd_convolve8 av1_highbd_convolve8_c
+
+void av1_highbd_convolve8_horiz_c(const uint8_t* src,
+ ptrdiff_t src_stride,
+ uint8_t* dst,
+ ptrdiff_t dst_stride,
+ const int16_t* filter_x,
+ int x_step_q4,
+ const int16_t* filter_y,
+ int y_step_q4,
+ int w,
+ int h,
+ int bps);
+#define av1_highbd_convolve8_horiz av1_highbd_convolve8_horiz_c
+
+void av1_highbd_convolve8_vert_c(const uint8_t* src,
+ ptrdiff_t src_stride,
+ uint8_t* dst,
+ ptrdiff_t dst_stride,
+ const int16_t* filter_x,
+ int x_step_q4,
+ const int16_t* filter_y,
+ int y_step_q4,
+ int w,
+ int h,
+ int bps);
+#define av1_highbd_convolve8_vert av1_highbd_convolve8_vert_c
+
+void av1_highbd_convolve_2d_copy_sr_c(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_convolve_2d_copy_sr_sse2(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_convolve_2d_copy_sr_avx2(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+RTCD_EXTERN void (*av1_highbd_convolve_2d_copy_sr)(
+ const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+
+void av1_highbd_convolve_2d_scale_c(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int x_step_qn,
+ const int subpel_y_q4,
+ const int y_step_qn,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_convolve_2d_scale_sse4_1(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int x_step_qn,
+ const int subpel_y_q4,
+ const int y_step_qn,
+ ConvolveParams* conv_params,
+ int bd);
+RTCD_EXTERN void (*av1_highbd_convolve_2d_scale)(
+ const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int x_step_qn,
+ const int subpel_y_q4,
+ const int y_step_qn,
+ ConvolveParams* conv_params,
+ int bd);
+
+void av1_highbd_convolve_2d_sr_c(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_convolve_2d_sr_ssse3(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_convolve_2d_sr_avx2(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+RTCD_EXTERN void (*av1_highbd_convolve_2d_sr)(
+ const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+
+void av1_highbd_convolve_avg_c(const uint8_t* src,
+ ptrdiff_t src_stride,
+ uint8_t* dst,
+ ptrdiff_t dst_stride,
+ const int16_t* filter_x,
+ int x_step_q4,
+ const int16_t* filter_y,
+ int y_step_q4,
+ int w,
+ int h,
+ int bps);
+#define av1_highbd_convolve_avg av1_highbd_convolve_avg_c
+
+void av1_highbd_convolve_copy_c(const uint8_t* src,
+ ptrdiff_t src_stride,
+ uint8_t* dst,
+ ptrdiff_t dst_stride,
+ const int16_t* filter_x,
+ int x_step_q4,
+ const int16_t* filter_y,
+ int y_step_q4,
+ int w,
+ int h,
+ int bps);
+#define av1_highbd_convolve_copy av1_highbd_convolve_copy_c
+
+void av1_highbd_convolve_horiz_rs_c(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ const int16_t* x_filters,
+ int x0_qn,
+ int x_step_qn,
+ int bd);
+void av1_highbd_convolve_horiz_rs_sse4_1(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ const int16_t* x_filters,
+ int x0_qn,
+ int x_step_qn,
+ int bd);
+RTCD_EXTERN void (*av1_highbd_convolve_horiz_rs)(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ const int16_t* x_filters,
+ int x0_qn,
+ int x_step_qn,
+ int bd);
+
+void av1_highbd_convolve_x_sr_c(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_convolve_x_sr_ssse3(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_convolve_x_sr_avx2(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+RTCD_EXTERN void (*av1_highbd_convolve_x_sr)(
+ const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+
+void av1_highbd_convolve_y_sr_c(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_convolve_y_sr_ssse3(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_convolve_y_sr_avx2(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+RTCD_EXTERN void (*av1_highbd_convolve_y_sr)(
+ const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+
+void av1_highbd_dr_prediction_z1_c(uint16_t* dst,
+ ptrdiff_t stride,
+ int bw,
+ int bh,
+ const uint16_t* above,
+ const uint16_t* left,
+ int upsample_above,
+ int dx,
+ int dy,
+ int bd);
+#define av1_highbd_dr_prediction_z1 av1_highbd_dr_prediction_z1_c
+
+void av1_highbd_dr_prediction_z2_c(uint16_t* dst,
+ ptrdiff_t stride,
+ int bw,
+ int bh,
+ const uint16_t* above,
+ const uint16_t* left,
+ int upsample_above,
+ int upsample_left,
+ int dx,
+ int dy,
+ int bd);
+#define av1_highbd_dr_prediction_z2 av1_highbd_dr_prediction_z2_c
+
+void av1_highbd_dr_prediction_z3_c(uint16_t* dst,
+ ptrdiff_t stride,
+ int bw,
+ int bh,
+ const uint16_t* above,
+ const uint16_t* left,
+ int upsample_left,
+ int dx,
+ int dy,
+ int bd);
+#define av1_highbd_dr_prediction_z3 av1_highbd_dr_prediction_z3_c
+
+void av1_highbd_iwht4x4_16_add_c(const tran_low_t* input,
+ uint8_t* dest,
+ int dest_stride,
+ int bd);
+#define av1_highbd_iwht4x4_16_add av1_highbd_iwht4x4_16_add_c
+
+void av1_highbd_iwht4x4_1_add_c(const tran_low_t* input,
+ uint8_t* dest,
+ int dest_stride,
+ int bd);
+#define av1_highbd_iwht4x4_1_add av1_highbd_iwht4x4_1_add_c
+
+void av1_highbd_jnt_convolve_2d_c(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_jnt_convolve_2d_sse4_1(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_jnt_convolve_2d_avx2(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+RTCD_EXTERN void (*av1_highbd_jnt_convolve_2d)(
+ const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+
+void av1_highbd_jnt_convolve_2d_copy_c(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_jnt_convolve_2d_copy_sse4_1(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_jnt_convolve_2d_copy_avx2(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+RTCD_EXTERN void (*av1_highbd_jnt_convolve_2d_copy)(
+ const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+
+void av1_highbd_jnt_convolve_x_c(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_jnt_convolve_x_sse4_1(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_jnt_convolve_x_avx2(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+RTCD_EXTERN void (*av1_highbd_jnt_convolve_x)(
+ const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+
+void av1_highbd_jnt_convolve_y_c(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_jnt_convolve_y_sse4_1(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+void av1_highbd_jnt_convolve_y_avx2(const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+RTCD_EXTERN void (*av1_highbd_jnt_convolve_y)(
+ const uint16_t* src,
+ int src_stride,
+ uint16_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params,
+ int bd);
+
+void av1_highbd_warp_affine_c(const int32_t* mat,
+ const uint16_t* ref,
+ int width,
+ int height,
+ int stride,
+ uint16_t* pred,
+ int p_col,
+ int p_row,
+ int p_width,
+ int p_height,
+ int p_stride,
+ int subsampling_x,
+ int subsampling_y,
+ int bd,
+ ConvolveParams* conv_params,
+ int16_t alpha,
+ int16_t beta,
+ int16_t gamma,
+ int16_t delta);
+void av1_highbd_warp_affine_sse4_1(const int32_t* mat,
+ const uint16_t* ref,
+ int width,
+ int height,
+ int stride,
+ uint16_t* pred,
+ int p_col,
+ int p_row,
+ int p_width,
+ int p_height,
+ int p_stride,
+ int subsampling_x,
+ int subsampling_y,
+ int bd,
+ ConvolveParams* conv_params,
+ int16_t alpha,
+ int16_t beta,
+ int16_t gamma,
+ int16_t delta);
+RTCD_EXTERN void (*av1_highbd_warp_affine)(const int32_t* mat,
+ const uint16_t* ref,
+ int width,
+ int height,
+ int stride,
+ uint16_t* pred,
+ int p_col,
+ int p_row,
+ int p_width,
+ int p_height,
+ int p_stride,
+ int subsampling_x,
+ int subsampling_y,
+ int bd,
+ ConvolveParams* conv_params,
+ int16_t alpha,
+ int16_t beta,
+ int16_t gamma,
+ int16_t delta);
+
+void av1_highbd_wiener_convolve_add_src_c(const uint8_t* src,
+ ptrdiff_t src_stride,
+ uint8_t* dst,
+ ptrdiff_t dst_stride,
+ const int16_t* filter_x,
+ int x_step_q4,
+ const int16_t* filter_y,
+ int y_step_q4,
+ int w,
+ int h,
+ const ConvolveParams* conv_params,
+ int bps);
+void av1_highbd_wiener_convolve_add_src_ssse3(const uint8_t* src,
+ ptrdiff_t src_stride,
+ uint8_t* dst,
+ ptrdiff_t dst_stride,
+ const int16_t* filter_x,
+ int x_step_q4,
+ const int16_t* filter_y,
+ int y_step_q4,
+ int w,
+ int h,
+ const ConvolveParams* conv_params,
+ int bps);
+void av1_highbd_wiener_convolve_add_src_avx2(const uint8_t* src,
+ ptrdiff_t src_stride,
+ uint8_t* dst,
+ ptrdiff_t dst_stride,
+ const int16_t* filter_x,
+ int x_step_q4,
+ const int16_t* filter_y,
+ int y_step_q4,
+ int w,
+ int h,
+ const ConvolveParams* conv_params,
+ int bps);
+RTCD_EXTERN void (*av1_highbd_wiener_convolve_add_src)(
+ const uint8_t* src,
+ ptrdiff_t src_stride,
+ uint8_t* dst,
+ ptrdiff_t dst_stride,
+ const int16_t* filter_x,
+ int x_step_q4,
+ const int16_t* filter_y,
+ int y_step_q4,
+ int w,
+ int h,
+ const ConvolveParams* conv_params,
+ int bps);
+
+void av1_inv_txfm2d_add_16x16_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+void av1_inv_txfm2d_add_16x16_sse4_1(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+RTCD_EXTERN void (*av1_inv_txfm2d_add_16x16)(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+
+void av1_inv_txfm2d_add_16x32_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+#define av1_inv_txfm2d_add_16x32 av1_inv_txfm2d_add_16x32_c
+
+void av1_inv_txfm2d_add_16x4_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+#define av1_inv_txfm2d_add_16x4 av1_inv_txfm2d_add_16x4_c
+
+void av1_inv_txfm2d_add_16x64_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+#define av1_inv_txfm2d_add_16x64 av1_inv_txfm2d_add_16x64_c
+
+void av1_inv_txfm2d_add_16x8_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+#define av1_inv_txfm2d_add_16x8 av1_inv_txfm2d_add_16x8_c
+
+void av1_inv_txfm2d_add_32x16_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+#define av1_inv_txfm2d_add_32x16 av1_inv_txfm2d_add_32x16_c
+
+void av1_inv_txfm2d_add_32x32_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+void av1_inv_txfm2d_add_32x32_avx2(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+RTCD_EXTERN void (*av1_inv_txfm2d_add_32x32)(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+
+void av1_inv_txfm2d_add_32x64_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+#define av1_inv_txfm2d_add_32x64 av1_inv_txfm2d_add_32x64_c
+
+void av1_inv_txfm2d_add_32x8_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+#define av1_inv_txfm2d_add_32x8 av1_inv_txfm2d_add_32x8_c
+
+void av1_inv_txfm2d_add_4x16_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+#define av1_inv_txfm2d_add_4x16 av1_inv_txfm2d_add_4x16_c
+
+void av1_inv_txfm2d_add_4x4_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+void av1_inv_txfm2d_add_4x4_sse4_1(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+RTCD_EXTERN void (*av1_inv_txfm2d_add_4x4)(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+
+void av1_inv_txfm2d_add_4x8_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+#define av1_inv_txfm2d_add_4x8 av1_inv_txfm2d_add_4x8_c
+
+void av1_inv_txfm2d_add_64x16_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+#define av1_inv_txfm2d_add_64x16 av1_inv_txfm2d_add_64x16_c
+
+void av1_inv_txfm2d_add_64x32_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+#define av1_inv_txfm2d_add_64x32 av1_inv_txfm2d_add_64x32_c
+
+void av1_inv_txfm2d_add_64x64_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+void av1_inv_txfm2d_add_64x64_sse4_1(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+RTCD_EXTERN void (*av1_inv_txfm2d_add_64x64)(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+
+void av1_inv_txfm2d_add_8x16_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+#define av1_inv_txfm2d_add_8x16 av1_inv_txfm2d_add_8x16_c
+
+void av1_inv_txfm2d_add_8x32_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+#define av1_inv_txfm2d_add_8x32 av1_inv_txfm2d_add_8x32_c
+
+void av1_inv_txfm2d_add_8x4_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+#define av1_inv_txfm2d_add_8x4 av1_inv_txfm2d_add_8x4_c
+
+void av1_inv_txfm2d_add_8x8_c(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+void av1_inv_txfm2d_add_8x8_sse4_1(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+RTCD_EXTERN void (*av1_inv_txfm2d_add_8x8)(const int32_t* input,
+ uint16_t* output,
+ int stride,
+ TX_TYPE tx_type,
+ int bd);
+
+void av1_inv_txfm_add_c(const tran_low_t* dqcoeff,
+ uint8_t* dst,
+ int stride,
+ const TxfmParam* txfm_param);
+void av1_inv_txfm_add_ssse3(const tran_low_t* dqcoeff,
+ uint8_t* dst,
+ int stride,
+ const TxfmParam* txfm_param);
+void av1_inv_txfm_add_avx2(const tran_low_t* dqcoeff,
+ uint8_t* dst,
+ int stride,
+ const TxfmParam* txfm_param);
+RTCD_EXTERN void (*av1_inv_txfm_add)(const tran_low_t* dqcoeff,
+ uint8_t* dst,
+ int stride,
+ const TxfmParam* txfm_param);
+
+void av1_jnt_convolve_2d_c(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_jnt_convolve_2d_ssse3(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_jnt_convolve_2d_avx2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+RTCD_EXTERN void (*av1_jnt_convolve_2d)(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+
+void av1_jnt_convolve_2d_copy_c(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_jnt_convolve_2d_copy_sse2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_jnt_convolve_2d_copy_avx2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+RTCD_EXTERN void (*av1_jnt_convolve_2d_copy)(
+ const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+
+void av1_jnt_convolve_x_c(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_jnt_convolve_x_sse2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_jnt_convolve_x_avx2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+RTCD_EXTERN void (*av1_jnt_convolve_x)(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+
+void av1_jnt_convolve_y_c(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_jnt_convolve_y_sse2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+void av1_jnt_convolve_y_avx2(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+RTCD_EXTERN void (*av1_jnt_convolve_y)(const uint8_t* src,
+ int src_stride,
+ uint8_t* dst,
+ int dst_stride,
+ int w,
+ int h,
+ InterpFilterParams* filter_params_x,
+ InterpFilterParams* filter_params_y,
+ const int subpel_x_q4,
+ const int subpel_y_q4,
+ ConvolveParams* conv_params);
+
+void av1_selfguided_restoration_c(const uint8_t* dgd8,
+ int width,
+ int height,
+ int dgd_stride,
+ int32_t* flt0,
+ int32_t* flt1,
+ int flt_stride,
+ int sgr_params_idx,
+ int bit_depth,
+ int highbd);
+void av1_selfguided_restoration_sse4_1(const uint8_t* dgd8,
+ int width,
+ int height,
+ int dgd_stride,
+ int32_t* flt0,
+ int32_t* flt1,
+ int flt_stride,
+ int sgr_params_idx,
+ int bit_depth,
+ int highbd);
+void av1_selfguided_restoration_avx2(const uint8_t* dgd8,
+ int width,
+ int height,
+ int dgd_stride,
+ int32_t* flt0,
+ int32_t* flt1,
+ int flt_stride,
+ int sgr_params_idx,
+ int bit_depth,
+ int highbd);
+RTCD_EXTERN void (*av1_selfguided_restoration)(const uint8_t* dgd8,
+ int width,
+ int height,
+ int dgd_stride,
+ int32_t* flt0,
+ int32_t* flt1,
+ int flt_stride,
+ int sgr_params_idx,
+ int bit_depth,
+ int highbd);
+
+void av1_upsample_intra_edge_c(uint8_t* p, int sz);
+void av1_upsample_intra_edge_sse4_1(uint8_t* p, int sz);
+RTCD_EXTERN void (*av1_upsample_intra_edge)(uint8_t* p, int sz);
+
+void av1_upsample_intra_edge_high_c(uint16_t* p, int sz, int bd);
+void av1_upsample_intra_edge_high_sse4_1(uint16_t* p, int sz, int bd);
+RTCD_EXTERN void (*av1_upsample_intra_edge_high)(uint16_t* p, int sz, int bd);
+
+void av1_warp_affine_c(const int32_t* mat,
+ const uint8_t* ref,
+ int width,
+ int height,
+ int stride,
+ uint8_t* pred,
+ int p_col,
+ int p_row,
+ int p_width,
+ int p_height,
+ int p_stride,
+ int subsampling_x,
+ int subsampling_y,
+ ConvolveParams* conv_params,
+ int16_t alpha,
+ int16_t beta,
+ int16_t gamma,
+ int16_t delta);
+void av1_warp_affine_sse4_1(const int32_t* mat,
+ const uint8_t* ref,
+ int width,
+ int height,
+ int stride,
+ uint8_t* pred,
+ int p_col,
+ int p_row,
+ int p_width,
+ int p_height,
+ int p_stride,
+ int subsampling_x,
+ int subsampling_y,
+ ConvolveParams* conv_params,
+ int16_t alpha,
+ int16_t beta,
+ int16_t gamma,
+ int16_t delta);
+RTCD_EXTERN void (*av1_warp_affine)(const int32_t* mat,
+ const uint8_t* ref,
+ int width,
+ int height,
+ int stride,
+ uint8_t* pred,
+ int p_col,
+ int p_row,
+ int p_width,
+ int p_height,
+ int p_stride,
+ int subsampling_x,
+ int subsampling_y,
+ ConvolveParams* conv_params,
+ int16_t alpha,
+ int16_t beta,
+ int16_t gamma,
+ int16_t delta);
+
+void av1_wiener_convolve_add_src_c(const uint8_t* src,
+ ptrdiff_t src_stride,
+ uint8_t* dst,
+ ptrdiff_t dst_stride,
+ const int16_t* filter_x,
+ int x_step_q4,
+ const int16_t* filter_y,
+ int y_step_q4,
+ int w,
+ int h,
+ const ConvolveParams* conv_params);
+void av1_wiener_convolve_add_src_sse2(const uint8_t* src,
+ ptrdiff_t src_stride,
+ uint8_t* dst,
+ ptrdiff_t dst_stride,
+ const int16_t* filter_x,
+ int x_step_q4,
+ const int16_t* filter_y,
+ int y_step_q4,
+ int w,
+ int h,
+ const ConvolveParams* conv_params);
+void av1_wiener_convolve_add_src_avx2(const uint8_t* src,
+ ptrdiff_t src_stride,
+ uint8_t* dst,
+ ptrdiff_t dst_stride,
+ const int16_t* filter_x,
+ int x_step_q4,
+ const int16_t* filter_y,
+ int y_step_q4,
+ int w,
+ int h,
+ const ConvolveParams* conv_params);
+RTCD_EXTERN void (*av1_wiener_convolve_add_src)(
+ const uint8_t* src,
+ ptrdiff_t src_stride,
+ uint8_t* dst,
+ ptrdiff_t dst_stride,
+ const int16_t* filter_x,
+ int x_step_q4,
+ const int16_t* filter_y,
+ int y_step_q4,
+ int w,
+ int h,
+ const ConvolveParams* conv_params);
+
+void cdef_filter_block_c(uint8_t* dst8,
+ uint16_t* dst16,
+ int dstride,
+ const uint16_t* in,
+ int pri_strength,
+ int sec_strength,
+ int dir,
+ int pri_damping,
+ int sec_damping,
+ int bsize,
+ int max,
+ int coeff_shift);
+void cdef_filter_block_sse2(uint8_t* dst8,
+ uint16_t* dst16,
+ int dstride,
+ const uint16_t* in,
+ int pri_strength,
+ int sec_strength,
+ int dir,
+ int pri_damping,
+ int sec_damping,
+ int bsize,
+ int max,
+ int coeff_shift);
+void cdef_filter_block_ssse3(uint8_t* dst8,
+ uint16_t* dst16,
+ int dstride,
+ const uint16_t* in,
+ int pri_strength,
+ int sec_strength,
+ int dir,
+ int pri_damping,
+ int sec_damping,
+ int bsize,
+ int max,
+ int coeff_shift);
+void cdef_filter_block_sse4_1(uint8_t* dst8,
+ uint16_t* dst16,
+ int dstride,
+ const uint16_t* in,
+ int pri_strength,
+ int sec_strength,
+ int dir,
+ int pri_damping,
+ int sec_damping,
+ int bsize,
+ int max,
+ int coeff_shift);
+void cdef_filter_block_avx2(uint8_t* dst8,
+ uint16_t* dst16,
+ int dstride,
+ const uint16_t* in,
+ int pri_strength,
+ int sec_strength,
+ int dir,
+ int pri_damping,
+ int sec_damping,
+ int bsize,
+ int max,
+ int coeff_shift);
+RTCD_EXTERN void (*cdef_filter_block)(uint8_t* dst8,
+ uint16_t* dst16,
+ int dstride,
+ const uint16_t* in,
+ int pri_strength,
+ int sec_strength,
+ int dir,
+ int pri_damping,
+ int sec_damping,
+ int bsize,
+ int max,
+ int coeff_shift);
+
+int cdef_find_dir_c(const uint16_t* img,
+ int stride,
+ int32_t* var,
+ int coeff_shift);
+int cdef_find_dir_sse2(const uint16_t* img,
+ int stride,
+ int32_t* var,
+ int coeff_shift);
+int cdef_find_dir_ssse3(const uint16_t* img,
+ int stride,
+ int32_t* var,
+ int coeff_shift);
+int cdef_find_dir_sse4_1(const uint16_t* img,
+ int stride,
+ int32_t* var,
+ int coeff_shift);
+int cdef_find_dir_avx2(const uint16_t* img,
+ int stride,
+ int32_t* var,
+ int coeff_shift);
+RTCD_EXTERN int (*cdef_find_dir)(const uint16_t* img,
+ int stride,
+ int32_t* var,
+ int coeff_shift);
+
+cfl_subsample_hbd_fn cfl_get_luma_subsampling_420_hbd_c(TX_SIZE tx_size);
+cfl_subsample_hbd_fn cfl_get_luma_subsampling_420_hbd_ssse3(TX_SIZE tx_size);
+cfl_subsample_hbd_fn cfl_get_luma_subsampling_420_hbd_avx2(TX_SIZE tx_size);
+RTCD_EXTERN cfl_subsample_hbd_fn (*cfl_get_luma_subsampling_420_hbd)(
+ TX_SIZE tx_size);
+
+cfl_subsample_lbd_fn cfl_get_luma_subsampling_420_lbd_c(TX_SIZE tx_size);
+cfl_subsample_lbd_fn cfl_get_luma_subsampling_420_lbd_ssse3(TX_SIZE tx_size);
+cfl_subsample_lbd_fn cfl_get_luma_subsampling_420_lbd_avx2(TX_SIZE tx_size);
+RTCD_EXTERN cfl_subsample_lbd_fn (*cfl_get_luma_subsampling_420_lbd)(
+ TX_SIZE tx_size);
+
+cfl_subsample_hbd_fn cfl_get_luma_subsampling_422_hbd_c(TX_SIZE tx_size);
+cfl_subsample_hbd_fn cfl_get_luma_subsampling_422_hbd_ssse3(TX_SIZE tx_size);
+cfl_subsample_hbd_fn cfl_get_luma_subsampling_422_hbd_avx2(TX_SIZE tx_size);
+RTCD_EXTERN cfl_subsample_hbd_fn (*cfl_get_luma_subsampling_422_hbd)(
+ TX_SIZE tx_size);
+
+cfl_subsample_lbd_fn cfl_get_luma_subsampling_422_lbd_c(TX_SIZE tx_size);
+cfl_subsample_lbd_fn cfl_get_luma_subsampling_422_lbd_ssse3(TX_SIZE tx_size);
+cfl_subsample_lbd_fn cfl_get_luma_subsampling_422_lbd_avx2(TX_SIZE tx_size);
+RTCD_EXTERN cfl_subsample_lbd_fn (*cfl_get_luma_subsampling_422_lbd)(
+ TX_SIZE tx_size);
+
+cfl_subsample_hbd_fn cfl_get_luma_subsampling_444_hbd_c(TX_SIZE tx_size);
+cfl_subsample_hbd_fn cfl_get_luma_subsampling_444_hbd_ssse3(TX_SIZE tx_size);
+cfl_subsample_hbd_fn cfl_get_luma_subsampling_444_hbd_avx2(TX_SIZE tx_size);
+RTCD_EXTERN cfl_subsample_hbd_fn (*cfl_get_luma_subsampling_444_hbd)(
+ TX_SIZE tx_size);
+
+cfl_subsample_lbd_fn cfl_get_luma_subsampling_444_lbd_c(TX_SIZE tx_size);
+cfl_subsample_lbd_fn cfl_get_luma_subsampling_444_lbd_ssse3(TX_SIZE tx_size);
+cfl_subsample_lbd_fn cfl_get_luma_subsampling_444_lbd_avx2(TX_SIZE tx_size);
+RTCD_EXTERN cfl_subsample_lbd_fn (*cfl_get_luma_subsampling_444_lbd)(
+ TX_SIZE tx_size);
+
+void copy_rect8_16bit_to_16bit_c(uint16_t* dst,
+ int dstride,
+ const uint16_t* src,
+ int sstride,
+ int v,
+ int h);
+void copy_rect8_16bit_to_16bit_sse2(uint16_t* dst,
+ int dstride,
+ const uint16_t* src,
+ int sstride,
+ int v,
+ int h);
+void copy_rect8_16bit_to_16bit_ssse3(uint16_t* dst,
+ int dstride,
+ const uint16_t* src,
+ int sstride,
+ int v,
+ int h);
+void copy_rect8_16bit_to_16bit_sse4_1(uint16_t* dst,
+ int dstride,
+ const uint16_t* src,
+ int sstride,
+ int v,
+ int h);
+void copy_rect8_16bit_to_16bit_avx2(uint16_t* dst,
+ int dstride,
+ const uint16_t* src,
+ int sstride,
+ int v,
+ int h);
+RTCD_EXTERN void (*copy_rect8_16bit_to_16bit)(uint16_t* dst,
+ int dstride,
+ const uint16_t* src,
+ int sstride,
+ int v,
+ int h);
+
+void copy_rect8_8bit_to_16bit_c(uint16_t* dst,
+ int dstride,
+ const uint8_t* src,
+ int sstride,
+ int v,
+ int h);
+void copy_rect8_8bit_to_16bit_sse2(uint16_t* dst,
+ int dstride,
+ const uint8_t* src,
+ int sstride,
+ int v,
+ int h);
+void copy_rect8_8bit_to_16bit_ssse3(uint16_t* dst,
+ int dstride,
+ const uint8_t* src,
+ int sstride,
+ int v,
+ int h);
+void copy_rect8_8bit_to_16bit_sse4_1(uint16_t* dst,
+ int dstride,
+ const uint8_t* src,
+ int sstride,
+ int v,
+ int h);
+void copy_rect8_8bit_to_16bit_avx2(uint16_t* dst,
+ int dstride,
+ const uint8_t* src,
+ int sstride,
+ int v,
+ int h);
+RTCD_EXTERN void (*copy_rect8_8bit_to_16bit)(uint16_t* dst,
+ int dstride,
+ const uint8_t* src,
+ int sstride,
+ int v,
+ int h);
+
+cfl_predict_hbd_fn get_predict_hbd_fn_c(TX_SIZE tx_size);
+cfl_predict_hbd_fn get_predict_hbd_fn_ssse3(TX_SIZE tx_size);
+cfl_predict_hbd_fn get_predict_hbd_fn_avx2(TX_SIZE tx_size);
+RTCD_EXTERN cfl_predict_hbd_fn (*get_predict_hbd_fn)(TX_SIZE tx_size);
+
+cfl_predict_lbd_fn get_predict_lbd_fn_c(TX_SIZE tx_size);
+cfl_predict_lbd_fn get_predict_lbd_fn_ssse3(TX_SIZE tx_size);
+cfl_predict_lbd_fn get_predict_lbd_fn_avx2(TX_SIZE tx_size);
+RTCD_EXTERN cfl_predict_lbd_fn (*get_predict_lbd_fn)(TX_SIZE tx_size);
+
+cfl_subtract_average_fn get_subtract_average_fn_c(TX_SIZE tx_size);
+cfl_subtract_average_fn get_subtract_average_fn_sse2(TX_SIZE tx_size);
+cfl_subtract_average_fn get_subtract_average_fn_avx2(TX_SIZE tx_size);
+RTCD_EXTERN cfl_subtract_average_fn (*get_subtract_average_fn)(TX_SIZE tx_size);
+
+void av1_rtcd(void);
+
+#ifdef RTCD_C
+#include "aom_ports/x86.h"
+static void setup_rtcd_internal(void) {
+ int flags = x86_simd_caps();
+
+ (void)flags;
+
+ apply_selfguided_restoration = apply_selfguided_restoration_c;
+ if (flags & HAS_SSE4_1)
+ apply_selfguided_restoration = apply_selfguided_restoration_sse4_1;
+ if (flags & HAS_AVX2)
+ apply_selfguided_restoration = apply_selfguided_restoration_avx2;
+ av1_build_compound_diffwtd_mask = av1_build_compound_diffwtd_mask_c;
+ if (flags & HAS_SSE4_1)
+ av1_build_compound_diffwtd_mask = av1_build_compound_diffwtd_mask_sse4_1;
+ av1_build_compound_diffwtd_mask_d16 = av1_build_compound_diffwtd_mask_d16_c;
+ if (flags & HAS_SSE4_1)
+ av1_build_compound_diffwtd_mask_d16 =
+ av1_build_compound_diffwtd_mask_d16_sse4_1;
+ av1_build_compound_diffwtd_mask_highbd =
+ av1_build_compound_diffwtd_mask_highbd_c;
+ if (flags & HAS_SSSE3)
+ av1_build_compound_diffwtd_mask_highbd =
+ av1_build_compound_diffwtd_mask_highbd_ssse3;
+ if (flags & HAS_AVX2)
+ av1_build_compound_diffwtd_mask_highbd =
+ av1_build_compound_diffwtd_mask_highbd_avx2;
+ av1_convolve_2d_copy_sr = av1_convolve_2d_copy_sr_c;
+ if (flags & HAS_SSE2)
+ av1_convolve_2d_copy_sr = av1_convolve_2d_copy_sr_sse2;
+ if (flags & HAS_AVX2)
+ av1_convolve_2d_copy_sr = av1_convolve_2d_copy_sr_avx2;
+ av1_convolve_2d_scale = av1_convolve_2d_scale_c;
+ if (flags & HAS_SSE4_1)
+ av1_convolve_2d_scale = av1_convolve_2d_scale_sse4_1;
+ av1_convolve_2d_sr = av1_convolve_2d_sr_c;
+ if (flags & HAS_SSE2)
+ av1_convolve_2d_sr = av1_convolve_2d_sr_sse2;
+ if (flags & HAS_AVX2)
+ av1_convolve_2d_sr = av1_convolve_2d_sr_avx2;
+ av1_convolve_horiz_rs = av1_convolve_horiz_rs_c;
+ if (flags & HAS_SSE4_1)
+ av1_convolve_horiz_rs = av1_convolve_horiz_rs_sse4_1;
+ av1_convolve_x_sr = av1_convolve_x_sr_c;
+ if (flags & HAS_SSE2)
+ av1_convolve_x_sr = av1_convolve_x_sr_sse2;
+ if (flags & HAS_AVX2)
+ av1_convolve_x_sr = av1_convolve_x_sr_avx2;
+ av1_convolve_y_sr = av1_convolve_y_sr_c;
+ if (flags & HAS_SSE2)
+ av1_convolve_y_sr = av1_convolve_y_sr_sse2;
+ if (flags & HAS_AVX2)
+ av1_convolve_y_sr = av1_convolve_y_sr_avx2;
+ av1_filter_intra_edge = av1_filter_intra_edge_c;
+ if (flags & HAS_SSE4_1)
+ av1_filter_intra_edge = av1_filter_intra_edge_sse4_1;
+ av1_filter_intra_edge_high = av1_filter_intra_edge_high_c;
+ if (flags & HAS_SSE4_1)
+ av1_filter_intra_edge_high = av1_filter_intra_edge_high_sse4_1;
+ av1_filter_intra_predictor = av1_filter_intra_predictor_c;
+ if (flags & HAS_SSE4_1)
+ av1_filter_intra_predictor = av1_filter_intra_predictor_sse4_1;
+ av1_highbd_convolve_2d_copy_sr = av1_highbd_convolve_2d_copy_sr_c;
+ if (flags & HAS_SSE2)
+ av1_highbd_convolve_2d_copy_sr = av1_highbd_convolve_2d_copy_sr_sse2;
+ if (flags & HAS_AVX2)
+ av1_highbd_convolve_2d_copy_sr = av1_highbd_convolve_2d_copy_sr_avx2;
+ av1_highbd_convolve_2d_scale = av1_highbd_convolve_2d_scale_c;
+ if (flags & HAS_SSE4_1)
+ av1_highbd_convolve_2d_scale = av1_highbd_convolve_2d_scale_sse4_1;
+ av1_highbd_convolve_2d_sr = av1_highbd_convolve_2d_sr_c;
+ if (flags & HAS_SSSE3)
+ av1_highbd_convolve_2d_sr = av1_highbd_convolve_2d_sr_ssse3;
+ if (flags & HAS_AVX2)
+ av1_highbd_convolve_2d_sr = av1_highbd_convolve_2d_sr_avx2;
+ av1_highbd_convolve_horiz_rs = av1_highbd_convolve_horiz_rs_c;
+ if (flags & HAS_SSE4_1)
+ av1_highbd_convolve_horiz_rs = av1_highbd_convolve_horiz_rs_sse4_1;
+ av1_highbd_convolve_x_sr = av1_highbd_convolve_x_sr_c;
+ if (flags & HAS_SSSE3)
+ av1_highbd_convolve_x_sr = av1_highbd_convolve_x_sr_ssse3;
+ if (flags & HAS_AVX2)
+ av1_highbd_convolve_x_sr = av1_highbd_convolve_x_sr_avx2;
+ av1_highbd_convolve_y_sr = av1_highbd_convolve_y_sr_c;
+ if (flags & HAS_SSSE3)
+ av1_highbd_convolve_y_sr = av1_highbd_convolve_y_sr_ssse3;
+ if (flags & HAS_AVX2)
+ av1_highbd_convolve_y_sr = av1_highbd_convolve_y_sr_avx2;
+ av1_highbd_jnt_convolve_2d = av1_highbd_jnt_convolve_2d_c;
+ if (flags & HAS_SSE4_1)
+ av1_highbd_jnt_convolve_2d = av1_highbd_jnt_convolve_2d_sse4_1;
+ if (flags & HAS_AVX2)
+ av1_highbd_jnt_convolve_2d = av1_highbd_jnt_convolve_2d_avx2;
+ av1_highbd_jnt_convolve_2d_copy = av1_highbd_jnt_convolve_2d_copy_c;
+ if (flags & HAS_SSE4_1)
+ av1_highbd_jnt_convolve_2d_copy = av1_highbd_jnt_convolve_2d_copy_sse4_1;
+ if (flags & HAS_AVX2)
+ av1_highbd_jnt_convolve_2d_copy = av1_highbd_jnt_convolve_2d_copy_avx2;
+ av1_highbd_jnt_convolve_x = av1_highbd_jnt_convolve_x_c;
+ if (flags & HAS_SSE4_1)
+ av1_highbd_jnt_convolve_x = av1_highbd_jnt_convolve_x_sse4_1;
+ if (flags & HAS_AVX2)
+ av1_highbd_jnt_convolve_x = av1_highbd_jnt_convolve_x_avx2;
+ av1_highbd_jnt_convolve_y = av1_highbd_jnt_convolve_y_c;
+ if (flags & HAS_SSE4_1)
+ av1_highbd_jnt_convolve_y = av1_highbd_jnt_convolve_y_sse4_1;
+ if (flags & HAS_AVX2)
+ av1_highbd_jnt_convolve_y = av1_highbd_jnt_convolve_y_avx2;
+ av1_highbd_warp_affine = av1_highbd_warp_affine_c;
+ if (flags & HAS_SSE4_1)
+ av1_highbd_warp_affine = av1_highbd_warp_affine_sse4_1;
+ av1_highbd_wiener_convolve_add_src = av1_highbd_wiener_convolve_add_src_c;
+ if (flags & HAS_SSSE3)
+ av1_highbd_wiener_convolve_add_src =
+ av1_highbd_wiener_convolve_add_src_ssse3;
+ if (flags & HAS_AVX2)
+ av1_highbd_wiener_convolve_add_src =
+ av1_highbd_wiener_convolve_add_src_avx2;
+ av1_inv_txfm2d_add_16x16 = av1_inv_txfm2d_add_16x16_c;
+ if (flags & HAS_SSE4_1)
+ av1_inv_txfm2d_add_16x16 = av1_inv_txfm2d_add_16x16_sse4_1;
+ av1_inv_txfm2d_add_32x32 = av1_inv_txfm2d_add_32x32_c;
+ if (flags & HAS_AVX2)
+ av1_inv_txfm2d_add_32x32 = av1_inv_txfm2d_add_32x32_avx2;
+ av1_inv_txfm2d_add_4x4 = av1_inv_txfm2d_add_4x4_c;
+ if (flags & HAS_SSE4_1)
+ av1_inv_txfm2d_add_4x4 = av1_inv_txfm2d_add_4x4_sse4_1;
+ av1_inv_txfm2d_add_64x64 = av1_inv_txfm2d_add_64x64_c;
+ if (flags & HAS_SSE4_1)
+ av1_inv_txfm2d_add_64x64 = av1_inv_txfm2d_add_64x64_sse4_1;
+ av1_inv_txfm2d_add_8x8 = av1_inv_txfm2d_add_8x8_c;
+ if (flags & HAS_SSE4_1)
+ av1_inv_txfm2d_add_8x8 = av1_inv_txfm2d_add_8x8_sse4_1;
+ av1_inv_txfm_add = av1_inv_txfm_add_c;
+ if (flags & HAS_SSSE3)
+ av1_inv_txfm_add = av1_inv_txfm_add_ssse3;
+ if (flags & HAS_AVX2)
+ av1_inv_txfm_add = av1_inv_txfm_add_avx2;
+ av1_jnt_convolve_2d = av1_jnt_convolve_2d_c;
+ if (flags & HAS_SSSE3)
+ av1_jnt_convolve_2d = av1_jnt_convolve_2d_ssse3;
+ if (flags & HAS_AVX2)
+ av1_jnt_convolve_2d = av1_jnt_convolve_2d_avx2;
+ av1_jnt_convolve_2d_copy = av1_jnt_convolve_2d_copy_c;
+ if (flags & HAS_SSE2)
+ av1_jnt_convolve_2d_copy = av1_jnt_convolve_2d_copy_sse2;
+ if (flags & HAS_AVX2)
+ av1_jnt_convolve_2d_copy = av1_jnt_convolve_2d_copy_avx2;
+ av1_jnt_convolve_x = av1_jnt_convolve_x_c;
+ if (flags & HAS_SSE2)
+ av1_jnt_convolve_x = av1_jnt_convolve_x_sse2;
+ if (flags & HAS_AVX2)
+ av1_jnt_convolve_x = av1_jnt_convolve_x_avx2;
+ av1_jnt_convolve_y = av1_jnt_convolve_y_c;
+ if (flags & HAS_SSE2)
+ av1_jnt_convolve_y = av1_jnt_convolve_y_sse2;
+ if (flags & HAS_AVX2)
+ av1_jnt_convolve_y = av1_jnt_convolve_y_avx2;
+ av1_selfguided_restoration = av1_selfguided_restoration_c;
+ if (flags & HAS_SSE4_1)
+ av1_selfguided_restoration = av1_selfguided_restoration_sse4_1;
+ if (flags & HAS_AVX2)
+ av1_selfguided_restoration = av1_selfguided_restoration_avx2;
+ av1_upsample_intra_edge = av1_upsample_intra_edge_c;
+ if (flags & HAS_SSE4_1)
+ av1_upsample_intra_edge = av1_upsample_intra_edge_sse4_1;
+ av1_upsample_intra_edge_high = av1_upsample_intra_edge_high_c;
+ if (flags & HAS_SSE4_1)
+ av1_upsample_intra_edge_high = av1_upsample_intra_edge_high_sse4_1;
+ av1_warp_affine = av1_warp_affine_c;
+ if (flags & HAS_SSE4_1)
+ av1_warp_affine = av1_warp_affine_sse4_1;
+ av1_wiener_convolve_add_src = av1_wiener_convolve_add_src_c;
+ if (flags & HAS_SSE2)
+ av1_wiener_convolve_add_src = av1_wiener_convolve_add_src_sse2;
+ if (flags & HAS_AVX2)
+ av1_wiener_convolve_add_src = av1_wiener_convolve_add_src_avx2;
+ cdef_filter_block = cdef_filter_block_c;
+ if (flags & HAS_SSE2)
+ cdef_filter_block = cdef_filter_block_sse2;
+ if (flags & HAS_SSSE3)
+ cdef_filter_block = cdef_filter_block_ssse3;
+ if (flags & HAS_SSE4_1)
+ cdef_filter_block = cdef_filter_block_sse4_1;
+ if (flags & HAS_AVX2)
+ cdef_filter_block = cdef_filter_block_avx2;
+ cdef_find_dir = cdef_find_dir_c;
+ if (flags & HAS_SSE2)
+ cdef_find_dir = cdef_find_dir_sse2;
+ if (flags & HAS_SSSE3)
+ cdef_find_dir = cdef_find_dir_ssse3;
+ if (flags & HAS_SSE4_1)
+ cdef_find_dir = cdef_find_dir_sse4_1;
+ if (flags & HAS_AVX2)
+ cdef_find_dir = cdef_find_dir_avx2;
+ cfl_get_luma_subsampling_420_hbd = cfl_get_luma_subsampling_420_hbd_c;
+ if (flags & HAS_SSSE3)
+ cfl_get_luma_subsampling_420_hbd = cfl_get_luma_subsampling_420_hbd_ssse3;
+ if (flags & HAS_AVX2)
+ cfl_get_luma_subsampling_420_hbd = cfl_get_luma_subsampling_420_hbd_avx2;
+ cfl_get_luma_subsampling_420_lbd = cfl_get_luma_subsampling_420_lbd_c;
+ if (flags & HAS_SSSE3)
+ cfl_get_luma_subsampling_420_lbd = cfl_get_luma_subsampling_420_lbd_ssse3;
+ if (flags & HAS_AVX2)
+ cfl_get_luma_subsampling_420_lbd = cfl_get_luma_subsampling_420_lbd_avx2;
+ cfl_get_luma_subsampling_422_hbd = cfl_get_luma_subsampling_422_hbd_c;
+ if (flags & HAS_SSSE3)
+ cfl_get_luma_subsampling_422_hbd = cfl_get_luma_subsampling_422_hbd_ssse3;
+ if (flags & HAS_AVX2)
+ cfl_get_luma_subsampling_422_hbd = cfl_get_luma_subsampling_422_hbd_avx2;
+ cfl_get_luma_subsampling_422_lbd = cfl_get_luma_subsampling_422_lbd_c;
+ if (flags & HAS_SSSE3)
+ cfl_get_luma_subsampling_422_lbd = cfl_get_luma_subsampling_422_lbd_ssse3;
+ if (flags & HAS_AVX2)
+ cfl_get_luma_subsampling_422_lbd = cfl_get_luma_subsampling_422_lbd_avx2;
+ cfl_get_luma_subsampling_444_hbd = cfl_get_luma_subsampling_444_hbd_c;
+ if (flags & HAS_SSSE3)
+ cfl_get_luma_subsampling_444_hbd = cfl_get_luma_subsampling_444_hbd_ssse3;
+ if (flags & HAS_AVX2)
+ cfl_get_luma_subsampling_444_hbd = cfl_get_luma_subsampling_444_hbd_avx2;
+ cfl_get_luma_subsampling_444_lbd = cfl_get_luma_subsampling_444_lbd_c;
+ if (flags & HAS_SSSE3)
+ cfl_get_luma_subsampling_444_lbd = cfl_get_luma_subsampling_444_lbd_ssse3;
+ if (flags & HAS_AVX2)
+ cfl_get_luma_subsampling_444_lbd = cfl_get_luma_subsampling_444_lbd_avx2;
+ copy_rect8_16bit_to_16bit = copy_rect8_16bit_to_16bit_c;
+ if (flags & HAS_SSE2)
+ copy_rect8_16bit_to_16bit = copy_rect8_16bit_to_16bit_sse2;
+ if (flags & HAS_SSSE3)
+ copy_rect8_16bit_to_16bit = copy_rect8_16bit_to_16bit_ssse3;
+ if (flags & HAS_SSE4_1)
+ copy_rect8_16bit_to_16bit = copy_rect8_16bit_to_16bit_sse4_1;
+ if (flags & HAS_AVX2)
+ copy_rect8_16bit_to_16bit = copy_rect8_16bit_to_16bit_avx2;
+ copy_rect8_8bit_to_16bit = copy_rect8_8bit_to_16bit_c;
+ if (flags & HAS_SSE2)
+ copy_rect8_8bit_to_16bit = copy_rect8_8bit_to_16bit_sse2;
+ if (flags & HAS_SSSE3)
+ copy_rect8_8bit_to_16bit = copy_rect8_8bit_to_16bit_ssse3;
+ if (flags & HAS_SSE4_1)
+ copy_rect8_8bit_to_16bit = copy_rect8_8bit_to_16bit_sse4_1;
+ if (flags & HAS_AVX2)
+ copy_rect8_8bit_to_16bit = copy_rect8_8bit_to_16bit_avx2;
+ get_predict_hbd_fn = get_predict_hbd_fn_c;
+ if (flags & HAS_SSSE3)
+ get_predict_hbd_fn = get_predict_hbd_fn_ssse3;
+ if (flags & HAS_AVX2)
+ get_predict_hbd_fn = get_predict_hbd_fn_avx2;
+ get_predict_lbd_fn = get_predict_lbd_fn_c;
+ if (flags & HAS_SSSE3)
+ get_predict_lbd_fn = get_predict_lbd_fn_ssse3;
+ if (flags & HAS_AVX2)
+ get_predict_lbd_fn = get_predict_lbd_fn_avx2;
+ get_subtract_average_fn = get_subtract_average_fn_c;
+ if (flags & HAS_SSE2)
+ get_subtract_average_fn = get_subtract_average_fn_sse2;
+ if (flags & HAS_AVX2)
+ get_subtract_average_fn = get_subtract_average_fn_avx2;
+}
+#endif
+
+#ifdef __cplusplus
+} // extern "C"
+#endif
+
+#endif