#ifndef VP9_RTCD_H_
#define VP9_RTCD_H_
#ifdef RTCD_C
#define RTCD_EXTERN
#else
#define RTCD_EXTERN …
#endif
#include "vp9/common/vp9_common.h"
#include "vp9/common/vp9_enums.h"
#include "vp9/common/vp9_filter.h"
#include "vpx/vpx_integer.h"
struct macroblockd;
struct macroblock;
struct macroblock_plane;
struct vp9_sad_table;
struct ScanOrder;
struct search_site_config;
struct mv;
int_mv;
struct yv12_buffer_config;
#ifdef __cplusplus
extern "C" {
#endif
int64_t vp9_block_error_c(const tran_low_t* coeff,
const tran_low_t* dqcoeff,
intptr_t block_size,
int64_t* ssz);
int64_t vp9_block_error_sse2(const tran_low_t* coeff,
const tran_low_t* dqcoeff,
intptr_t block_size,
int64_t* ssz);
int64_t vp9_block_error_avx2(const tran_low_t* coeff,
const tran_low_t* dqcoeff,
intptr_t block_size,
int64_t* ssz);
RTCD_EXTERN int64_t (*vp9_block_error)(const tran_low_t* coeff,
const tran_low_t* dqcoeff,
intptr_t block_size,
int64_t* ssz);
int64_t vp9_block_error_fp_c(const tran_low_t* coeff,
const tran_low_t* dqcoeff,
int block_size);
int64_t vp9_block_error_fp_sse2(const tran_low_t* coeff,
const tran_low_t* dqcoeff,
int block_size);
int64_t vp9_block_error_fp_avx2(const tran_low_t* coeff,
const tran_low_t* dqcoeff,
int block_size);
RTCD_EXTERN int64_t (*vp9_block_error_fp)(const tran_low_t* coeff,
const tran_low_t* dqcoeff,
int block_size);
int vp9_denoiser_filter_c(const uint8_t* sig,
int sig_stride,
const uint8_t* mc_avg,
int mc_avg_stride,
uint8_t* avg,
int avg_stride,
int increase_denoising,
BLOCK_SIZE bs,
int motion_magnitude);
int vp9_denoiser_filter_sse2(const uint8_t* sig,
int sig_stride,
const uint8_t* mc_avg,
int mc_avg_stride,
uint8_t* avg,
int avg_stride,
int increase_denoising,
BLOCK_SIZE bs,
int motion_magnitude);
#define vp9_denoiser_filter …
int vp9_diamond_search_sad_c(const struct macroblock* x,
const struct search_site_config* cfg,
struct mv* ref_mv,
uint32_t start_mv_sad,
struct mv* best_mv,
int search_param,
int sad_per_bit,
int* num00,
const struct vp9_sad_table* sad_fn_ptr,
const struct mv* center_mv);
#define vp9_diamond_search_sad …
void vp9_fht16x16_c(const int16_t* input,
tran_low_t* output,
int stride,
int tx_type);
void vp9_fht16x16_sse2(const int16_t* input,
tran_low_t* output,
int stride,
int tx_type);
#define vp9_fht16x16 …
void vp9_fht4x4_c(const int16_t* input,
tran_low_t* output,
int stride,
int tx_type);
void vp9_fht4x4_sse2(const int16_t* input,
tran_low_t* output,
int stride,
int tx_type);
#define vp9_fht4x4 …
void vp9_fht8x8_c(const int16_t* input,
tran_low_t* output,
int stride,
int tx_type);
void vp9_fht8x8_sse2(const int16_t* input,
tran_low_t* output,
int stride,
int tx_type);
#define vp9_fht8x8 …
void vp9_filter_by_weight16x16_c(const uint8_t* src,
int src_stride,
uint8_t* dst,
int dst_stride,
int src_weight);
void vp9_filter_by_weight16x16_sse2(const uint8_t* src,
int src_stride,
uint8_t* dst,
int dst_stride,
int src_weight);
#define vp9_filter_by_weight16x16 …
void vp9_filter_by_weight8x8_c(const uint8_t* src,
int src_stride,
uint8_t* dst,
int dst_stride,
int src_weight);
void vp9_filter_by_weight8x8_sse2(const uint8_t* src,
int src_stride,
uint8_t* dst,
int dst_stride,
int src_weight);
#define vp9_filter_by_weight8x8 …
void vp9_fwht4x4_c(const int16_t* input, tran_low_t* output, int stride);
void vp9_fwht4x4_sse2(const int16_t* input, tran_low_t* output, int stride);
#define vp9_fwht4x4 …
int64_t vp9_highbd_block_error_c(const tran_low_t* coeff,
const tran_low_t* dqcoeff,
intptr_t block_size,
int64_t* ssz,
int bd);
int64_t vp9_highbd_block_error_sse2(const tran_low_t* coeff,
const tran_low_t* dqcoeff,
intptr_t block_size,
int64_t* ssz,
int bd);
#define vp9_highbd_block_error …
void vp9_highbd_fht16x16_c(const int16_t* input,
tran_low_t* output,
int stride,
int tx_type);
#define vp9_highbd_fht16x16 …
void vp9_highbd_fht4x4_c(const int16_t* input,
tran_low_t* output,
int stride,
int tx_type);
#define vp9_highbd_fht4x4 …
void vp9_highbd_fht8x8_c(const int16_t* input,
tran_low_t* output,
int stride,
int tx_type);
#define vp9_highbd_fht8x8 …
void vp9_highbd_fwht4x4_c(const int16_t* input, tran_low_t* output, int stride);
#define vp9_highbd_fwht4x4 …
void vp9_highbd_iht16x16_256_add_c(const tran_low_t* input,
uint16_t* dest,
int stride,
int tx_type,
int bd);
void vp9_highbd_iht16x16_256_add_sse4_1(const tran_low_t* input,
uint16_t* dest,
int stride,
int tx_type,
int bd);
RTCD_EXTERN void (*vp9_highbd_iht16x16_256_add)(const tran_low_t* input,
uint16_t* dest,
int stride,
int tx_type,
int bd);
void vp9_highbd_iht4x4_16_add_c(const tran_low_t* input,
uint16_t* dest,
int stride,
int tx_type,
int bd);
void vp9_highbd_iht4x4_16_add_sse4_1(const tran_low_t* input,
uint16_t* dest,
int stride,
int tx_type,
int bd);
RTCD_EXTERN void (*vp9_highbd_iht4x4_16_add)(const tran_low_t* input,
uint16_t* dest,
int stride,
int tx_type,
int bd);
void vp9_highbd_iht8x8_64_add_c(const tran_low_t* input,
uint16_t* dest,
int stride,
int tx_type,
int bd);
void vp9_highbd_iht8x8_64_add_sse4_1(const tran_low_t* input,
uint16_t* dest,
int stride,
int tx_type,
int bd);
RTCD_EXTERN void (*vp9_highbd_iht8x8_64_add)(const tran_low_t* input,
uint16_t* dest,
int stride,
int tx_type,
int bd);
void vp9_highbd_mbpost_proc_across_ip_c(uint16_t* src,
int pitch,
int rows,
int cols,
int flimit);
#define vp9_highbd_mbpost_proc_across_ip …
void vp9_highbd_mbpost_proc_down_c(uint16_t* dst,
int pitch,
int rows,
int cols,
int flimit);
#define vp9_highbd_mbpost_proc_down …
void vp9_highbd_post_proc_down_and_across_c(const uint16_t* src_ptr,
uint16_t* dst_ptr,
int src_pixels_per_line,
int dst_pixels_per_line,
int rows,
int cols,
int flimit);
#define vp9_highbd_post_proc_down_and_across …
void vp9_highbd_quantize_fp_c(const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
void vp9_highbd_quantize_fp_avx2(const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
RTCD_EXTERN void (*vp9_highbd_quantize_fp)(
const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
void vp9_highbd_quantize_fp_32x32_c(
const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
void vp9_highbd_quantize_fp_32x32_avx2(
const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
RTCD_EXTERN void (*vp9_highbd_quantize_fp_32x32)(
const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
void vp9_highbd_temporal_filter_apply_c(const uint8_t* frame1,
unsigned int stride,
const uint8_t* frame2,
unsigned int block_width,
unsigned int block_height,
int strength,
int* blk_fw,
int use_32x32,
uint32_t* accumulator,
uint16_t* count);
#define vp9_highbd_temporal_filter_apply …
void vp9_iht16x16_256_add_c(const tran_low_t* input,
uint8_t* dest,
int stride,
int tx_type);
void vp9_iht16x16_256_add_sse2(const tran_low_t* input,
uint8_t* dest,
int stride,
int tx_type);
#define vp9_iht16x16_256_add …
void vp9_iht4x4_16_add_c(const tran_low_t* input,
uint8_t* dest,
int stride,
int tx_type);
void vp9_iht4x4_16_add_sse2(const tran_low_t* input,
uint8_t* dest,
int stride,
int tx_type);
#define vp9_iht4x4_16_add …
void vp9_iht8x8_64_add_c(const tran_low_t* input,
uint8_t* dest,
int stride,
int tx_type);
void vp9_iht8x8_64_add_sse2(const tran_low_t* input,
uint8_t* dest,
int stride,
int tx_type);
#define vp9_iht8x8_64_add …
void vp9_quantize_fp_c(const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
void vp9_quantize_fp_sse2(const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
void vp9_quantize_fp_ssse3(const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
void vp9_quantize_fp_avx2(const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
RTCD_EXTERN void (*vp9_quantize_fp)(
const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
void vp9_quantize_fp_32x32_c(const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
void vp9_quantize_fp_32x32_ssse3(const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
void vp9_quantize_fp_32x32_avx2(const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
RTCD_EXTERN void (*vp9_quantize_fp_32x32)(
const tran_low_t* coeff_ptr,
intptr_t n_coeffs,
const struct macroblock_plane* const mb_plane,
tran_low_t* qcoeff_ptr,
tran_low_t* dqcoeff_ptr,
const int16_t* dequant_ptr,
uint16_t* eob_ptr,
const struct ScanOrder* const scan_order);
void vp9_scale_and_extend_frame_c(const struct yv12_buffer_config* src,
struct yv12_buffer_config* dst,
INTERP_FILTER filter_type,
int phase_scaler);
void vp9_scale_and_extend_frame_ssse3(const struct yv12_buffer_config* src,
struct yv12_buffer_config* dst,
INTERP_FILTER filter_type,
int phase_scaler);
RTCD_EXTERN void (*vp9_scale_and_extend_frame)(
const struct yv12_buffer_config* src,
struct yv12_buffer_config* dst,
INTERP_FILTER filter_type,
int phase_scaler);
void vp9_rtcd(void);
#ifdef RTCD_C
#include "vpx_ports/x86.h"
static void setup_rtcd_internal(void) {
int flags = x86_simd_caps();
(void)flags;
vp9_block_error = vp9_block_error_sse2;
if (flags & HAS_AVX2)
vp9_block_error = vp9_block_error_avx2;
vp9_block_error_fp = vp9_block_error_fp_sse2;
if (flags & HAS_AVX2)
vp9_block_error_fp = vp9_block_error_fp_avx2;
vp9_highbd_iht16x16_256_add = vp9_highbd_iht16x16_256_add_c;
if (flags & HAS_SSE4_1)
vp9_highbd_iht16x16_256_add = vp9_highbd_iht16x16_256_add_sse4_1;
vp9_highbd_iht4x4_16_add = vp9_highbd_iht4x4_16_add_c;
if (flags & HAS_SSE4_1)
vp9_highbd_iht4x4_16_add = vp9_highbd_iht4x4_16_add_sse4_1;
vp9_highbd_iht8x8_64_add = vp9_highbd_iht8x8_64_add_c;
if (flags & HAS_SSE4_1)
vp9_highbd_iht8x8_64_add = vp9_highbd_iht8x8_64_add_sse4_1;
vp9_highbd_quantize_fp = vp9_highbd_quantize_fp_c;
if (flags & HAS_AVX2)
vp9_highbd_quantize_fp = vp9_highbd_quantize_fp_avx2;
vp9_highbd_quantize_fp_32x32 = vp9_highbd_quantize_fp_32x32_c;
if (flags & HAS_AVX2)
vp9_highbd_quantize_fp_32x32 = vp9_highbd_quantize_fp_32x32_avx2;
vp9_quantize_fp = vp9_quantize_fp_sse2;
if (flags & HAS_SSSE3)
vp9_quantize_fp = vp9_quantize_fp_ssse3;
if (flags & HAS_AVX2)
vp9_quantize_fp = vp9_quantize_fp_avx2;
vp9_quantize_fp_32x32 = vp9_quantize_fp_32x32_c;
if (flags & HAS_SSSE3)
vp9_quantize_fp_32x32 = vp9_quantize_fp_32x32_ssse3;
if (flags & HAS_AVX2)
vp9_quantize_fp_32x32 = vp9_quantize_fp_32x32_avx2;
vp9_scale_and_extend_frame = vp9_scale_and_extend_frame_c;
if (flags & HAS_SSSE3)
vp9_scale_and_extend_frame = vp9_scale_and_extend_frame_ssse3;
}
#endif
#ifdef __cplusplus
}
#endif
#endif