#include <emmintrin.h>
#include "./vpx_dsp_rtcd.h"
#include "vpx_dsp/x86/inv_txfm_sse2.h"
#include "vpx_dsp/x86/transpose_sse2.h"
#include "vpx_dsp/x86/txfm_common_sse2.h"
// File-local inline helper taking a mutable pointer to __m128i (`res`).
// NOTE(review): the name suggests a transpose of four rows of 16-bit lanes
// written back through `res`; the body is not visible in this view, so
// confirm the lane layout and how many elements of `res` are touched.
static INLINE void transpose_16bit_4(__m128i *res) { … }
// Externally visible entry point. Receives a read-only coefficient pointer
// (`input`), a writable byte pointer (`dest`) and an int `stride`; returns
// nothing.
// NOTE(review): by its name this is presumably the SSE2 4x4 inverse DCT for
// blocks with up to 16 coefficients, adding the residual into `dest` with
// `stride` as the row pitch -- confirm against the body and the RTCD header.
void vpx_idct4x4_16_add_sse2(const tran_low_t *input, uint8_t *dest,
int stride) { … }
// Externally visible entry point with the same (input, dest, stride)
// signature as the other *_add_sse2 functions in this file; returns nothing.
// NOTE(review): the "_1" suffix presumably marks the DC-only 4x4 case (a
// single non-zero coefficient) -- confirm against the body.
void vpx_idct4x4_1_add_sse2(const tran_low_t *input, uint8_t *dest,
int stride) { … }
// Non-static function taking a single __m128i array pointer (`in`). The
// pointee is not const, so results may be written back through it.
// NOTE(review): presumably a 4-point inverse DCT pass done in place on `in`;
// the number of vectors consumed is not visible here -- confirm.
void idct4_sse2(__m128i *const in) { … }
// Non-static function with the same signature as idct4_sse2: one mutable
// __m128i array pointer (`in`), no return value.
// NOTE(review): presumably a 4-point inverse ADST pass done in place on
// `in` -- inferred from the name only; confirm against the body.
void iadst4_sse2(__m128i *const in) { … }
// File-local inline helper. `input` is a read-only tran_low_t pointer and
// `in` is a writable __m128i array pointer.
// NOTE(review): presumably loads an 8x8 coefficient block from `input` into
// `in` (likely 8 vectors); the element count and any narrowing of
// tran_low_t are not visible here -- confirm.
static INLINE void load_buffer_8x8(const tran_low_t *const input,
__m128i *const in) { … }
// Externally visible entry point: read-only coefficients (`input`), writable
// destination bytes (`dest`), int `stride`; returns nothing.
// NOTE(review): presumably the full 8x8 inverse DCT (up to 64 coefficients)
// with the result added into `dest` -- confirm against the body.
void vpx_idct8x8_64_add_sse2(const tran_low_t *input, uint8_t *dest,
int stride) { … }
// Externally visible entry point with the common (input, dest, stride)
// signature; returns nothing.
// NOTE(review): the "_12" suffix presumably marks a reduced 8x8 inverse DCT
// path for blocks with at most 12 non-zero coefficients -- confirm the
// precondition callers must satisfy.
void vpx_idct8x8_12_add_sse2(const tran_low_t *input, uint8_t *dest,
int stride) { … }
// File-local inline helper. Takes a writable byte pointer (`dest`), one
// __m128i passed by value (`in_x`) and an int `stride`.
// NOTE(review): presumably adds the residual in `in_x` to two 8-pixel rows
// at `dest` and `dest + stride` and stores them back ("dual") -- inferred
// from the name and parameters; confirm against the body.
static INLINE void recon_and_store_8_dual(uint8_t *const dest,
const __m128i in_x,
const int stride) { … }
// Externally visible entry point with the common (input, dest, stride)
// signature; returns nothing.
// NOTE(review): presumably the DC-only 8x8 case, where one value derived
// from input[0] is added to every destination pixel -- confirm.
void vpx_idct8x8_1_add_sse2(const tran_low_t *input, uint8_t *dest,
int stride) { … }
// Non-static function taking one mutable __m128i array pointer (`in`); no
// return value.
// NOTE(review): presumably an 8-point inverse DCT pass done in place on
// `in`; whether a transpose is included is not visible here -- confirm.
void vpx_idct8_sse2(__m128i *const in) { … }
// Non-static function with the same signature as vpx_idct8_sse2: one mutable
// __m128i array pointer (`in`), no return value.
// NOTE(review): presumably an 8-point inverse ADST pass done in place on
// `in` -- inferred from the name only; confirm against the body.
void iadst8_sse2(__m128i *const in) { … }
// File-local inline helper. `input` is a read-only tran_low_t pointer and
// `in` is a writable __m128i array pointer.
// NOTE(review): presumably loads an 8x8 tile of a 16x16 coefficient block
// into `in`; the source row pitch and number of vectors written are not
// visible here -- confirm.
static INLINE void idct16_load8x8(const tran_low_t *const input,
__m128i *const in) { … }
// Externally visible entry point: read-only coefficients (`input`), writable
// destination bytes (`dest`), int `stride`; returns nothing.
// NOTE(review): presumably the full 16x16 inverse DCT (up to 256
// coefficients) with the result added into `dest` -- confirm.
void vpx_idct16x16_256_add_sse2(const tran_low_t *input, uint8_t *dest,
int stride) { … }
// Externally visible entry point with the common (input, dest, stride)
// signature; returns nothing.
// NOTE(review): the "_38" suffix presumably marks a reduced 16x16 inverse
// DCT path for blocks with at most 38 non-zero coefficients -- confirm the
// precondition callers must satisfy.
void vpx_idct16x16_38_add_sse2(const tran_low_t *input, uint8_t *dest,
int stride) { … }
// Externally visible entry point with the common (input, dest, stride)
// signature; returns nothing.
// NOTE(review): the "_10" suffix presumably marks a reduced 16x16 inverse
// DCT path for blocks with at most 10 non-zero coefficients -- confirm.
void vpx_idct16x16_10_add_sse2(const tran_low_t *input, uint8_t *dest,
int stride) { … }
// File-local inline helper. Takes a writable byte pointer (`dest`) and one
// __m128i passed by value (`in_x`); there is no stride parameter.
// NOTE(review): presumably reconstructs and stores one 16-pixel row at
// `dest` using the value in `in_x`; whether the add is saturating or signed
// is not visible here -- confirm against the body.
static INLINE void recon_and_store_16(uint8_t *const dest, const __m128i in_x) { … }
// Externally visible entry point with the common (input, dest, stride)
// signature; returns nothing.
// NOTE(review): presumably the DC-only 16x16 case, where one value derived
// from input[0] is added to every destination pixel -- confirm.
void vpx_idct16x16_1_add_sse2(const tran_low_t *input, uint8_t *dest,
int stride) { … }
// Non-static function taking one mutable __m128i array pointer (`in`); no
// return value.
// NOTE(review): presumably a 16-point inverse ADST applied to 8 columns at
// a time, in place on `in` -- inferred from the name; confirm how many
// vectors are read and written.
void vpx_iadst16_8col_sse2(__m128i *const in) { … }
// Non-static function taking two mutable __m128i array pointers (`in0`,
// `in1`); no return value.
// NOTE(review): presumably a 16-point inverse DCT pass over a 16x16 block
// split into two halves held in `in0` and `in1`, updated in place --
// confirm the split and whether a transpose is included.
void idct16_sse2(__m128i *const in0, __m128i *const in1) { … }
// Non-static function with the same two-pointer signature as idct16_sse2
// (`in0`, `in1`, both mutable); no return value.
// NOTE(review): presumably the 16-point inverse ADST counterpart, operating
// in place on both halves -- inferred from the name; confirm.
void iadst16_sse2(__m128i *const in0, __m128i *const in1) { … }
// File-local inline helper: reads from a const __m128i array (`in`) and
// writes to a separate __m128i array (`out`).
// NOTE(review): presumably computes the first quarter of the outputs of the
// reduced (<= 34 coefficients) 32-point inverse DCT on an 8x32 strip; the
// array extents of `in`/`out` are not stated here -- confirm.
static INLINE void idct32_34_8x32_quarter_1(const __m128i *const in ,
__m128i *const out ) { … }
// File-local inline helper: const __m128i input array (`in`), writable
// __m128i output array (`out`).
// NOTE(review): presumably computes the second quarter of the reduced
// (<= 34 coefficients) 32-point inverse DCT outputs; array extents are not
// stated here -- confirm.
static INLINE void idct32_34_8x32_quarter_2(const __m128i *const in ,
__m128i *const out ) { … }
// File-local inline helper: const __m128i input array (`in`), writable
// __m128i output array (`out`).
// NOTE(review): presumably combines the quarter_1 and quarter_2 results of
// the reduced 32-point inverse DCT into the first half of the outputs --
// inferred from the name; confirm against the body.
static INLINE void idct32_34_8x32_quarter_1_2(
const __m128i *const in , __m128i *const out ) { … }
// File-local inline helper: const __m128i input array (`in`), writable
// __m128i output array (`out`).
// NOTE(review): presumably computes the third and fourth quarters (the
// second half of the outputs) of the reduced 32-point inverse DCT --
// inferred from the name; confirm.
static INLINE void idct32_34_8x32_quarter_3_4(
const __m128i *const in , __m128i *const out ) { … }
// Non-static function: reads a const __m128i array (`in`) and writes a
// separate __m128i array (`out`); no return value.
// NOTE(review): presumably the complete reduced (<= 34 coefficients)
// 32-point inverse DCT for one 8x32 strip, built from the quarter helpers
// in this file; array extents are not stated here -- confirm.
void idct32_34_8x32_sse2(const __m128i *const in ,
__m128i *const out ) { … }
// Externally visible entry point: read-only coefficients (`input`), writable
// destination bytes (`dest`), int `stride`; returns nothing.
// NOTE(review): the "_34" suffix presumably marks a reduced 32x32 inverse
// DCT path for blocks with at most 34 non-zero coefficients, with the
// result added into `dest` -- confirm the caller precondition.
void vpx_idct32x32_34_add_sse2(const tran_low_t *input, uint8_t *dest,
int stride) { … }
// File-local inline helper: const __m128i input array (`in`), writable
// __m128i output array (`out`).
// NOTE(review): presumably computes the first quarter of the outputs of the
// full (up to 1024 coefficients) 32-point inverse DCT on an 8x32 strip;
// array extents are not stated here -- confirm.
static INLINE void idct32_1024_8x32_quarter_1(
const __m128i *const in , __m128i *const out ) { … }
// File-local inline helper: const __m128i input array (`in`), writable
// __m128i output array (`out`).
// NOTE(review): presumably computes the second quarter of the full 32-point
// inverse DCT outputs -- inferred from the name; confirm.
static INLINE void idct32_1024_8x32_quarter_2(
const __m128i *const in , __m128i *const out ) { … }
// File-local inline helper: const __m128i input array (`in`), writable
// __m128i output array (`out`).
// NOTE(review): presumably combines the quarter_1 and quarter_2 results of
// the full 32-point inverse DCT into the first half of the outputs --
// inferred from the name; confirm.
static INLINE void idct32_1024_8x32_quarter_1_2(
const __m128i *const in , __m128i *const out ) { … }
// File-local inline helper: const __m128i input array (`in`), writable
// __m128i output array (`out`).
// NOTE(review): presumably computes the third and fourth quarters (second
// half of the outputs) of the full 32-point inverse DCT -- inferred from the
// name; confirm.
static INLINE void idct32_1024_8x32_quarter_3_4(
const __m128i *const in , __m128i *const out ) { … }
// Non-static function: reads a const __m128i array (`in`) and writes a
// separate __m128i array (`out`); no return value. Unlike its "_34" sibling
// (idct32_34_8x32_sse2) the name carries no "_sse2" suffix.
// NOTE(review): presumably the complete full-coefficient 32-point inverse
// DCT for one 8x32 strip, built from the quarter helpers -- confirm.
void idct32_1024_8x32(const __m128i *const in ,
__m128i *const out ) { … }
// Externally visible entry point: read-only coefficients (`input`), writable
// destination bytes (`dest`), int `stride`; returns nothing.
// NOTE(review): presumably the full 32x32 inverse DCT (up to 1024
// coefficients) with the result added into `dest` -- confirm.
void vpx_idct32x32_1024_add_sse2(const tran_low_t *input, uint8_t *dest,
int stride) { … }
// Externally visible entry point with the common (input, dest, stride)
// signature; returns nothing.
// NOTE(review): the "_135" suffix presumably marks a reduced 32x32 inverse
// DCT path for blocks with at most 135 non-zero coefficients; which 8x32
// kernel it reuses is not visible here -- confirm.
void vpx_idct32x32_135_add_sse2(const tran_low_t *input, uint8_t *dest,
int stride) { … }
// Externally visible entry point with the common (input, dest, stride)
// signature; returns nothing.
// NOTE(review): presumably the DC-only 32x32 case, where one value derived
// from input[0] is added to every destination pixel -- confirm.
void vpx_idct32x32_1_add_sse2(const tran_low_t *input, uint8_t *dest,
int stride) { … }