#ifndef VPX_VPX_DSP_X86_FWD_TXFM_SSE2_H_
#define VPX_VPX_DSP_X86_FWD_TXFM_SSE2_H_
#ifdef __cplusplus
extern "C" {
#endif
#define pair_set_epi32(a, b) …
static INLINE __m128i k_madd_epi32(__m128i a, __m128i b) { … }
static INLINE __m128i k_packs_epi64(__m128i a, __m128i b) { … }
static INLINE int check_epi16_overflow_x2(const __m128i *preg0,
const __m128i *preg1) { … }
static INLINE int check_epi16_overflow_x4(const __m128i *preg0,
const __m128i *preg1,
const __m128i *preg2,
const __m128i *preg3) { … }
static INLINE int check_epi16_overflow_x8(
const __m128i *preg0, const __m128i *preg1, const __m128i *preg2,
const __m128i *preg3, const __m128i *preg4, const __m128i *preg5,
const __m128i *preg6, const __m128i *preg7) { … }
static INLINE int check_epi16_overflow_x12(
const __m128i *preg0, const __m128i *preg1, const __m128i *preg2,
const __m128i *preg3, const __m128i *preg4, const __m128i *preg5,
const __m128i *preg6, const __m128i *preg7, const __m128i *preg8,
const __m128i *preg9, const __m128i *preg10, const __m128i *preg11) { … }
static INLINE int check_epi16_overflow_x16(
const __m128i *preg0, const __m128i *preg1, const __m128i *preg2,
const __m128i *preg3, const __m128i *preg4, const __m128i *preg5,
const __m128i *preg6, const __m128i *preg7, const __m128i *preg8,
const __m128i *preg9, const __m128i *preg10, const __m128i *preg11,
const __m128i *preg12, const __m128i *preg13, const __m128i *preg14,
const __m128i *preg15) { … }
static INLINE int check_epi16_overflow_x32(
const __m128i *preg0, const __m128i *preg1, const __m128i *preg2,
const __m128i *preg3, const __m128i *preg4, const __m128i *preg5,
const __m128i *preg6, const __m128i *preg7, const __m128i *preg8,
const __m128i *preg9, const __m128i *preg10, const __m128i *preg11,
const __m128i *preg12, const __m128i *preg13, const __m128i *preg14,
const __m128i *preg15, const __m128i *preg16, const __m128i *preg17,
const __m128i *preg18, const __m128i *preg19, const __m128i *preg20,
const __m128i *preg21, const __m128i *preg22, const __m128i *preg23,
const __m128i *preg24, const __m128i *preg25, const __m128i *preg26,
const __m128i *preg27, const __m128i *preg28, const __m128i *preg29,
const __m128i *preg30, const __m128i *preg31) { … }
static INLINE int k_check_epi32_overflow_4(const __m128i *preg0,
const __m128i *preg1,
const __m128i *preg2,
const __m128i *preg3,
const __m128i *zero) { … }
static INLINE int k_check_epi32_overflow_8(
const __m128i *preg0, const __m128i *preg1, const __m128i *preg2,
const __m128i *preg3, const __m128i *preg4, const __m128i *preg5,
const __m128i *preg6, const __m128i *preg7, const __m128i *zero) { … }
static INLINE int k_check_epi32_overflow_16(
const __m128i *preg0, const __m128i *preg1, const __m128i *preg2,
const __m128i *preg3, const __m128i *preg4, const __m128i *preg5,
const __m128i *preg6, const __m128i *preg7, const __m128i *preg8,
const __m128i *preg9, const __m128i *preg10, const __m128i *preg11,
const __m128i *preg12, const __m128i *preg13, const __m128i *preg14,
const __m128i *preg15, const __m128i *zero) { … }
static INLINE int k_check_epi32_overflow_32(
const __m128i *preg0, const __m128i *preg1, const __m128i *preg2,
const __m128i *preg3, const __m128i *preg4, const __m128i *preg5,
const __m128i *preg6, const __m128i *preg7, const __m128i *preg8,
const __m128i *preg9, const __m128i *preg10, const __m128i *preg11,
const __m128i *preg12, const __m128i *preg13, const __m128i *preg14,
const __m128i *preg15, const __m128i *preg16, const __m128i *preg17,
const __m128i *preg18, const __m128i *preg19, const __m128i *preg20,
const __m128i *preg21, const __m128i *preg22, const __m128i *preg23,
const __m128i *preg24, const __m128i *preg25, const __m128i *preg26,
const __m128i *preg27, const __m128i *preg28, const __m128i *preg29,
const __m128i *preg30, const __m128i *preg31, const __m128i *zero) { … }
static INLINE void store_output(const __m128i *poutput, tran_low_t *dst_ptr) { … }
static INLINE void storeu_output(const __m128i *poutput, tran_low_t *dst_ptr) { … }
static INLINE __m128i mult_round_shift(const __m128i *pin0, const __m128i *pin1,
const __m128i *pmultiplier,
const __m128i *prounding,
const int shift) { … }
static INLINE void transpose_and_output8x8(
const __m128i *pin00, const __m128i *pin01, const __m128i *pin02,
const __m128i *pin03, const __m128i *pin04, const __m128i *pin05,
const __m128i *pin06, const __m128i *pin07, const int pass,
int16_t *out0_ptr, tran_low_t *out1_ptr) { … }
#ifdef __cplusplus
}
#endif
#endif