#ifndef AOM_AOM_DSP_X86_MEM_SSE2_H_
#define AOM_AOM_DSP_X86_MEM_SSE2_H_
#include <emmintrin.h>
#include <string.h>
#include "config/aom_config.h"
#include "aom/aom_integer.h"
// Takes an untyped read-only pointer `src` and returns an int16_t.
// NOTE(review): the body is not visible in this view. The `loadu_` prefix
// suggests a 2-byte read from `src` that tolerates unaligned addresses --
// confirm against the implementation.
static inline int16_t loadu_int16(const void *src) { … }
// Takes an untyped read-only pointer `src` and returns an int32_t.
// NOTE(review): the body is not visible in this view. The `loadu_` prefix
// suggests a 4-byte read from `src` that tolerates unaligned addresses --
// confirm against the implementation.
static inline int32_t loadu_int32(const void *src) { … }
// Takes an untyped read-only pointer `src` and returns an int64_t.
// NOTE(review): the body is not visible in this view. The `loadu_` prefix
// suggests an 8-byte read from `src` that tolerates unaligned addresses --
// confirm against the implementation.
static inline int64_t loadu_int64(const void *src) { … }
// Takes a destination pointer `d` and a 128-bit integer vector `s` (by value);
// returns nothing.
// NOTE(review): the body is not visible in this view. The name suggests it
// writes the upper 64 bits of `s` to `d` -- confirm against the implementation.
// NOTE(review): this identifier starts with an underscore and imitates the
// `_mm_` naming of the compiler's intrinsic headers. File-scope identifiers
// beginning with an underscore are reserved in C, so a rename would be safer;
// that would require updating every caller, so it is only flagged here.
static inline void _mm_storeh_epi64(__m128i *const d, const __m128i s) { … }
// Takes an untyped read-only pointer `src` and a 128-bit integer vector `s`
// (by value) and returns a 128-bit integer vector.
// NOTE(review): the body is not visible in this view. The name suggests the
// result is `s` with its upper 64 bits replaced by 8 bytes read from `src` --
// confirm against the implementation.
static inline __m128i loadh_epi64(const void *const src, const __m128i s) { … }
// Takes an untyped read-only pointer `src` and an `int` row pitch
// `byte_stride`; returns a single 128-bit integer vector.
// NOTE(review): the body is not visible in this view. The name suggests four
// rows of 4 bytes, `byte_stride` bytes apart, are packed into one register;
// the row order inside the register cannot be determined from here -- confirm.
// NOTE(review): the stride is `int` here, whereas most other helpers in this
// header take `ptrdiff_t`.
static inline __m128i load_8bit_4x4_to_1_reg_sse2(const void *const src,
const int byte_stride) { … }
// Takes an untyped read-only pointer `src` and an `int` row pitch
// `byte_stride`; returns a single 128-bit integer vector.
// NOTE(review): the body is not visible in this view. The name suggests two
// rows of 8 bytes, `byte_stride` bytes apart, are packed into one register;
// which row lands in which half cannot be determined from here -- confirm.
// NOTE(review): the stride is `int` here, whereas most other helpers in this
// header take `ptrdiff_t`.
static inline __m128i load_8bit_8x2_to_1_reg_sse2(const void *const src,
const int byte_stride) { … }
// Takes a read-only array of 128-bit vectors `s`, a byte destination `d` and
// a `ptrdiff_t` row pitch `stride`; returns nothing.
// NOTE(review): the body is not visible in this view. The name suggests two
// 16-byte registers (presumably s[0] and s[1]) are written out as four rows
// of 8 bytes, `stride` bytes apart -- confirm the register-half to row mapping
// against the implementation.
static inline void store_8bit_8x4_from_16x2(const __m128i *const s,
uint8_t *const d,
const ptrdiff_t stride) { … }
// Takes a read-only array of 128-bit vectors `s`, a byte destination `d` and
// a `ptrdiff_t` row pitch `stride`; returns nothing.
// NOTE(review): the body is not visible in this view. The name suggests four
// rows of 4 bytes are written, presumably one row from each of s[0..3] --
// confirm how many elements of `s` are read.
static inline void store_8bit_4x4(const __m128i *const s, uint8_t *const d,
const ptrdiff_t stride) { … }
// Takes one 128-bit vector `s` (by value), a byte destination `d` and a
// `ptrdiff_t` row pitch `stride`; returns nothing.
// NOTE(review): the body is not visible in this view. Unlike store_8bit_4x4,
// `s` is a single register, so presumably its 16 bytes are split into four
// 4-byte rows written `stride` bytes apart -- confirm the row order.
static inline void store_8bit_4x4_sse2(const __m128i s, uint8_t *const d,
const ptrdiff_t stride) { … }
// Takes a read-only byte pointer `s`, a `ptrdiff_t` row pitch `stride` and an
// output array of 128-bit vectors `d`; returns nothing.
// NOTE(review): the body is not visible in this view. The name suggests four
// rows of 4 bytes are read into d[0..3], one row per register -- confirm the
// number of elements written to `d`.
static inline void load_8bit_4x4(const uint8_t *const s, const ptrdiff_t stride,
__m128i *const d) { … }
// Takes a read-only byte pointer `s`, a `ptrdiff_t` row pitch `stride` and an
// output array of 128-bit vectors `d`; returns nothing.
// NOTE(review): the body is not visible in this view. Assuming the WxH naming
// used elsewhere in this header, this presumably reads eight rows of 4 bytes
// into d[0..7] -- confirm.
static inline void load_8bit_4x8(const uint8_t *const s, const ptrdiff_t stride,
__m128i *const d) { … }
// Takes a read-only byte pointer `s`, a `ptrdiff_t` row pitch `stride` and an
// output array of 128-bit vectors `d`; returns nothing.
// NOTE(review): the body is not visible in this view. Assuming the WxH naming
// used elsewhere in this header, this presumably reads four rows of 8 bytes
// into d[0..3] -- confirm.
static inline void load_8bit_8x4(const uint8_t *const s, const ptrdiff_t stride,
__m128i *const d) { … }
// Takes a read-only byte pointer `s`, a `ptrdiff_t` row pitch `stride` and an
// output array of 128-bit vectors `d`; returns nothing.
// NOTE(review): the body is not visible in this view. The name suggests four
// full 16-byte rows are read into d[0..3], with the `loadu` prefix implying no
// alignment requirement on `s` -- confirm.
static inline void loadu_8bit_16x4(const uint8_t *const s,
const ptrdiff_t stride, __m128i *const d) { … }
// Takes a read-only byte pointer `s`, a `ptrdiff_t` row pitch `stride` and an
// output array of 128-bit vectors `d`; returns nothing.
// NOTE(review): the body is not visible in this view. The name suggests eight
// rows of 8 bytes are read into d[0..7] -- confirm.
static inline void load_8bit_8x8(const uint8_t *const s, const ptrdiff_t stride,
__m128i *const d) { … }
// Takes a read-only byte pointer `s`, a `ptrdiff_t` row pitch `stride` and an
// output array of 128-bit vectors `d`; returns nothing.
// NOTE(review): the body is not visible in this view. The name suggests eight
// full 16-byte rows are read into d[0..7].
// NOTE(review): a separate loadu_8bit_16x8 exists with the same signature, so
// this variant may use aligned loads; if it does, `s` and `stride` must keep
// every row 16-byte aligned -- confirm before calling with arbitrary pointers.
static inline void load_8bit_16x8(const uint8_t *const s,
const ptrdiff_t stride, __m128i *const d) { … }
// Takes a read-only byte pointer `s`, a `ptrdiff_t` row pitch `stride` and an
// output array of 128-bit vectors `d`; returns nothing.
// NOTE(review): the body is not visible in this view. The name suggests eight
// full 16-byte rows are read into d[0..7], with the `loadu` prefix implying no
// alignment requirement on `s` -- confirm.
static inline void loadu_8bit_16x8(const uint8_t *const s,
const ptrdiff_t stride, __m128i *const d) { … }
// Takes a read-only array of 128-bit vectors `s`, a byte destination `d` and
// a `ptrdiff_t` row pitch `stride`; returns nothing.
// NOTE(review): the body is not visible in this view. The name suggests eight
// rows of 8 bytes are written, presumably from the low halves of s[0..7] --
// confirm.
static inline void store_8bit_8x8(const __m128i *const s, uint8_t *const d,
const ptrdiff_t stride) { … }
// Takes a read-only array of 128-bit vectors `s`, a byte destination `d` and
// a `ptrdiff_t` row pitch `stride`; returns nothing.
// NOTE(review): the body is not visible in this view. The name suggests four
// full 16-byte rows are written from s[0..3], with the `storeu` prefix
// implying no alignment requirement on `d` -- confirm.
static inline void storeu_8bit_16x4(const __m128i *const s, uint8_t *const d,
const ptrdiff_t stride) { … }
#endif