/* * Copyright (c) 2016, Alliance for Open Media. All rights reserved * * This source code is subject to the terms of the BSD 2 Clause License and * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License * was not distributed with this source code in the LICENSE file, you can * obtain it at www.aomedia.org/license/software. If the Alliance for Open * Media Patent License 1.0 was not distributed with this source code in the * PATENTS file, you can obtain it at www.aomedia.org/license/patent. */ #ifndef AOM_DSP_X86_FWD_TXFM_AVX2_H #define AOM_DSP_X86_FWD_TXFM_AVX2_H #include "./aom_config.h" static INLINE void storeu_output_avx2(const __m256i *coeff, tran_low_t *out) { if (sizeof(tran_low_t) == 4) { const __m256i zero = _mm256_setzero_si256(); const __m256i sign = _mm256_cmpgt_epi16(zero, *coeff); __m256i x0 = _mm256_unpacklo_epi16(*coeff, sign); __m256i x1 = _mm256_unpackhi_epi16(*coeff, sign); __m256i y0 = _mm256_permute2x128_si256(x0, x1, 0x20); __m256i y1 = _mm256_permute2x128_si256(x0, x1, 0x31); _mm256_storeu_si256((__m256i *)out, y0); _mm256_storeu_si256((__m256i *)(out + 8), y1); } else { _mm256_storeu_si256((__m256i *)out, *coeff); } } #endif // AOM_DSP_X86_FWD_TXFM_AVX2_H