diff options
Diffstat (limited to 'third_party/aom/aom_ports')
-rw-r--r-- | third_party/aom/aom_ports/aom_once.h | 138 | ||||
-rw-r--r-- | third_party/aom/aom_ports/aom_ports.cmake | 81 | ||||
-rw-r--r-- | third_party/aom/aom_ports/aom_timer.h | 111 | ||||
-rw-r--r-- | third_party/aom/aom_ports/arm.h | 41 | ||||
-rw-r--r-- | third_party/aom/aom_ports/arm_cpudetect.c | 150 | ||||
-rw-r--r-- | third_party/aom/aom_ports/bitops.h | 78 | ||||
-rw-r--r-- | third_party/aom/aom_ports/emmintrin_compat.h | 56 | ||||
-rw-r--r-- | third_party/aom/aom_ports/emms.asm | 41 | ||||
-rw-r--r-- | third_party/aom/aom_ports/mem.h | 69 | ||||
-rw-r--r-- | third_party/aom/aom_ports/mem_ops.h | 228 | ||||
-rw-r--r-- | third_party/aom/aom_ports/mem_ops_aligned.h | 173 | ||||
-rw-r--r-- | third_party/aom/aom_ports/msvc.h | 75 | ||||
-rw-r--r-- | third_party/aom/aom_ports/ppc.h | 30 | ||||
-rw-r--r-- | third_party/aom/aom_ports/ppc_cpudetect.c | 82 | ||||
-rw-r--r-- | third_party/aom/aom_ports/sanitizer.h | 38 | ||||
-rw-r--r-- | third_party/aom/aom_ports/system_state.h | 23 | ||||
-rw-r--r-- | third_party/aom/aom_ports/x86.h | 325 | ||||
-rw-r--r-- | third_party/aom/aom_ports/x86_abi_support.asm | 395 |
18 files changed, 0 insertions, 2134 deletions
diff --git a/third_party/aom/aom_ports/aom_once.h b/third_party/aom/aom_ports/aom_once.h deleted file mode 100644 index 4d77aac5a..000000000 --- a/third_party/aom/aom_ports/aom_once.h +++ /dev/null @@ -1,138 +0,0 @@ -/* - * Copyright (c) 2016, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#ifndef AOM_AOM_PORTS_AOM_ONCE_H_ -#define AOM_AOM_PORTS_AOM_ONCE_H_ - -#include "config/aom_config.h" - -/* Implement a function wrapper to guarantee initialization - * thread-safety for library singletons. - * - * NOTE: This function uses static locks, and can only be - * used with one common argument per compilation unit. So - * - * file1.c: - * aom_once(foo); - * ... - * aom_once(foo); - * - * file2.c: - * aom_once(bar); - * - * will ensure foo() and bar() are each called only once, but in - * - * file1.c: - * aom_once(foo); - * aom_once(bar): - * - * bar() will never be called because the lock is used up - * by the call to foo(). - */ - -#if CONFIG_MULTITHREAD && defined(_WIN32) -#include <windows.h> -#include <stdlib.h> -/* Declare a per-compilation-unit state variable to track the progress - * of calling func() only once. This must be at global scope because - * local initializers are not thread-safe in MSVC prior to Visual - * Studio 2015. - * - * As a static, aom_once_state will be zero-initialized as program start. - */ -static LONG aom_once_state; -static void aom_once(void (*func)(void)) { - /* Try to advance aom_once_state from its initial value of 0 to 1. - * Only one thread can succeed in doing so. - */ - if (InterlockedCompareExchange(&aom_once_state, 1, 0) == 0) { - /* We're the winning thread, having set aom_once_state to 1. - * Call our function. */ - func(); - /* Now advance aom_once_state to 2, unblocking any other threads. */ - InterlockedIncrement(&aom_once_state); - return; - } - - /* We weren't the winning thread, but we want to block on - * the state variable so we don't return before func() - * has finished executing elsewhere. - * - * Try to advance aom_once_state from 2 to 2, which is only possible - * after the winning thead advances it from 1 to 2. - */ - while (InterlockedCompareExchange(&aom_once_state, 2, 2) != 2) { - /* State isn't yet 2. Try again. - * - * We are used for singleton initialization functions, - * which should complete quickly. Contention will likewise - * be rare, so it's worthwhile to use a simple but cpu- - * intensive busy-wait instead of successive backoff, - * waiting on a kernel object, or another heavier-weight scheme. - * - * We can at least yield our timeslice. - */ - Sleep(0); - } - - /* We've seen aom_once_state advance to 2, so we know func() - * has been called. And we've left aom_once_state as we found it, - * so other threads will have the same experience. - * - * It's safe to return now. - */ - return; -} - -#elif CONFIG_MULTITHREAD && defined(__OS2__) -#define INCL_DOS -#include <os2.h> -static void aom_once(void (*func)(void)) { - static int done; - - /* If the initialization is complete, return early. */ - if (done) return; - - /* Causes all other threads in the process to block themselves - * and give up their time slice. - */ - DosEnterCritSec(); - - if (!done) { - func(); - done = 1; - } - - /* Restores normal thread dispatching for the current process. */ - DosExitCritSec(); -} - -#elif CONFIG_MULTITHREAD && HAVE_PTHREAD_H -#include <pthread.h> -static void aom_once(void (*func)(void)) { - static pthread_once_t lock = PTHREAD_ONCE_INIT; - pthread_once(&lock, func); -} - -#else -/* Default version that performs no synchronization. */ - -static void aom_once(void (*func)(void)) { - static int done; - - if (!done) { - func(); - done = 1; - } -} -#endif - -#endif // AOM_AOM_PORTS_AOM_ONCE_H_ diff --git a/third_party/aom/aom_ports/aom_ports.cmake b/third_party/aom/aom_ports/aom_ports.cmake deleted file mode 100644 index 6272fc0e3..000000000 --- a/third_party/aom/aom_ports/aom_ports.cmake +++ /dev/null @@ -1,81 +0,0 @@ -# -# Copyright (c) 2017, Alliance for Open Media. All rights reserved -# -# This source code is subject to the terms of the BSD 2 Clause License and the -# Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License was -# not distributed with this source code in the LICENSE file, you can obtain it -# at www.aomedia.org/license/software. If the Alliance for Open Media Patent -# License 1.0 was not distributed with this source code in the PATENTS file, you -# can obtain it at www.aomedia.org/license/patent. -# -if(AOM_AOM_PORTS_AOM_PORTS_CMAKE_) - return() -endif() # AOM_AOM_PORTS_AOM_PORTS_CMAKE_ -set(AOM_AOM_PORTS_AOM_PORTS_CMAKE_ 1) - -list(APPEND AOM_PORTS_INCLUDES - "${AOM_ROOT}/aom_ports/aom_once.h" - "${AOM_ROOT}/aom_ports/aom_timer.h" - "${AOM_ROOT}/aom_ports/bitops.h" - "${AOM_ROOT}/aom_ports/emmintrin_compat.h" - "${AOM_ROOT}/aom_ports/mem.h" - "${AOM_ROOT}/aom_ports/mem_ops.h" - "${AOM_ROOT}/aom_ports/mem_ops_aligned.h" - "${AOM_ROOT}/aom_ports/msvc.h" - "${AOM_ROOT}/aom_ports/sanitizer.h" - "${AOM_ROOT}/aom_ports/system_state.h") - -list(APPEND AOM_PORTS_ASM_X86 "${AOM_ROOT}/aom_ports/emms.asm") - -list(APPEND AOM_PORTS_INCLUDES_X86 "${AOM_ROOT}/aom_ports/x86_abi_support.asm") - -list(APPEND AOM_PORTS_SOURCES_ARM "${AOM_ROOT}/aom_ports/arm.h" - "${AOM_ROOT}/aom_ports/arm_cpudetect.c") - -list(APPEND AOM_PORTS_SOURCES_PPC "${AOM_ROOT}/aom_ports/ppc.h" - "${AOM_ROOT}/aom_ports/ppc_cpudetect.c") - -# For arm and x86 targets: -# -# * Creates the aom_ports build target, adds the includes in aom_ports to the -# target, and makes libaom depend on it. -# -# Otherwise: -# -# * Adds the includes in aom_ports to the libaom target. -# -# For all target platforms: -# -# * The libaom target must exist before this function is called. -function(setup_aom_ports_targets) - if("${AOM_TARGET_CPU}" MATCHES "^x86") - add_asm_library("aom_ports" "AOM_PORTS_ASM_X86" "aom") - set(aom_ports_has_symbols 1) - elseif("${AOM_TARGET_CPU}" MATCHES "arm") - add_library(aom_ports OBJECT ${AOM_PORTS_SOURCES_ARM}) - set(aom_ports_has_symbols 1) - target_sources(aom PRIVATE $<TARGET_OBJECTS:aom_ports>) - elseif("${AOM_TARGET_CPU}" MATCHES "ppc") - add_library(aom_ports OBJECT ${AOM_PORTS_SOURCES_PPC}) - set(aom_ports_has_symbols 1) - target_sources(aom PRIVATE $<TARGET_OBJECTS:aom_ports>) - endif() - - if(aom_ports_has_symbols) - target_sources(aom_ports PRIVATE ${AOM_PORTS_INCLUDES}) - - if("${AOM_TARGET_CPU}" STREQUAL "x86" OR "${AOM_TARGET_CPU}" STREQUAL - "x86_64") - target_sources(aom_ports PRIVATE ${AOM_PORTS_INCLUDES_X86}) - endif() - - set(AOM_LIB_TARGETS ${AOM_LIB_TARGETS} PARENT_SCOPE) - else() - target_sources(aom PRIVATE ${AOM_PORTS_INCLUDES}) - - if("${AOM_TARGET_CPU}" STREQUAL "x86" OR "${AOM_TARGET_CPU}" STREQUAL - "x86_64") - target_sources(aom PRIVATE ${AOM_PORTS_INCLUDES_X86}) - endif() - endif() -endfunction() diff --git a/third_party/aom/aom_ports/aom_timer.h b/third_party/aom/aom_ports/aom_timer.h deleted file mode 100644 index 9b17b8983..000000000 --- a/third_party/aom/aom_ports/aom_timer.h +++ /dev/null @@ -1,111 +0,0 @@ -/* - * Copyright (c) 2016, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#ifndef AOM_AOM_PORTS_AOM_TIMER_H_ -#define AOM_AOM_PORTS_AOM_TIMER_H_ - -#include "config/aom_config.h" - -#include "aom/aom_integer.h" - -#if CONFIG_OS_SUPPORT - -#if defined(_WIN32) -/* - * Win32 specific includes - */ -#ifndef WIN32_LEAN_AND_MEAN -#define WIN32_LEAN_AND_MEAN -#endif -#include <windows.h> -#else -/* - * POSIX specific includes - */ -#include <sys/time.h> - -/* timersub is not provided by msys at this time. */ -#ifndef timersub -#define timersub(a, b, result) \ - do { \ - (result)->tv_sec = (a)->tv_sec - (b)->tv_sec; \ - (result)->tv_usec = (a)->tv_usec - (b)->tv_usec; \ - if ((result)->tv_usec < 0) { \ - --(result)->tv_sec; \ - (result)->tv_usec += 1000000; \ - } \ - } while (0) -#endif -#endif - -struct aom_usec_timer { -#if defined(_WIN32) - LARGE_INTEGER begin, end; -#else - struct timeval begin, end; -#endif -}; - -static INLINE void aom_usec_timer_start(struct aom_usec_timer *t) { -#if defined(_WIN32) - QueryPerformanceCounter(&t->begin); -#else - gettimeofday(&t->begin, NULL); -#endif -} - -static INLINE void aom_usec_timer_mark(struct aom_usec_timer *t) { -#if defined(_WIN32) - QueryPerformanceCounter(&t->end); -#else - gettimeofday(&t->end, NULL); -#endif -} - -static INLINE int64_t aom_usec_timer_elapsed(struct aom_usec_timer *t) { -#if defined(_WIN32) - LARGE_INTEGER freq, diff; - - diff.QuadPart = t->end.QuadPart - t->begin.QuadPart; - - QueryPerformanceFrequency(&freq); - return diff.QuadPart * 1000000 / freq.QuadPart; -#else - struct timeval diff; - - timersub(&t->end, &t->begin, &diff); - return ((int64_t)diff.tv_sec) * 1000000 + diff.tv_usec; -#endif -} - -#else /* CONFIG_OS_SUPPORT = 0*/ - -/* Empty timer functions if CONFIG_OS_SUPPORT = 0 */ -#ifndef timersub -#define timersub(a, b, result) -#endif - -struct aom_usec_timer { - void *dummy; -}; - -static INLINE void aom_usec_timer_start(struct aom_usec_timer *t) { (void)t; } - -static INLINE void aom_usec_timer_mark(struct aom_usec_timer *t) { (void)t; } - -static INLINE int aom_usec_timer_elapsed(struct aom_usec_timer *t) { - (void)t; - return 0; -} - -#endif /* CONFIG_OS_SUPPORT */ - -#endif // AOM_AOM_PORTS_AOM_TIMER_H_ diff --git a/third_party/aom/aom_ports/arm.h b/third_party/aom/aom_ports/arm.h deleted file mode 100644 index cb1fb9bec..000000000 --- a/third_party/aom/aom_ports/arm.h +++ /dev/null @@ -1,41 +0,0 @@ -/* - * Copyright (c) 2016, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#ifndef AOM_AOM_PORTS_ARM_H_ -#define AOM_AOM_PORTS_ARM_H_ -#include <stdlib.h> - -#include "config/aom_config.h" - -#ifdef __cplusplus -extern "C" { -#endif - -/*ARMv5TE "Enhanced DSP" instructions.*/ -#define HAS_EDSP 0x01 -/*ARMv6 "Parallel" or "Media" instructions.*/ -#define HAS_MEDIA 0x02 -/*ARMv7 optional NEON instructions.*/ -#define HAS_NEON 0x04 - -int aom_arm_cpu_caps(void); - -// Earlier gcc compilers have issues with some neon intrinsics -#if !defined(__clang__) && defined(__GNUC__) && __GNUC__ == 4 && \ - __GNUC_MINOR__ <= 6 -#define AOM_INCOMPATIBLE_GCC -#endif - -#ifdef __cplusplus -} // extern "C" -#endif - -#endif // AOM_AOM_PORTS_ARM_H_ diff --git a/third_party/aom/aom_ports/arm_cpudetect.c b/third_party/aom/aom_ports/arm_cpudetect.c deleted file mode 100644 index 5a75bb348..000000000 --- a/third_party/aom/aom_ports/arm_cpudetect.c +++ /dev/null @@ -1,150 +0,0 @@ -/* - * Copyright (c) 2016, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#include <stdlib.h> -#include <string.h> -#include "aom_ports/arm.h" -#include "config/aom_config.h" - -#ifdef WINAPI_FAMILY -#include <winapifamily.h> -#if !WINAPI_FAMILY_PARTITION(WINAPI_PARTITION_DESKTOP) -#define getenv(x) NULL -#endif -#endif - -static int arm_cpu_env_flags(int *flags) { - char *env; - env = getenv("AOM_SIMD_CAPS"); - if (env && *env) { - *flags = (int)strtol(env, NULL, 0); - return 0; - } - *flags = 0; - return -1; -} - -static int arm_cpu_env_mask(void) { - char *env; - env = getenv("AOM_SIMD_CAPS_MASK"); - return env && *env ? (int)strtol(env, NULL, 0) : ~0; -} - -#if !CONFIG_RUNTIME_CPU_DETECT - -int aom_arm_cpu_caps(void) { - /* This function should actually be a no-op. There is no way to adjust any of - * these because the RTCD tables do not exist: the functions are called - * statically */ - int flags; - int mask; - if (!arm_cpu_env_flags(&flags)) { - return flags; - } - mask = arm_cpu_env_mask(); -#if HAVE_NEON - flags |= HAS_NEON; -#endif /* HAVE_NEON */ - return flags & mask; -} - -#elif defined(_MSC_VER) /* end !CONFIG_RUNTIME_CPU_DETECT */ -/*For GetExceptionCode() and EXCEPTION_ILLEGAL_INSTRUCTION.*/ -#define WIN32_LEAN_AND_MEAN -#define WIN32_EXTRA_LEAN -#include <windows.h> - -int aom_arm_cpu_caps(void) { - int flags; - int mask; - if (!arm_cpu_env_flags(&flags)) { - return flags; - } - mask = arm_cpu_env_mask(); -/* MSVC has no inline __asm support for ARM, but it does let you __emit - * instructions via their assembled hex code. - * All of these instructions should be essentially nops. - */ -#if HAVE_NEON - if (mask & HAS_NEON) { - __try { - /*VORR q0,q0,q0*/ - __emit(0xF2200150); - flags |= HAS_NEON; - } __except (GetExceptionCode() == EXCEPTION_ILLEGAL_INSTRUCTION) { - /*Ignore exception.*/ - } - } -#endif /* HAVE_NEON */ - return flags & mask; -} - -#elif defined(__ANDROID__) /* end _MSC_VER */ -#include <cpu-features.h> - -int aom_arm_cpu_caps(void) { - int flags; - int mask; - uint64_t features; - if (!arm_cpu_env_flags(&flags)) { - return flags; - } - mask = arm_cpu_env_mask(); - features = android_getCpuFeatures(); - -#if HAVE_NEON - if (features & ANDROID_CPU_ARM_FEATURE_NEON) flags |= HAS_NEON; -#endif /* HAVE_NEON */ - return flags & mask; -} - -#elif defined(__linux__) /* end __ANDROID__ */ - -#include <stdio.h> - -int aom_arm_cpu_caps(void) { - FILE *fin; - int flags; - int mask; - if (!arm_cpu_env_flags(&flags)) { - return flags; - } - mask = arm_cpu_env_mask(); - /* Reading /proc/self/auxv would be easier, but that doesn't work reliably - * on Android. - * This also means that detection will fail in Scratchbox. - */ - fin = fopen("/proc/cpuinfo", "r"); - if (fin != NULL) { - /* 512 should be enough for anybody (it's even enough for all the flags - * that x86 has accumulated... so far). - */ - char buf[512]; - while (fgets(buf, 511, fin) != NULL) { -#if HAVE_NEON - if (memcmp(buf, "Features", 8) == 0) { - char *p; - p = strstr(buf, " neon"); - if (p != NULL && (p[5] == ' ' || p[5] == '\n')) { - flags |= HAS_NEON; - } - } -#endif /* HAVE_NEON */ - } - fclose(fin); - } - return flags & mask; -} -#else /* end __linux__ */ -#error \ - "--enable-runtime-cpu-detect selected, but no CPU detection method " \ -"available for your platform. Reconfigure with --disable-runtime-cpu-detect." -#endif diff --git a/third_party/aom/aom_ports/bitops.h b/third_party/aom/aom_ports/bitops.h deleted file mode 100644 index 44df17307..000000000 --- a/third_party/aom/aom_ports/bitops.h +++ /dev/null @@ -1,78 +0,0 @@ -/* - * Copyright (c) 2016, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#ifndef AOM_AOM_PORTS_BITOPS_H_ -#define AOM_AOM_PORTS_BITOPS_H_ - -#include <assert.h> - -#include "aom_ports/msvc.h" -#include "config/aom_config.h" - -#ifdef _MSC_VER -#if defined(_M_X64) || defined(_M_IX86) -#include <intrin.h> -#define USE_MSC_INTRINSICS -#endif -#endif - -#ifdef __cplusplus -extern "C" { -#endif - -// get_msb: -// Returns (int)floor(log2(n)). n must be > 0. -// These versions of get_msb() are only valid when n != 0 because all -// of the optimized versions are undefined when n == 0: -// https://gcc.gnu.org/onlinedocs/gcc/Other-Builtins.html - -// use GNU builtins where available. -#if defined(__GNUC__) && \ - ((__GNUC__ == 3 && __GNUC_MINOR__ >= 4) || __GNUC__ >= 4) -static INLINE int get_msb(unsigned int n) { - assert(n != 0); - return 31 ^ __builtin_clz(n); -} -#elif defined(USE_MSC_INTRINSICS) -#pragma intrinsic(_BitScanReverse) - -static INLINE int get_msb(unsigned int n) { - unsigned long first_set_bit; - assert(n != 0); - _BitScanReverse(&first_set_bit, n); - return first_set_bit; -} -#undef USE_MSC_INTRINSICS -#else -static INLINE int get_msb(unsigned int n) { - int log = 0; - unsigned int value = n; - int i; - - assert(n != 0); - - for (i = 4; i >= 0; --i) { - const int shift = (1 << i); - const unsigned int x = value >> shift; - if (x != 0) { - value = x; - log += shift; - } - } - return log; -} -#endif - -#ifdef __cplusplus -} // extern "C" -#endif - -#endif // AOM_AOM_PORTS_BITOPS_H_ diff --git a/third_party/aom/aom_ports/emmintrin_compat.h b/third_party/aom/aom_ports/emmintrin_compat.h deleted file mode 100644 index 85d218a3d..000000000 --- a/third_party/aom/aom_ports/emmintrin_compat.h +++ /dev/null @@ -1,56 +0,0 @@ -/* - * Copyright (c) 2016, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#ifndef AOM_AOM_PORTS_EMMINTRIN_COMPAT_H_ -#define AOM_AOM_PORTS_EMMINTRIN_COMPAT_H_ - -#if defined(__GNUC__) && __GNUC__ < 4 -/* From emmintrin.h (gcc 4.5.3) */ -/* Casts between various SP, DP, INT vector types. Note that these do no - conversion of values, they just change the type. */ -extern __inline __m128 - __attribute__((__gnu_inline__, __always_inline__, __artificial__)) - _mm_castpd_ps(__m128d __A) { - return (__m128)__A; -} - -extern __inline __m128i - __attribute__((__gnu_inline__, __always_inline__, __artificial__)) - _mm_castpd_si128(__m128d __A) { - return (__m128i)__A; -} - -extern __inline __m128d - __attribute__((__gnu_inline__, __always_inline__, __artificial__)) - _mm_castps_pd(__m128 __A) { - return (__m128d)__A; -} - -extern __inline __m128i - __attribute__((__gnu_inline__, __always_inline__, __artificial__)) - _mm_castps_si128(__m128 __A) { - return (__m128i)__A; -} - -extern __inline __m128 - __attribute__((__gnu_inline__, __always_inline__, __artificial__)) - _mm_castsi128_ps(__m128i __A) { - return (__m128)__A; -} - -extern __inline __m128d - __attribute__((__gnu_inline__, __always_inline__, __artificial__)) - _mm_castsi128_pd(__m128i __A) { - return (__m128d)__A; -} -#endif - -#endif // AOM_AOM_PORTS_EMMINTRIN_COMPAT_H_ diff --git a/third_party/aom/aom_ports/emms.asm b/third_party/aom/aom_ports/emms.asm deleted file mode 100644 index 90776bacb..000000000 --- a/third_party/aom/aom_ports/emms.asm +++ /dev/null @@ -1,41 +0,0 @@ -; -; Copyright (c) 2016, Alliance for Open Media. All rights reserved -; -; This source code is subject to the terms of the BSD 2 Clause License and -; the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License -; was not distributed with this source code in the LICENSE file, you can -; obtain it at www.aomedia.org/license/software. If the Alliance for Open -; Media Patent License 1.0 was not distributed with this source code in the -; PATENTS file, you can obtain it at www.aomedia.org/license/patent. -; - -; - - -%include "aom_ports/x86_abi_support.asm" - -section .text -global sym(aom_reset_mmx_state) PRIVATE -sym(aom_reset_mmx_state): - emms - ret - - -%if LIBAOM_YASM_WIN64 -global sym(aom_winx64_fldcw) PRIVATE -sym(aom_winx64_fldcw): - sub rsp, 8 - mov [rsp], rcx ; win x64 specific - fldcw [rsp] - add rsp, 8 - ret - - -global sym(aom_winx64_fstcw) PRIVATE -sym(aom_winx64_fstcw): - sub rsp, 8 - fstcw [rsp] - mov rax, [rsp] - add rsp, 8 - ret -%endif diff --git a/third_party/aom/aom_ports/mem.h b/third_party/aom/aom_ports/mem.h deleted file mode 100644 index 3ffea3cd6..000000000 --- a/third_party/aom/aom_ports/mem.h +++ /dev/null @@ -1,69 +0,0 @@ -/* - * Copyright (c) 2016, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#ifndef AOM_AOM_PORTS_MEM_H_ -#define AOM_AOM_PORTS_MEM_H_ - -#include "aom/aom_integer.h" -#include "config/aom_config.h" - -#if (defined(__GNUC__) && __GNUC__) || defined(__SUNPRO_C) -#define DECLARE_ALIGNED(n, typ, val) typ val __attribute__((aligned(n))) -#elif defined(_MSC_VER) -#define DECLARE_ALIGNED(n, typ, val) __declspec(align(n)) typ val -#else -#warning No alignment directives known for this compiler. -#define DECLARE_ALIGNED(n, typ, val) typ val -#endif - -/* Indicates that the usage of the specified variable has been audited to assure - * that it's safe to use uninitialized. Silences 'may be used uninitialized' - * warnings on gcc. - */ -#if defined(__GNUC__) && __GNUC__ -#define UNINITIALIZED_IS_SAFE(x) x = x -#else -#define UNINITIALIZED_IS_SAFE(x) x -#endif - -#if HAVE_NEON && defined(_MSC_VER) -#define __builtin_prefetch(x) -#endif - -/* Shift down with rounding for use when n >= 0, value >= 0 */ -#define ROUND_POWER_OF_TWO(value, n) (((value) + (((1 << (n)) >> 1))) >> (n)) - -/* Shift down with rounding for signed integers, for use when n >= 0 */ -#define ROUND_POWER_OF_TWO_SIGNED(value, n) \ - (((value) < 0) ? -ROUND_POWER_OF_TWO(-(value), (n)) \ - : ROUND_POWER_OF_TWO((value), (n))) - -/* Shift down with rounding for use when n >= 0, value >= 0 for (64 bit) */ -#define ROUND_POWER_OF_TWO_64(value, n) \ - (((value) + ((((int64_t)1 << (n)) >> 1))) >> (n)) -/* Shift down with rounding for signed integers, for use when n >= 0 (64 bit) */ -#define ROUND_POWER_OF_TWO_SIGNED_64(value, n) \ - (((value) < 0) ? -ROUND_POWER_OF_TWO_64(-(value), (n)) \ - : ROUND_POWER_OF_TWO_64((value), (n))) - -/* shift right or left depending on sign of n */ -#define RIGHT_SIGNED_SHIFT(value, n) \ - ((n) < 0 ? ((value) << (-(n))) : ((value) >> (n))) - -#define ALIGN_POWER_OF_TWO(value, n) \ - (((value) + ((1 << (n)) - 1)) & ~((1 << (n)) - 1)) - -#define DIVIDE_AND_ROUND(x, y) (((x) + ((y) >> 1)) / (y)) - -#define CONVERT_TO_SHORTPTR(x) ((uint16_t *)(((uintptr_t)(x)) << 1)) -#define CONVERT_TO_BYTEPTR(x) ((uint8_t *)(((uintptr_t)(x)) >> 1)) - -#endif // AOM_AOM_PORTS_MEM_H_ diff --git a/third_party/aom/aom_ports/mem_ops.h b/third_party/aom/aom_ports/mem_ops.h deleted file mode 100644 index 2b5bc0f0f..000000000 --- a/third_party/aom/aom_ports/mem_ops.h +++ /dev/null @@ -1,228 +0,0 @@ -/* - * Copyright (c) 2016, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#ifndef AOM_AOM_PORTS_MEM_OPS_H_ -#define AOM_AOM_PORTS_MEM_OPS_H_ - -/* \file - * \brief Provides portable memory access primitives - * - * This function provides portable primitives for getting and setting of - * signed and unsigned integers in 16, 24, and 32 bit sizes. The operations - * can be performed on unaligned data regardless of hardware support for - * unaligned accesses. - * - * The type used to pass the integral values may be changed by defining - * MEM_VALUE_T with the appropriate type. The type given must be an integral - * numeric type. - * - * The actual functions instantiated have the MEM_VALUE_T type name pasted - * on to the symbol name. This allows the developer to instantiate these - * operations for multiple types within the same translation unit. This is - * of somewhat questionable utility, but the capability exists nonetheless. - * Users not making use of this functionality should call the functions - * without the type name appended, and the preprocessor will take care of - * it. - * - * NOTE: This code is not supported on platforms where char > 1 octet ATM. - */ - -#ifndef MAU_T -/* Minimum Access Unit for this target */ -#define MAU_T unsigned char -#endif - -#ifndef MEM_VALUE_T -#define MEM_VALUE_T int -#endif - -#undef MEM_VALUE_T_SZ_BITS -#define MEM_VALUE_T_SZ_BITS (sizeof(MEM_VALUE_T) << 3) - -#undef mem_ops_wrap_symbol -#define mem_ops_wrap_symbol(fn) mem_ops_wrap_symbol2(fn, MEM_VALUE_T) -#undef mem_ops_wrap_symbol2 -#define mem_ops_wrap_symbol2(fn, typ) mem_ops_wrap_symbol3(fn, typ) -#undef mem_ops_wrap_symbol3 -#define mem_ops_wrap_symbol3(fn, typ) fn##_as_##typ - -/* - * Include aligned access routines - */ -#define INCLUDED_BY_MEM_OPS_H -#include "mem_ops_aligned.h" -#undef INCLUDED_BY_MEM_OPS_H - -#undef mem_get_be16 -#define mem_get_be16 mem_ops_wrap_symbol(mem_get_be16) -static unsigned MEM_VALUE_T mem_get_be16(const void *vmem) { - unsigned MEM_VALUE_T val; - const MAU_T *mem = (const MAU_T *)vmem; - - val = mem[0] << 8; - val |= mem[1]; - return val; -} - -#undef mem_get_be24 -#define mem_get_be24 mem_ops_wrap_symbol(mem_get_be24) -static unsigned MEM_VALUE_T mem_get_be24(const void *vmem) { - unsigned MEM_VALUE_T val; - const MAU_T *mem = (const MAU_T *)vmem; - - val = mem[0] << 16; - val |= mem[1] << 8; - val |= mem[2]; - return val; -} - -#undef mem_get_be32 -#define mem_get_be32 mem_ops_wrap_symbol(mem_get_be32) -static unsigned MEM_VALUE_T mem_get_be32(const void *vmem) { - unsigned MEM_VALUE_T val; - const MAU_T *mem = (const MAU_T *)vmem; - - val = ((unsigned MEM_VALUE_T)mem[0]) << 24; - val |= mem[1] << 16; - val |= mem[2] << 8; - val |= mem[3]; - return val; -} - -#undef mem_get_le16 -#define mem_get_le16 mem_ops_wrap_symbol(mem_get_le16) -static unsigned MEM_VALUE_T mem_get_le16(const void *vmem) { - unsigned MEM_VALUE_T val; - const MAU_T *mem = (const MAU_T *)vmem; - - val = mem[1] << 8; - val |= mem[0]; - return val; -} - -#undef mem_get_le24 -#define mem_get_le24 mem_ops_wrap_symbol(mem_get_le24) -static unsigned MEM_VALUE_T mem_get_le24(const void *vmem) { - unsigned MEM_VALUE_T val; - const MAU_T *mem = (const MAU_T *)vmem; - - val = mem[2] << 16; - val |= mem[1] << 8; - val |= mem[0]; - return val; -} - -#undef mem_get_le32 -#define mem_get_le32 mem_ops_wrap_symbol(mem_get_le32) -static unsigned MEM_VALUE_T mem_get_le32(const void *vmem) { - unsigned MEM_VALUE_T val; - const MAU_T *mem = (const MAU_T *)vmem; - - val = ((unsigned MEM_VALUE_T)mem[3]) << 24; - val |= mem[2] << 16; - val |= mem[1] << 8; - val |= mem[0]; - return val; -} - -#define mem_get_s_generic(end, sz) \ - static AOM_INLINE signed MEM_VALUE_T mem_get_s##end##sz(const void *vmem) { \ - const MAU_T *mem = (const MAU_T *)vmem; \ - signed MEM_VALUE_T val = mem_get_##end##sz(mem); \ - return (val << (MEM_VALUE_T_SZ_BITS - sz)) >> (MEM_VALUE_T_SZ_BITS - sz); \ - } - -/* clang-format off */ -#undef mem_get_sbe16 -#define mem_get_sbe16 mem_ops_wrap_symbol(mem_get_sbe16) -mem_get_s_generic(be, 16) - -#undef mem_get_sbe24 -#define mem_get_sbe24 mem_ops_wrap_symbol(mem_get_sbe24) -mem_get_s_generic(be, 24) - -#undef mem_get_sbe32 -#define mem_get_sbe32 mem_ops_wrap_symbol(mem_get_sbe32) -mem_get_s_generic(be, 32) - -#undef mem_get_sle16 -#define mem_get_sle16 mem_ops_wrap_symbol(mem_get_sle16) -mem_get_s_generic(le, 16) - -#undef mem_get_sle24 -#define mem_get_sle24 mem_ops_wrap_symbol(mem_get_sle24) -mem_get_s_generic(le, 24) - -#undef mem_get_sle32 -#define mem_get_sle32 mem_ops_wrap_symbol(mem_get_sle32) -mem_get_s_generic(le, 32) - -#undef mem_put_be16 -#define mem_put_be16 mem_ops_wrap_symbol(mem_put_be16) -static AOM_INLINE void mem_put_be16(void *vmem, MEM_VALUE_T val) { - MAU_T *mem = (MAU_T *)vmem; - - mem[0] = (MAU_T)((val >> 8) & 0xff); - mem[1] = (MAU_T)((val >> 0) & 0xff); -} - -#undef mem_put_be24 -#define mem_put_be24 mem_ops_wrap_symbol(mem_put_be24) -static AOM_INLINE void mem_put_be24(void *vmem, MEM_VALUE_T val) { - MAU_T *mem = (MAU_T *)vmem; - - mem[0] = (MAU_T)((val >> 16) & 0xff); - mem[1] = (MAU_T)((val >> 8) & 0xff); - mem[2] = (MAU_T)((val >> 0) & 0xff); -} - -#undef mem_put_be32 -#define mem_put_be32 mem_ops_wrap_symbol(mem_put_be32) -static AOM_INLINE void mem_put_be32(void *vmem, MEM_VALUE_T val) { - MAU_T *mem = (MAU_T *)vmem; - - mem[0] = (MAU_T)((val >> 24) & 0xff); - mem[1] = (MAU_T)((val >> 16) & 0xff); - mem[2] = (MAU_T)((val >> 8) & 0xff); - mem[3] = (MAU_T)((val >> 0) & 0xff); -} - -#undef mem_put_le16 -#define mem_put_le16 mem_ops_wrap_symbol(mem_put_le16) -static AOM_INLINE void mem_put_le16(void *vmem, MEM_VALUE_T val) { - MAU_T *mem = (MAU_T *)vmem; - - mem[0] = (MAU_T)((val >> 0) & 0xff); - mem[1] = (MAU_T)((val >> 8) & 0xff); -} - -#undef mem_put_le24 -#define mem_put_le24 mem_ops_wrap_symbol(mem_put_le24) -static AOM_INLINE void mem_put_le24(void *vmem, MEM_VALUE_T val) { - MAU_T *mem = (MAU_T *)vmem; - - mem[0] = (MAU_T)((val >> 0) & 0xff); - mem[1] = (MAU_T)((val >> 8) & 0xff); - mem[2] = (MAU_T)((val >> 16) & 0xff); -} - -#undef mem_put_le32 -#define mem_put_le32 mem_ops_wrap_symbol(mem_put_le32) -static AOM_INLINE void mem_put_le32(void *vmem, MEM_VALUE_T val) { - MAU_T *mem = (MAU_T *)vmem; - - mem[0] = (MAU_T)((val >> 0) & 0xff); - mem[1] = (MAU_T)((val >> 8) & 0xff); - mem[2] = (MAU_T)((val >> 16) & 0xff); - mem[3] = (MAU_T)((val >> 24) & 0xff); -} -/* clang-format on */ -#endif // AOM_AOM_PORTS_MEM_OPS_H_ diff --git a/third_party/aom/aom_ports/mem_ops_aligned.h b/third_party/aom/aom_ports/mem_ops_aligned.h deleted file mode 100644 index 37c367531..000000000 --- a/third_party/aom/aom_ports/mem_ops_aligned.h +++ /dev/null @@ -1,173 +0,0 @@ -/* - * Copyright (c) 2016, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#ifndef AOM_AOM_PORTS_MEM_OPS_ALIGNED_H_ -#define AOM_AOM_PORTS_MEM_OPS_ALIGNED_H_ - -#include "aom/aom_integer.h" - -/* \file - * \brief Provides portable memory access primitives for operating on aligned - * data - * - * This file is split from mem_ops.h for easier maintenance. See mem_ops.h - * for a more detailed description of these primitives. - */ -#ifndef INCLUDED_BY_MEM_OPS_H -#error Include mem_ops.h, not mem_ops_aligned.h directly. -#endif - -/* Architectures that provide instructions for doing this byte swapping - * could redefine these macros. - */ -#define swap_endian_16(val, raw) \ - do { \ - val = (uint16_t)(((raw >> 8) & 0x00ff) | ((raw << 8) & 0xff00)); \ - } while (0) -#define swap_endian_32(val, raw) \ - do { \ - val = ((raw >> 24) & 0x000000ff) | ((raw >> 8) & 0x0000ff00) | \ - ((raw << 8) & 0x00ff0000) | ((raw << 24) & 0xff000000); \ - } while (0) -#define swap_endian_16_se(val, raw) \ - do { \ - swap_endian_16(val, raw); \ - val = ((val << 16) >> 16); \ - } while (0) -#define swap_endian_32_se(val, raw) swap_endian_32(val, raw) - -#define mem_get_ne_aligned_generic(end, sz) \ - static AOM_INLINE unsigned MEM_VALUE_T mem_get_##end##sz##_aligned( \ - const void *vmem) { \ - const uint##sz##_t *mem = (const uint##sz##_t *)vmem; \ - return *mem; \ - } - -#define mem_get_sne_aligned_generic(end, sz) \ - static AOM_INLINE signed MEM_VALUE_T mem_get_s##end##sz##_aligned( \ - const void *vmem) { \ - const int##sz##_t *mem = (const int##sz##_t *)vmem; \ - return *mem; \ - } - -#define mem_get_se_aligned_generic(end, sz) \ - static AOM_INLINE unsigned MEM_VALUE_T mem_get_##end##sz##_aligned( \ - const void *vmem) { \ - const uint##sz##_t *mem = (const uint##sz##_t *)vmem; \ - unsigned MEM_VALUE_T val, raw = *mem; \ - swap_endian_##sz(val, raw); \ - return val; \ - } - -#define mem_get_sse_aligned_generic(end, sz) \ - static AOM_INLINE signed MEM_VALUE_T mem_get_s##end##sz##_aligned( \ - const void *vmem) { \ - const int##sz##_t *mem = (const int##sz##_t *)vmem; \ - unsigned MEM_VALUE_T val, raw = *mem; \ - swap_endian_##sz##_se(val, raw); \ - return val; \ - } - -#define mem_put_ne_aligned_generic(end, sz) \ - static AOM_INLINE void mem_put_##end##sz##_aligned(void *vmem, \ - MEM_VALUE_T val) { \ - uint##sz##_t *mem = (uint##sz##_t *)vmem; \ - *mem = (uint##sz##_t)val; \ - } - -#define mem_put_se_aligned_generic(end, sz) \ - static AOM_INLINE void mem_put_##end##sz##_aligned(void *vmem, \ - MEM_VALUE_T val) { \ - uint##sz##_t *mem = (uint##sz##_t *)vmem, raw; \ - swap_endian_##sz(raw, val); \ - *mem = (uint##sz##_t)raw; \ - } - -#include "config/aom_config.h" - -#if CONFIG_BIG_ENDIAN -#define mem_get_be_aligned_generic(sz) mem_get_ne_aligned_generic(be, sz) -#define mem_get_sbe_aligned_generic(sz) mem_get_sne_aligned_generic(be, sz) -#define mem_get_le_aligned_generic(sz) mem_get_se_aligned_generic(le, sz) -#define mem_get_sle_aligned_generic(sz) mem_get_sse_aligned_generic(le, sz) -#define mem_put_be_aligned_generic(sz) mem_put_ne_aligned_generic(be, sz) -#define mem_put_le_aligned_generic(sz) mem_put_se_aligned_generic(le, sz) -#else -#define mem_get_be_aligned_generic(sz) mem_get_se_aligned_generic(be, sz) -#define mem_get_sbe_aligned_generic(sz) mem_get_sse_aligned_generic(be, sz) -#define mem_get_le_aligned_generic(sz) mem_get_ne_aligned_generic(le, sz) -#define mem_get_sle_aligned_generic(sz) mem_get_sne_aligned_generic(le, sz) -#define mem_put_be_aligned_generic(sz) mem_put_se_aligned_generic(be, sz) -#define mem_put_le_aligned_generic(sz) mem_put_ne_aligned_generic(le, sz) -#endif - -/* clang-format off */ -#undef mem_get_be16_aligned -#define mem_get_be16_aligned mem_ops_wrap_symbol(mem_get_be16_aligned) -mem_get_be_aligned_generic(16) - -#undef mem_get_be32_aligned -#define mem_get_be32_aligned mem_ops_wrap_symbol(mem_get_be32_aligned) -mem_get_be_aligned_generic(32) - -#undef mem_get_le16_aligned -#define mem_get_le16_aligned mem_ops_wrap_symbol(mem_get_le16_aligned) -mem_get_le_aligned_generic(16) - -#undef mem_get_le32_aligned -#define mem_get_le32_aligned mem_ops_wrap_symbol(mem_get_le32_aligned) -mem_get_le_aligned_generic(32) - -#undef mem_get_sbe16_aligned -#define mem_get_sbe16_aligned mem_ops_wrap_symbol(mem_get_sbe16_aligned) -mem_get_sbe_aligned_generic(16) - -#undef mem_get_sbe32_aligned -#define mem_get_sbe32_aligned mem_ops_wrap_symbol(mem_get_sbe32_aligned) -mem_get_sbe_aligned_generic(32) - -#undef mem_get_sle16_aligned -#define mem_get_sle16_aligned mem_ops_wrap_symbol(mem_get_sle16_aligned) -mem_get_sle_aligned_generic(16) - -#undef mem_get_sle32_aligned -#define mem_get_sle32_aligned mem_ops_wrap_symbol(mem_get_sle32_aligned) -mem_get_sle_aligned_generic(32) - -#undef mem_put_be16_aligned -#define mem_put_be16_aligned mem_ops_wrap_symbol(mem_put_be16_aligned) -mem_put_be_aligned_generic(16) - -#undef mem_put_be32_aligned -#define mem_put_be32_aligned mem_ops_wrap_symbol(mem_put_be32_aligned) -mem_put_be_aligned_generic(32) - -#undef mem_put_le16_aligned -#define mem_put_le16_aligned mem_ops_wrap_symbol(mem_put_le16_aligned) -mem_put_le_aligned_generic(16) - -#undef mem_put_le32_aligned -#define mem_put_le32_aligned mem_ops_wrap_symbol(mem_put_le32_aligned) -mem_put_le_aligned_generic(32) - -#undef mem_get_ne_aligned_generic -#undef mem_get_se_aligned_generic -#undef mem_get_sne_aligned_generic -#undef mem_get_sse_aligned_generic -#undef mem_put_ne_aligned_generic -#undef mem_put_se_aligned_generic -#undef swap_endian_16 -#undef swap_endian_32 -#undef swap_endian_16_se -#undef swap_endian_32_se -/* clang-format on */ - -#endif // AOM_AOM_PORTS_MEM_OPS_ALIGNED_H_ diff --git a/third_party/aom/aom_ports/msvc.h b/third_party/aom/aom_ports/msvc.h deleted file mode 100644 index e78e605f2..000000000 --- a/third_party/aom/aom_ports/msvc.h +++ /dev/null @@ -1,75 +0,0 @@ -/* - * Copyright (c) 2016, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#ifndef AOM_AOM_PORTS_MSVC_H_ -#define AOM_AOM_PORTS_MSVC_H_ -#ifdef _MSC_VER - -#include "config/aom_config.h" - -#if _MSC_VER < 1900 // VS2015 provides snprintf -#define snprintf _snprintf -#endif // _MSC_VER < 1900 - -#if _MSC_VER < 1800 // VS2013 provides round -#include <math.h> -static INLINE double round(double x) { - if (x < 0) - return ceil(x - 0.5); - else - return floor(x + 0.5); -} - -static INLINE float roundf(float x) { - if (x < 0) - return (float)ceil(x - 0.5f); - else - return (float)floor(x + 0.5f); -} - -static INLINE long lroundf(float x) { - if (x < 0) - return (long)(x - 0.5f); - else - return (long)(x + 0.5f); -} -#endif // _MSC_VER < 1800 - -#if HAVE_AVX -#include <immintrin.h> -// Note: -// _mm256_insert_epi16 intrinsics is available from vs2017. -// We define this macro for vs2015 and earlier. The -// intrinsics used here are in vs2015 document: -// https://msdn.microsoft.com/en-us/library/hh977022.aspx -// Input parameters: -// a: __m256i, -// d: int16_t, -// indx: imm8 (0 - 15) -#if _MSC_VER <= 1900 -#define _mm256_insert_epi16(a, d, indx) \ - _mm256_insertf128_si256( \ - a, \ - _mm_insert_epi16(_mm256_extractf128_si256(a, indx >> 3), d, indx % 8), \ - indx >> 3) - -static INLINE int _mm256_extract_epi32(__m256i a, const int i) { - return a.m256i_i32[i & 7]; -} -static INLINE __m256i _mm256_insert_epi32(__m256i a, int b, const int i) { - __m256i c = a; - c.m256i_i32[i & 7] = b; - return c; -} -#endif // _MSC_VER <= 1900 -#endif // HAVE_AVX -#endif // _MSC_VER -#endif // AOM_AOM_PORTS_MSVC_H_ diff --git a/third_party/aom/aom_ports/ppc.h b/third_party/aom/aom_ports/ppc.h deleted file mode 100644 index 3159bda68..000000000 --- a/third_party/aom/aom_ports/ppc.h +++ /dev/null @@ -1,30 +0,0 @@ -/* - * Copyright (c) 2018, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#ifndef AOM_AOM_PORTS_PPC_H_ -#define AOM_AOM_PORTS_PPC_H_ -#include <stdlib.h> - -#include "config/aom_config.h" - -#ifdef __cplusplus -extern "C" { -#endif - -#define HAS_VSX 0x01 - -int ppc_simd_caps(void); - -#ifdef __cplusplus -} // extern "C" -#endif - -#endif // AOM_AOM_PORTS_PPC_H_ diff --git a/third_party/aom/aom_ports/ppc_cpudetect.c b/third_party/aom/aom_ports/ppc_cpudetect.c deleted file mode 100644 index 82b4f58cc..000000000 --- a/third_party/aom/aom_ports/ppc_cpudetect.c +++ /dev/null @@ -1,82 +0,0 @@ -/* - * Copyright (c) 2018, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#include <fcntl.h> -#include <unistd.h> -#include <stdint.h> -#include <asm/cputable.h> -#include <linux/auxvec.h> - -#include "config/aom_config.h" - -#include "aom_ports/ppc.h" - -#if CONFIG_RUNTIME_CPU_DETECT -static int cpu_env_flags(int *flags) { - char *env; - env = getenv("AOM_SIMD_CAPS"); - if (env && *env) { - *flags = (int)strtol(env, NULL, 0); - return 0; - } - *flags = 0; - return -1; -} - -static int cpu_env_mask(void) { - char *env; - env = getenv("AOM_SIMD_CAPS_MASK"); - return env && *env ? (int)strtol(env, NULL, 0) : ~0; -} - -int ppc_simd_caps(void) { - int flags; - int mask; - int fd; - ssize_t count; - unsigned int i; - uint64_t buf[64]; - - // If VPX_SIMD_CAPS is set then allow only those capabilities. - if (!cpu_env_flags(&flags)) { - return flags; - } - - mask = cpu_env_mask(); - - fd = open("/proc/self/auxv", O_RDONLY); - if (fd < 0) { - return 0; - } - - while ((count = read(fd, buf, sizeof(buf))) > 0) { - for (i = 0; i < (count / sizeof(*buf)); i += 2) { - if (buf[i] == AT_HWCAP) { -#if HAVE_VSX - if (buf[i + 1] & PPC_FEATURE_HAS_VSX) { - flags |= HAS_VSX; - } -#endif // HAVE_VSX - goto out_close; - } else if (buf[i] == AT_NULL) { - goto out_close; - } - } - } -out_close: - close(fd); - return flags & mask; -} -#else -// If there is no RTCD the function pointers are not used and can not be -// changed. -int ppc_simd_caps(void) { return 0; } -#endif // CONFIG_RUNTIME_CPU_DETECT diff --git a/third_party/aom/aom_ports/sanitizer.h b/third_party/aom/aom_ports/sanitizer.h deleted file mode 100644 index 1dd8eb4cf..000000000 --- a/third_party/aom/aom_ports/sanitizer.h +++ /dev/null @@ -1,38 +0,0 @@ -/* - * Copyright (c) 2018, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#ifndef AOM_AOM_PORTS_SANITIZER_H_ -#define AOM_AOM_PORTS_SANITIZER_H_ - -// AddressSanitizer support. - -// Define AOM_ADDRESS_SANITIZER if AddressSanitizer is used. -// Clang. -#if defined(__has_feature) -#if __has_feature(address_sanitizer) -#define AOM_ADDRESS_SANITIZER 1 -#endif -#endif // defined(__has_feature) -// GCC. -#if defined(__SANITIZE_ADDRESS__) -#define AOM_ADDRESS_SANITIZER 1 -#endif // defined(__SANITIZE_ADDRESS__) - -// Define the macros for AddressSanitizer manual memory poisoning. See -// https://github.com/google/sanitizers/wiki/AddressSanitizerManualPoisoning. -#if defined(AOM_ADDRESS_SANITIZER) -#include <sanitizer/asan_interface.h> -#else -#define ASAN_POISON_MEMORY_REGION(addr, size) ((void)(addr), (void)(size)) -#define ASAN_UNPOISON_MEMORY_REGION(addr, size) ((void)(addr), (void)(size)) -#endif - -#endif // AOM_AOM_PORTS_SANITIZER_H_ diff --git a/third_party/aom/aom_ports/system_state.h b/third_party/aom/aom_ports/system_state.h deleted file mode 100644 index 6640839d8..000000000 --- a/third_party/aom/aom_ports/system_state.h +++ /dev/null @@ -1,23 +0,0 @@ -/* - * Copyright (c) 2016, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#ifndef AOM_AOM_PORTS_SYSTEM_STATE_H_ -#define AOM_AOM_PORTS_SYSTEM_STATE_H_ - -#include "config/aom_config.h" - -#if ARCH_X86 || ARCH_X86_64 -void aom_reset_mmx_state(void); -#define aom_clear_system_state() aom_reset_mmx_state() -#else -#define aom_clear_system_state() -#endif // ARCH_X86 || ARCH_X86_64 -#endif // AOM_AOM_PORTS_SYSTEM_STATE_H_ diff --git a/third_party/aom/aom_ports/x86.h b/third_party/aom/aom_ports/x86.h deleted file mode 100644 index 52ee49cb3..000000000 --- a/third_party/aom/aom_ports/x86.h +++ /dev/null @@ -1,325 +0,0 @@ -/* - * Copyright (c) 2016, Alliance for Open Media. All rights reserved - * - * This source code is subject to the terms of the BSD 2 Clause License and - * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License - * was not distributed with this source code in the LICENSE file, you can - * obtain it at www.aomedia.org/license/software. If the Alliance for Open - * Media Patent License 1.0 was not distributed with this source code in the - * PATENTS file, you can obtain it at www.aomedia.org/license/patent. - */ - -#ifndef AOM_AOM_PORTS_X86_H_ -#define AOM_AOM_PORTS_X86_H_ -#include <stdlib.h> - -#if defined(_MSC_VER) -#include <intrin.h> /* For __cpuidex, __rdtsc */ -#endif - -#include "aom/aom_integer.h" -#include "config/aom_config.h" - -#ifdef __cplusplus -extern "C" { -#endif - -typedef enum { - AOM_CPU_UNKNOWN = -1, - AOM_CPU_AMD, - AOM_CPU_AMD_OLD, - AOM_CPU_CENTAUR, - AOM_CPU_CYRIX, - AOM_CPU_INTEL, - AOM_CPU_NEXGEN, - AOM_CPU_NSC, - AOM_CPU_RISE, - AOM_CPU_SIS, - AOM_CPU_TRANSMETA, - AOM_CPU_TRANSMETA_OLD, - AOM_CPU_UMC, - AOM_CPU_VIA, - - AOM_CPU_LAST -} aom_cpu_t; - -#if defined(__GNUC__) && __GNUC__ || defined(__ANDROID__) -#if ARCH_X86_64 -#define cpuid(func, func2, ax, bx, cx, dx) \ - __asm__ __volatile__("cpuid \n\t" \ - : "=a"(ax), "=b"(bx), "=c"(cx), "=d"(dx) \ - : "a"(func), "c"(func2)); -#else -#define cpuid(func, func2, ax, bx, cx, dx) \ - __asm__ __volatile__( \ - "mov %%ebx, %%edi \n\t" \ - "cpuid \n\t" \ - "xchg %%edi, %%ebx \n\t" \ - : "=a"(ax), "=D"(bx), "=c"(cx), "=d"(dx) \ - : "a"(func), "c"(func2)); -#endif -#elif defined(__SUNPRO_C) || \ - defined(__SUNPRO_CC) /* end __GNUC__ or __ANDROID__*/ -#if ARCH_X86_64 -#define cpuid(func, func2, ax, bx, cx, dx) \ - asm volatile( \ - "xchg %rsi, %rbx \n\t" \ - "cpuid \n\t" \ - "movl %ebx, %edi \n\t" \ - "xchg %rsi, %rbx \n\t" \ - : "=a"(ax), "=D"(bx), "=c"(cx), "=d"(dx) \ - : "a"(func), "c"(func2)); -#else -#define cpuid(func, func2, ax, bx, cx, dx) \ - asm volatile( \ - "pushl %ebx \n\t" \ - "cpuid \n\t" \ - "movl %ebx, %edi \n\t" \ - "popl %ebx \n\t" \ - : "=a"(ax), "=D"(bx), "=c"(cx), "=d"(dx) \ - : "a"(func), "c"(func2)); -#endif -#else /* end __SUNPRO__ */ -#if ARCH_X86_64 -#if defined(_MSC_VER) && _MSC_VER > 1500 -#define cpuid(func, func2, a, b, c, d) \ - do { \ - int regs[4]; \ - __cpuidex(regs, func, func2); \ - a = regs[0]; \ - b = regs[1]; \ - c = regs[2]; \ - d = regs[3]; \ - } while (0) -#else -#define cpuid(func, func2, a, b, c, d) \ - do { \ - int regs[4]; \ - __cpuid(regs, func); \ - a = regs[0]; \ - b = regs[1]; \ - c = regs[2]; \ - d = regs[3]; \ - } while (0) -#endif -#else -/* clang-format off */ -#define cpuid(func, func2, a, b, c, d) \ - __asm mov eax, func \ - __asm mov ecx, func2 \ - __asm cpuid \ - __asm mov a, eax \ - __asm mov b, ebx \ - __asm mov c, ecx \ - __asm mov d, edx -#endif -/* clang-format on */ -#endif /* end others */ - -// NaCl has no support for xgetbv or the raw opcode. -#if !defined(__native_client__) && (defined(__i386__) || defined(__x86_64__)) -static INLINE uint64_t xgetbv(void) { - const uint32_t ecx = 0; - uint32_t eax, edx; - // Use the raw opcode for xgetbv for compatibility with older toolchains. - __asm__ volatile(".byte 0x0f, 0x01, 0xd0\n" - : "=a"(eax), "=d"(edx) - : "c"(ecx)); - return ((uint64_t)edx << 32) | eax; -} -#elif (defined(_M_X64) || defined(_M_IX86)) && defined(_MSC_FULL_VER) && \ - _MSC_FULL_VER >= 160040219 // >= VS2010 SP1 -#include <immintrin.h> -#define xgetbv() _xgetbv(0) -#elif defined(_MSC_VER) && defined(_M_IX86) -static INLINE uint64_t xgetbv(void) { - uint32_t eax_, edx_; - __asm { - xor ecx, ecx // ecx = 0 - // Use the raw opcode for xgetbv for compatibility with older toolchains. - __asm _emit 0x0f __asm _emit 0x01 __asm _emit 0xd0 - mov eax_, eax - mov edx_, edx - } - return ((uint64_t)edx_ << 32) | eax_; -} -#else -#define xgetbv() 0U // no AVX for older x64 or unrecognized toolchains. -#endif - -#if defined(_MSC_VER) && _MSC_VER >= 1700 -#include <windows.h> -#if WINAPI_FAMILY_PARTITION(WINAPI_FAMILY_APP) -#define getenv(x) NULL -#endif -#endif - -#define HAS_MMX 0x01 -#define HAS_SSE 0x02 -#define HAS_SSE2 0x04 -#define HAS_SSE3 0x08 -#define HAS_SSSE3 0x10 -#define HAS_SSE4_1 0x20 -#define HAS_AVX 0x40 -#define HAS_AVX2 0x80 -#define HAS_SSE4_2 0x100 -#ifndef BIT -#define BIT(n) (1 << n) -#endif - -static INLINE int x86_simd_caps(void) { - unsigned int flags = 0; - unsigned int mask = ~0; - unsigned int max_cpuid_val, reg_eax, reg_ebx, reg_ecx, reg_edx; - char *env; - (void)reg_ebx; - - /* See if the CPU capabilities are being overridden by the environment */ - env = getenv("AOM_SIMD_CAPS"); - - if (env && *env) return (int)strtol(env, NULL, 0); - - env = getenv("AOM_SIMD_CAPS_MASK"); - - if (env && *env) mask = (unsigned int)strtoul(env, NULL, 0); - - /* Ensure that the CPUID instruction supports extended features */ - cpuid(0, 0, max_cpuid_val, reg_ebx, reg_ecx, reg_edx); - - if (max_cpuid_val < 1) return 0; - - /* Get the standard feature flags */ - cpuid(1, 0, reg_eax, reg_ebx, reg_ecx, reg_edx); - - if (reg_edx & BIT(23)) flags |= HAS_MMX; - - if (reg_edx & BIT(25)) flags |= HAS_SSE; /* aka xmm */ - - if (reg_edx & BIT(26)) flags |= HAS_SSE2; /* aka wmt */ - - if (reg_ecx & BIT(0)) flags |= HAS_SSE3; - - if (reg_ecx & BIT(9)) flags |= HAS_SSSE3; - - if (reg_ecx & BIT(19)) flags |= HAS_SSE4_1; - - if (reg_ecx & BIT(20)) flags |= HAS_SSE4_2; - - // bits 27 (OSXSAVE) & 28 (256-bit AVX) - if ((reg_ecx & (BIT(27) | BIT(28))) == (BIT(27) | BIT(28))) { - if ((xgetbv() & 0x6) == 0x6) { - flags |= HAS_AVX; - - if (max_cpuid_val >= 7) { - /* Get the leaf 7 feature flags. Needed to check for AVX2 support */ - cpuid(7, 0, reg_eax, reg_ebx, reg_ecx, reg_edx); - - if (reg_ebx & BIT(5)) flags |= HAS_AVX2; - } - } - } - - return flags & mask; -} - -// Note: -// 32-bit CPU cycle counter is light-weighted for most function performance -// measurement. For large function (CPU time > a couple of seconds), 64-bit -// counter should be used. -// 32-bit CPU cycle counter -static INLINE unsigned int x86_readtsc(void) { -#if defined(__GNUC__) && __GNUC__ - unsigned int tsc; - __asm__ __volatile__("rdtsc\n\t" : "=a"(tsc) :); - return tsc; -#elif defined(__SUNPRO_C) || defined(__SUNPRO_CC) - unsigned int tsc; - asm volatile("rdtsc\n\t" : "=a"(tsc) :); - return tsc; -#else -#if ARCH_X86_64 - return (unsigned int)__rdtsc(); -#else - __asm rdtsc; -#endif -#endif -} -// 64-bit CPU cycle counter -static INLINE uint64_t x86_readtsc64(void) { -#if defined(__GNUC__) && __GNUC__ - uint32_t hi, lo; - __asm__ __volatile__("rdtsc" : "=a"(lo), "=d"(hi)); - return ((uint64_t)hi << 32) | lo; -#elif defined(__SUNPRO_C) || defined(__SUNPRO_CC) - uint_t hi, lo; - asm volatile("rdtsc\n\t" : "=a"(lo), "=d"(hi)); - return ((uint64_t)hi << 32) | lo; -#else -#if ARCH_X86_64 - return (uint64_t)__rdtsc(); -#else - __asm rdtsc; -#endif -#endif -} - -#if defined(__GNUC__) && __GNUC__ -#define x86_pause_hint() __asm__ __volatile__("pause \n\t") -#elif defined(__SUNPRO_C) || defined(__SUNPRO_CC) -#define x86_pause_hint() asm volatile("pause \n\t") -#else -#if ARCH_X86_64 -#define x86_pause_hint() _mm_pause(); -#else -#define x86_pause_hint() __asm pause -#endif -#endif - -#if defined(__GNUC__) && __GNUC__ -static void x87_set_control_word(unsigned short mode) { - __asm__ __volatile__("fldcw %0" : : "m"(*&mode)); -} -static unsigned short x87_get_control_word(void) { - unsigned short mode; - __asm__ __volatile__("fstcw %0\n\t" : "=m"(*&mode) :); - return mode; -} -#elif defined(__SUNPRO_C) || defined(__SUNPRO_CC) -static void x87_set_control_word(unsigned short mode) { - asm volatile("fldcw %0" : : "m"(*&mode)); -} -static unsigned short x87_get_control_word(void) { - unsigned short mode; - asm volatile("fstcw %0\n\t" : "=m"(*&mode) :); - return mode; -} -#elif ARCH_X86_64 -/* No fldcw intrinsics on Windows x64, punt to external asm */ -extern void aom_winx64_fldcw(unsigned short mode); -extern unsigned short aom_winx64_fstcw(void); -#define x87_set_control_word aom_winx64_fldcw -#define x87_get_control_word aom_winx64_fstcw -#else -static void x87_set_control_word(unsigned short mode) { - __asm { fldcw mode } -} -static unsigned short x87_get_control_word(void) { - unsigned short mode; - __asm { fstcw mode } - return mode; -} -#endif - -static INLINE unsigned int x87_set_double_precision(void) { - unsigned int mode = x87_get_control_word(); - x87_set_control_word((mode & ~0x300) | 0x200); - return mode; -} - -extern void aom_reset_mmx_state(void); - -#ifdef __cplusplus -} // extern "C" -#endif - -#endif // AOM_AOM_PORTS_X86_H_ diff --git a/third_party/aom/aom_ports/x86_abi_support.asm b/third_party/aom/aom_ports/x86_abi_support.asm deleted file mode 100644 index 0e7c26287..000000000 --- a/third_party/aom/aom_ports/x86_abi_support.asm +++ /dev/null @@ -1,395 +0,0 @@ -; -; Copyright (c) 2016, Alliance for Open Media. All rights reserved -; -; This source code is subject to the terms of the BSD 2 Clause License and -; the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License -; was not distributed with this source code in the LICENSE file, you can -; obtain it at www.aomedia.org/license/software. If the Alliance for Open -; Media Patent License 1.0 was not distributed with this source code in the -; PATENTS file, you can obtain it at www.aomedia.org/license/patent. -; - -; - - -%include "config/aom_config.asm" - -; 32/64 bit compatibility macros -; -; In general, we make the source use 64 bit syntax, then twiddle with it using -; the preprocessor to get the 32 bit syntax on 32 bit platforms. -; -%ifidn __OUTPUT_FORMAT__,elf32 -%define ABI_IS_32BIT 1 -%elifidn __OUTPUT_FORMAT__,macho32 -%define ABI_IS_32BIT 1 -%elifidn __OUTPUT_FORMAT__,win32 -%define ABI_IS_32BIT 1 -%elifidn __OUTPUT_FORMAT__,aout -%define ABI_IS_32BIT 1 -%else -%define ABI_IS_32BIT 0 -%endif - -%if ABI_IS_32BIT -%define rax eax -%define rbx ebx -%define rcx ecx -%define rdx edx -%define rsi esi -%define rdi edi -%define rsp esp -%define rbp ebp -%define movsxd mov -%macro movq 2 - %ifidn %1,eax - movd %1,%2 - %elifidn %2,eax - movd %1,%2 - %elifidn %1,ebx - movd %1,%2 - %elifidn %2,ebx - movd %1,%2 - %elifidn %1,ecx - movd %1,%2 - %elifidn %2,ecx - movd %1,%2 - %elifidn %1,edx - movd %1,%2 - %elifidn %2,edx - movd %1,%2 - %elifidn %1,esi - movd %1,%2 - %elifidn %2,esi - movd %1,%2 - %elifidn %1,edi - movd %1,%2 - %elifidn %2,edi - movd %1,%2 - %elifidn %1,esp - movd %1,%2 - %elifidn %2,esp - movd %1,%2 - %elifidn %1,ebp - movd %1,%2 - %elifidn %2,ebp - movd %1,%2 - %else - movq %1,%2 - %endif -%endmacro -%endif - - -; LIBAOM_YASM_WIN64 -; Set LIBAOM_YASM_WIN64 if output is Windows 64bit so the code will work if x64 -; or win64 is defined on the Yasm command line. -%ifidn __OUTPUT_FORMAT__,win64 -%define LIBAOM_YASM_WIN64 1 -%elifidn __OUTPUT_FORMAT__,x64 -%define LIBAOM_YASM_WIN64 1 -%else -%define LIBAOM_YASM_WIN64 0 -%endif - -; sym() -; Return the proper symbol name for the target ABI. -; -; Certain ABIs, notably MS COFF and Darwin MACH-O, require that symbols -; with C linkage be prefixed with an underscore. -; -%ifidn __OUTPUT_FORMAT__,elf32 -%define sym(x) x -%elifidn __OUTPUT_FORMAT__,elf64 -%define sym(x) x -%elifidn __OUTPUT_FORMAT__,elfx32 -%define sym(x) x -%elif LIBAOM_YASM_WIN64 -%define sym(x) x -%else -%define sym(x) _ %+ x -%endif - -; PRIVATE -; Macro for the attribute to hide a global symbol for the target ABI. -; This is only active if CHROMIUM is defined. -; -; Chromium doesn't like exported global symbols due to symbol clashing with -; plugins among other things. -; -; Requires Chromium's patched copy of yasm: -; http://src.chromium.org/viewvc/chrome?view=rev&revision=73761 -; http://www.tortall.net/projects/yasm/ticket/236 -; -%ifdef CHROMIUM - %ifidn __OUTPUT_FORMAT__,elf32 - %define PRIVATE :hidden - %elifidn __OUTPUT_FORMAT__,elf64 - %define PRIVATE :hidden - %elifidn __OUTPUT_FORMAT__,elfx32 - %define PRIVATE :hidden - %elif LIBAOM_YASM_WIN64 - %define PRIVATE - %else - %define PRIVATE :private_extern - %endif -%else - %define PRIVATE -%endif - -; arg() -; Return the address specification of the given argument -; -%if ABI_IS_32BIT - %define arg(x) [ebp+8+4*x] -%else - ; 64 bit ABI passes arguments in registers. This is a workaround to get up - ; and running quickly. Relies on SHADOW_ARGS_TO_STACK - %if LIBAOM_YASM_WIN64 - %define arg(x) [rbp+16+8*x] - %else - %define arg(x) [rbp-8-8*x] - %endif -%endif - -; REG_SZ_BYTES, REG_SZ_BITS -; Size of a register -%if ABI_IS_32BIT -%define REG_SZ_BYTES 4 -%define REG_SZ_BITS 32 -%else -%define REG_SZ_BYTES 8 -%define REG_SZ_BITS 64 -%endif - - -; ALIGN_STACK <alignment> <register> -; This macro aligns the stack to the given alignment (in bytes). The stack -; is left such that the previous value of the stack pointer is the first -; argument on the stack (ie, the inverse of this macro is 'pop rsp.') -; This macro uses one temporary register, which is not preserved, and thus -; must be specified as an argument. -%macro ALIGN_STACK 2 - mov %2, rsp - and rsp, -%1 - lea rsp, [rsp - (%1 - REG_SZ_BYTES)] - push %2 -%endmacro - - -; -; The Microsoft assembler tries to impose a certain amount of type safety in -; its register usage. YASM doesn't recognize these directives, so we just -; %define them away to maintain as much compatibility as possible with the -; original inline assembler we're porting from. -; -%idefine PTR -%idefine XMMWORD -%idefine MMWORD - -; PIC macros -; -%if ABI_IS_32BIT - %if CONFIG_PIC=1 - %ifidn __OUTPUT_FORMAT__,elf32 - %define WRT_PLT wrt ..plt - %macro GET_GOT 1 - extern _GLOBAL_OFFSET_TABLE_ - push %1 - call %%get_got - %%sub_offset: - jmp %%exitGG - %%get_got: - mov %1, [esp] - add %1, _GLOBAL_OFFSET_TABLE_ + $$ - %%sub_offset wrt ..gotpc - ret - %%exitGG: - %undef GLOBAL - %define GLOBAL(x) x + %1 wrt ..gotoff - %undef RESTORE_GOT - %define RESTORE_GOT pop %1 - %endmacro - %elifidn __OUTPUT_FORMAT__,macho32 - %macro GET_GOT 1 - push %1 - call %%get_got - %%get_got: - pop %1 - %undef GLOBAL - %define GLOBAL(x) x + %1 - %%get_got - %undef RESTORE_GOT - %define RESTORE_GOT pop %1 - %endmacro - %endif - %endif - - %ifdef CHROMIUM - %ifidn __OUTPUT_FORMAT__,macho32 - %define HIDDEN_DATA(x) x:private_extern - %else - %define HIDDEN_DATA(x) x - %endif - %else - %define HIDDEN_DATA(x) x - %endif -%else - %macro GET_GOT 1 - %endmacro - %define GLOBAL(x) rel x - %ifidn __OUTPUT_FORMAT__,elf64 - %define WRT_PLT wrt ..plt - %define HIDDEN_DATA(x) x:data hidden - %elifidn __OUTPUT_FORMAT__,elfx32 - %define WRT_PLT wrt ..plt - %define HIDDEN_DATA(x) x:data hidden - %elifidn __OUTPUT_FORMAT__,macho64 - %ifdef CHROMIUM - %define HIDDEN_DATA(x) x:private_extern - %else - %define HIDDEN_DATA(x) x - %endif - %else - %define HIDDEN_DATA(x) x - %endif -%endif -%ifnmacro GET_GOT - %macro GET_GOT 1 - %endmacro - %define GLOBAL(x) x -%endif -%ifndef RESTORE_GOT -%define RESTORE_GOT -%endif -%ifndef WRT_PLT -%define WRT_PLT -%endif - -%if ABI_IS_32BIT - %macro SHADOW_ARGS_TO_STACK 1 - %endm - %define UNSHADOW_ARGS -%else -%if LIBAOM_YASM_WIN64 - %macro SHADOW_ARGS_TO_STACK 1 ; argc - %if %1 > 0 - mov arg(0),rcx - %endif - %if %1 > 1 - mov arg(1),rdx - %endif - %if %1 > 2 - mov arg(2),r8 - %endif - %if %1 > 3 - mov arg(3),r9 - %endif - %endm -%else - %macro SHADOW_ARGS_TO_STACK 1 ; argc - %if %1 > 0 - push rdi - %endif - %if %1 > 1 - push rsi - %endif - %if %1 > 2 - push rdx - %endif - %if %1 > 3 - push rcx - %endif - %if %1 > 4 - push r8 - %endif - %if %1 > 5 - push r9 - %endif - %if %1 > 6 - %assign i %1-6 - %assign off 16 - %rep i - mov rax,[rbp+off] - push rax - %assign off off+8 - %endrep - %endif - %endm -%endif - %define UNSHADOW_ARGS mov rsp, rbp -%endif - -; Win64 ABI requires that XMM6:XMM15 are callee saved -; SAVE_XMM n, [u] -; store registers 6-n on the stack -; if u is specified, use unaligned movs. -; Win64 ABI requires 16 byte stack alignment, but then pushes an 8 byte return -; value. Typically we follow this up with 'push rbp' - re-aligning the stack - -; but in some cases this is not done and unaligned movs must be used. -%if LIBAOM_YASM_WIN64 -%macro SAVE_XMM 1-2 a - %if %1 < 6 - %error Only xmm registers 6-15 must be preserved - %else - %assign last_xmm %1 - %define movxmm movdq %+ %2 - %assign xmm_stack_space ((last_xmm - 5) * 16) - sub rsp, xmm_stack_space - %assign i 6 - %rep (last_xmm - 5) - movxmm [rsp + ((i - 6) * 16)], xmm %+ i - %assign i i+1 - %endrep - %endif -%endmacro -%macro RESTORE_XMM 0 - %ifndef last_xmm - %error RESTORE_XMM must be paired with SAVE_XMM n - %else - %assign i last_xmm - %rep (last_xmm - 5) - movxmm xmm %+ i, [rsp +((i - 6) * 16)] - %assign i i-1 - %endrep - add rsp, xmm_stack_space - ; there are a couple functions which return from multiple places. - ; otherwise, we could uncomment these: - ; %undef last_xmm - ; %undef xmm_stack_space - ; %undef movxmm - %endif -%endmacro -%else -%macro SAVE_XMM 1-2 -%endmacro -%macro RESTORE_XMM 0 -%endmacro -%endif - -; Name of the rodata section -; -; .rodata seems to be an elf-ism, as it doesn't work on OSX. -; -%ifidn __OUTPUT_FORMAT__,macho64 -%define SECTION_RODATA section .text -%elifidn __OUTPUT_FORMAT__,macho32 -%macro SECTION_RODATA 0 -section .text -%endmacro -%elifidn __OUTPUT_FORMAT__,aout -%define SECTION_RODATA section .data -%else -%define SECTION_RODATA section .rodata -%endif - - -; Tell GNU ld that we don't require an executable stack. -%ifidn __OUTPUT_FORMAT__,elf32 -section .note.GNU-stack noalloc noexec nowrite progbits -section .text -%elifidn __OUTPUT_FORMAT__,elf64 -section .note.GNU-stack noalloc noexec nowrite progbits -section .text -%elifidn __OUTPUT_FORMAT__,elfx32 -section .note.GNU-stack noalloc noexec nowrite progbits -section .text -%endif |