| /* |
| Simple DirectMedia Layer |
| Copyright (C) 1997-2021 Sam Lantinga <slouken@libsdl.org> |
| |
| This software is provided 'as-is', without any express or implied |
| warranty. In no event will the authors be held liable for any damages |
| arising from the use of this software. |
| |
| Permission is granted to anyone to use this software for any purpose, |
| including commercial applications, and to alter it and redistribute it |
| freely, subject to the following restrictions: |
| |
| 1. The origin of this software must not be misrepresented; you must not |
| claim that you wrote the original software. If you use this software |
| in a product, an acknowledgment in the product documentation would be |
| appreciated but is not required. |
| 2. Altered source versions must be plainly marked as such, and must not be |
| misrepresented as being the original software. |
| 3. This notice may not be removed or altered from any source distribution. |
| */ |
| |
| /** |
| * \file SDL_cpuinfo.h |
| * |
| * CPU feature detection for SDL. |
| */ |
| |
| #ifndef SDL_cpuinfo_h_ |
| #define SDL_cpuinfo_h_ |
| |
| #include "SDL_stdinc.h" |
| |
| /* Need to do this here because intrin.h has C++ code in it */ |
| /* Visual Studio 2005 has a bug where intrin.h conflicts with winnt.h */ |
| #if defined(_MSC_VER) && (_MSC_VER >= 1500) && (defined(_M_IX86) || defined(_M_X64)) |
| #ifdef __clang__ |
| /* Many of the intrinsics SDL uses are not implemented by clang with Visual Studio */ |
| #undef __MMX__ |
| #undef __SSE__ |
| #undef __SSE2__ |
| #else |
| #include <intrin.h> |
| #ifndef _WIN64 |
| #ifndef __MMX__ |
| #define __MMX__ |
| #endif |
| #ifndef __3dNOW__ |
| #define __3dNOW__ |
| #endif |
| #endif |
| #ifndef __SSE__ |
| #define __SSE__ |
| #endif |
| #ifndef __SSE2__ |
| #define __SSE2__ |
| #endif |
| #endif /* __clang__ */ |
| #elif defined(__MINGW64_VERSION_MAJOR) |
| #include <intrin.h> |
| #else |
| /* altivec.h redefining bool causes a number of problems, see bugs 3993 and 4392, so you need to explicitly define SDL_ENABLE_ALTIVEC_H to have it included. */ |
| #if defined(HAVE_ALTIVEC_H) && defined(__ALTIVEC__) && !defined(__APPLE_ALTIVEC__) && defined(SDL_ENABLE_ALTIVEC_H) |
| #include <altivec.h> |
| #endif |
| #if !defined(SDL_DISABLE_ARM_NEON_H) |
| # if defined(__ARM_NEON) |
| # include <arm_neon.h> |
| # elif defined(__WINDOWS__) || defined(__WINRT__) |
| /* Visual Studio doesn't define __ARM_ARCH, but _M_ARM (if set, always 7), and _M_ARM64 (if set, always 1). */ |
| # if defined(_M_ARM) |
| # include <armintr.h> |
| # include <arm_neon.h> |
| # define __ARM_NEON 1 /* Set __ARM_NEON so that it can be used elsewhere, at compile time */ |
| # endif |
| # if defined (_M_ARM64) |
| # include <arm64intr.h> |
| # include <arm64_neon.h> |
| # define __ARM_NEON 1 /* Set __ARM_NEON so that it can be used elsewhere, at compile time */ |
| # endif |
| # endif |
| #endif |
| #if defined(__3dNOW__) && !defined(SDL_DISABLE_MM3DNOW_H) |
| #include <mm3dnow.h> |
| #endif |
| #if defined(HAVE_IMMINTRIN_H) && !defined(SDL_DISABLE_IMMINTRIN_H) |
| #include <immintrin.h> |
| #else |
| #if defined(__MMX__) && !defined(SDL_DISABLE_MMINTRIN_H) |
| #include <mmintrin.h> |
| #endif |
| #if defined(__SSE__) && !defined(SDL_DISABLE_XMMINTRIN_H) |
| #include <xmmintrin.h> |
| #endif |
| #if defined(__SSE2__) && !defined(SDL_DISABLE_EMMINTRIN_H) |
| #include <emmintrin.h> |
| #endif |
| #if defined(__SSE3__) && !defined(SDL_DISABLE_PMMINTRIN_H) |
| #include <pmmintrin.h> |
| #endif |
| #endif /* HAVE_IMMINTRIN_H */ |
| #endif /* compiler version */ |
| |
| #include "begin_code.h" |
| /* Set up for C function definitions, even when using C++ */ |
| #ifdef __cplusplus |
| extern "C" { |
| #endif |
| |
| /* This is a guess for the cacheline size used for padding. |
| * Most x86 processors have a 64 byte cache line. |
| * The 64-bit PowerPC processors have a 128 byte cache line. |
| * We'll use the larger value to be generally safe. |
| */ |
| #define SDL_CACHELINE_SIZE 128 |
| |
| /** |
| * This function returns the number of CPU cores available. |
| */ |
| extern DECLSPEC int SDLCALL SDL_GetCPUCount(void); |
| |
| /** |
| * This function returns the L1 cache line size of the CPU |
| * |
| * This is useful for determining multi-threaded structure padding |
| * or SIMD prefetch sizes. |
| */ |
| extern DECLSPEC int SDLCALL SDL_GetCPUCacheLineSize(void); |
| |
| /** |
| * This function returns true if the CPU has the RDTSC instruction. |
| */ |
| extern DECLSPEC SDL_bool SDLCALL SDL_HasRDTSC(void); |
| |
| /** |
| * This function returns true if the CPU has AltiVec features. |
| */ |
| extern DECLSPEC SDL_bool SDLCALL SDL_HasAltiVec(void); |
| |
| /** |
| * This function returns true if the CPU has MMX features. |
| */ |
| extern DECLSPEC SDL_bool SDLCALL SDL_HasMMX(void); |
| |
| /** |
| * This function returns true if the CPU has 3DNow! features. |
| */ |
| extern DECLSPEC SDL_bool SDLCALL SDL_Has3DNow(void); |
| |
| /** |
| * This function returns true if the CPU has SSE features. |
| */ |
| extern DECLSPEC SDL_bool SDLCALL SDL_HasSSE(void); |
| |
| /** |
| * This function returns true if the CPU has SSE2 features. |
| */ |
| extern DECLSPEC SDL_bool SDLCALL SDL_HasSSE2(void); |
| |
| /** |
| * This function returns true if the CPU has SSE3 features. |
| */ |
| extern DECLSPEC SDL_bool SDLCALL SDL_HasSSE3(void); |
| |
| /** |
| * This function returns true if the CPU has SSE4.1 features. |
| */ |
| extern DECLSPEC SDL_bool SDLCALL SDL_HasSSE41(void); |
| |
| /** |
| * This function returns true if the CPU has SSE4.2 features. |
| */ |
| extern DECLSPEC SDL_bool SDLCALL SDL_HasSSE42(void); |
| |
| /** |
| * This function returns true if the CPU has AVX features. |
| */ |
| extern DECLSPEC SDL_bool SDLCALL SDL_HasAVX(void); |
| |
| /** |
| * This function returns true if the CPU has AVX2 features. |
| */ |
| extern DECLSPEC SDL_bool SDLCALL SDL_HasAVX2(void); |
| |
| /** |
| * This function returns true if the CPU has AVX-512F (foundation) features. |
| */ |
| extern DECLSPEC SDL_bool SDLCALL SDL_HasAVX512F(void); |
| |
| /** |
| * This function returns true if the CPU has ARM SIMD (ARMv6) features. |
| */ |
| extern DECLSPEC SDL_bool SDLCALL SDL_HasARMSIMD(void); |
| |
| /** |
| * This function returns true if the CPU has NEON (ARM SIMD) features. |
| */ |
| extern DECLSPEC SDL_bool SDLCALL SDL_HasNEON(void); |
| |
| /** |
| * This function returns the amount of RAM configured in the system, in MB. |
| */ |
| extern DECLSPEC int SDLCALL SDL_GetSystemRAM(void); |
| |
| /** |
| * \brief Report the alignment this system needs for SIMD allocations. |
| * |
| * This will return the minimum number of bytes to which a pointer must be |
| * aligned to be compatible with SIMD instructions on the current machine. |
| * For example, if the machine supports SSE only, it will return 16, but if |
| * it supports AVX-512F, it'll return 64 (etc). This only reports values for |
| * instruction sets SDL knows about, so if your SDL build doesn't have |
| * SDL_HasAVX512F(), then it might return 16 for the SSE support it sees and |
| * not 64 for the AVX-512 instructions that exist but SDL doesn't know about. |
| * Plan accordingly. |
| */ |
| extern DECLSPEC size_t SDLCALL SDL_SIMDGetAlignment(void); |
| |
| /** |
| * \brief Allocate memory in a SIMD-friendly way. |
| * |
| * This will allocate a block of memory that is suitable for use with SIMD |
| * instructions. Specifically, it will be properly aligned and padded for |
| * the system's supported vector instructions. |
| * |
| * The memory returned will be padded such that it is safe to read or write |
| * an incomplete vector at the end of the memory block. This can be useful |
| * so you don't have to drop back to a scalar fallback at the end of your |
| * SIMD processing loop to deal with the final elements without overflowing |
| * the allocated buffer. |
| * |
| * You must free this memory with SDL_FreeSIMD(), not free() or SDL_free() |
| * or delete[], etc. |
| * |
| * Note that SDL will only deal with SIMD instruction sets it is aware of; |
| * for example, SDL 2.0.8 knows that SSE wants 16-byte vectors |
| * (SDL_HasSSE()), and AVX2 wants 32 bytes (SDL_HasAVX2()), but doesn't |
| * know that AVX-512 wants 64. To be clear: if you can't decide to use an |
| * instruction set with an SDL_Has*() function, don't use that instruction |
| * set with memory allocated through here. |
| * |
| * SDL_AllocSIMD(0) will return a non-NULL pointer, assuming the system isn't |
| * out of memory. |
| * |
| * \param len The length, in bytes, of the block to allocated. The actual |
| * allocated block might be larger due to padding, etc. |
| * \return Pointer to newly-allocated block, NULL if out of memory. |
| * |
| * \sa SDL_SIMDAlignment |
| * \sa SDL_SIMDRealloc |
| * \sa SDL_SIMDFree |
| */ |
| extern DECLSPEC void * SDLCALL SDL_SIMDAlloc(const size_t len); |
| |
| /** |
| * \brief Reallocate memory obtained from SDL_SIMDAlloc |
| * |
| * It is not valid to use this function on a pointer from anything but |
| * SDL_SIMDAlloc(). It can't be used on pointers from malloc, realloc, |
| * SDL_malloc, memalign, new[], etc. |
| * |
| * \param mem The pointer obtained from SDL_SIMDAlloc. This function also |
| * accepts NULL, at which point this function is the same as |
| * calling SDL_realloc with a NULL pointer. |
| * \param len The length, in bytes, of the block to allocated. The actual |
| * allocated block might be larger due to padding, etc. Passing 0 |
| * will return a non-NULL pointer, assuming the system isn't out of |
| * memory. |
| * \return Pointer to newly-reallocated block, NULL if out of memory. |
| * |
| * \sa SDL_SIMDAlignment |
| * \sa SDL_SIMDAlloc |
| * \sa SDL_SIMDFree |
| */ |
| extern DECLSPEC void * SDLCALL SDL_SIMDRealloc(void *mem, const size_t len); |
| |
| /** |
| * \brief Deallocate memory obtained from SDL_SIMDAlloc |
| * |
| * It is not valid to use this function on a pointer from anything but |
| * SDL_SIMDAlloc(). It can't be used on pointers from malloc, realloc, |
| * SDL_malloc, memalign, new[], etc. |
| * |
| * However, SDL_SIMDFree(NULL) is a legal no-op. |
| * |
| * \sa SDL_SIMDAlloc |
| * \sa SDL_SIMDRealloc |
| */ |
| extern DECLSPEC void SDLCALL SDL_SIMDFree(void *ptr); |
| |
| /* vi: set ts=4 sw=4 expandtab: */ |
| /* Ends C function definitions when using C++ */ |
| #ifdef __cplusplus |
| } |
| #endif |
| #include "close_code.h" |
| |
| #endif /* SDL_cpuinfo_h_ */ |
| |
| /* vi: set ts=4 sw=4 expandtab: */ |