|
@@ -658,7 +658,7 @@ if(SDL_ASSEMBLY)
|
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -mmmx")
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -mmmx")
|
|
|
endif()
|
|
endif()
|
|
|
- check_c_source_compiles("
|
|
|
|
|
|
|
+ check_x86_source_compiles([==[
|
|
|
#include <mmintrin.h>
|
|
#include <mmintrin.h>
|
|
|
void ints_add(int *dest, int *a, int *b, unsigned size) {
|
|
void ints_add(int *dest, int *a, int *b, unsigned size) {
|
|
|
for (; size >= 2; size -= 2, dest += 2, a += 2, b += 2) {
|
|
for (; size >= 2; size -= 2, dest += 2, a += 2, b += 2) {
|
|
@@ -668,7 +668,7 @@ if(SDL_ASSEMBLY)
|
|
|
int main(int argc, char *argv[]) {
|
|
int main(int argc, char *argv[]) {
|
|
|
ints_add((int*)0, (int*)0, (int*)0, 0);
|
|
ints_add((int*)0, (int*)0, (int*)0, 0);
|
|
|
return 0;
|
|
return 0;
|
|
|
- }" COMPILER_SUPPORTS_MMX)
|
|
|
|
|
|
|
+ }]==] COMPILER_SUPPORTS_MMX)
|
|
|
cmake_pop_check_state()
|
|
cmake_pop_check_state()
|
|
|
if(COMPILER_SUPPORTS_MMX)
|
|
if(COMPILER_SUPPORTS_MMX)
|
|
|
set(HAVE_MMX TRUE)
|
|
set(HAVE_MMX TRUE)
|
|
@@ -679,7 +679,7 @@ if(SDL_ASSEMBLY)
|
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -msse")
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -msse")
|
|
|
endif()
|
|
endif()
|
|
|
- check_c_source_compiles("
|
|
|
|
|
|
|
+ check_x86_source_compiles([==[
|
|
|
#include <xmmintrin.h>
|
|
#include <xmmintrin.h>
|
|
|
void floats_add(float *dest, float *a, float *b, unsigned size) {
|
|
void floats_add(float *dest, float *a, float *b, unsigned size) {
|
|
|
for (; size >= 4; size -= 4, dest += 4, a += 4, b += 4) {
|
|
for (; size >= 4; size -= 4, dest += 4, a += 4, b += 4) {
|
|
@@ -689,7 +689,7 @@ if(SDL_ASSEMBLY)
|
|
|
int main(int argc, char **argv) {
|
|
int main(int argc, char **argv) {
|
|
|
floats_add((float*)0, (float*)0, (float*)0, 0);
|
|
floats_add((float*)0, (float*)0, (float*)0, 0);
|
|
|
return 0;
|
|
return 0;
|
|
|
- }" COMPILER_SUPPORTS_SSE)
|
|
|
|
|
|
|
+ }]==] COMPILER_SUPPORTS_SSE)
|
|
|
cmake_pop_check_state()
|
|
cmake_pop_check_state()
|
|
|
if(COMPILER_SUPPORTS_SSE)
|
|
if(COMPILER_SUPPORTS_SSE)
|
|
|
set(HAVE_SSE TRUE)
|
|
set(HAVE_SSE TRUE)
|
|
@@ -700,7 +700,7 @@ if(SDL_ASSEMBLY)
|
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -msse2")
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -msse2")
|
|
|
endif()
|
|
endif()
|
|
|
- check_c_source_compiles("
|
|
|
|
|
|
|
+ check_x86_source_compiles([==[
|
|
|
#include <emmintrin.h>
|
|
#include <emmintrin.h>
|
|
|
void doubles_add(double *dest, double *a, double *b, unsigned size) {
|
|
void doubles_add(double *dest, double *a, double *b, unsigned size) {
|
|
|
for (; size >= 4; size -= 4, dest += 4, a += 4, b += 4) {
|
|
for (; size >= 4; size -= 4, dest += 4, a += 4, b += 4) {
|
|
@@ -710,7 +710,7 @@ if(SDL_ASSEMBLY)
|
|
|
int main(int argc, char **argv) {
|
|
int main(int argc, char **argv) {
|
|
|
doubles_add((double*)0, (double*)0, (double*)0, 0);
|
|
doubles_add((double*)0, (double*)0, (double*)0, 0);
|
|
|
return 0;
|
|
return 0;
|
|
|
- }" COMPILER_SUPPORTS_SSE2)
|
|
|
|
|
|
|
+ }]==] COMPILER_SUPPORTS_SSE2)
|
|
|
cmake_pop_check_state()
|
|
cmake_pop_check_state()
|
|
|
if(COMPILER_SUPPORTS_SSE2)
|
|
if(COMPILER_SUPPORTS_SSE2)
|
|
|
set(HAVE_SSE2 TRUE)
|
|
set(HAVE_SSE2 TRUE)
|
|
@@ -721,7 +721,7 @@ if(SDL_ASSEMBLY)
|
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -msse3")
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -msse3")
|
|
|
endif()
|
|
endif()
|
|
|
- check_c_source_compiles("
|
|
|
|
|
|
|
+ check_x86_source_compiles([==[
|
|
|
#include <pmmintrin.h>
|
|
#include <pmmintrin.h>
|
|
|
void ints_add(int *dest, int *a, int *b, unsigned size) {
|
|
void ints_add(int *dest, int *a, int *b, unsigned size) {
|
|
|
for (; size >= 4; size -= 4, dest += 4, a += 4, b += 4) {
|
|
for (; size >= 4; size -= 4, dest += 4, a += 4, b += 4) {
|
|
@@ -731,7 +731,7 @@ if(SDL_ASSEMBLY)
|
|
|
int main(int argc, char **argv) {
|
|
int main(int argc, char **argv) {
|
|
|
ints_add((int*)0, (int*)0, (int*)0, 0);
|
|
ints_add((int*)0, (int*)0, (int*)0, 0);
|
|
|
return 0;
|
|
return 0;
|
|
|
- }" COMPILER_SUPPORTS_SSE3)
|
|
|
|
|
|
|
+ }]==] COMPILER_SUPPORTS_SSE3)
|
|
|
cmake_pop_check_state()
|
|
cmake_pop_check_state()
|
|
|
if(COMPILER_SUPPORTS_SSE3)
|
|
if(COMPILER_SUPPORTS_SSE3)
|
|
|
set(HAVE_SSE3 TRUE)
|
|
set(HAVE_SSE3 TRUE)
|
|
@@ -742,7 +742,7 @@ if(SDL_ASSEMBLY)
|
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -msse4.1")
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -msse4.1")
|
|
|
endif()
|
|
endif()
|
|
|
- check_c_source_compiles("
|
|
|
|
|
|
|
+ check_x86_source_compiles([==[
|
|
|
#include <smmintrin.h>
|
|
#include <smmintrin.h>
|
|
|
void ints_mul(int *dest, int *a, int *b, unsigned size) {
|
|
void ints_mul(int *dest, int *a, int *b, unsigned size) {
|
|
|
for (; size >= 4; size -= 4, dest += 4, a += 4, b += 4) {
|
|
for (; size >= 4; size -= 4, dest += 4, a += 4, b += 4) {
|
|
@@ -752,7 +752,7 @@ if(SDL_ASSEMBLY)
|
|
|
int main(int argc, char **argv) {
|
|
int main(int argc, char **argv) {
|
|
|
ints_mul((int*)0, (int*)0, (int*)0, 0);
|
|
ints_mul((int*)0, (int*)0, (int*)0, 0);
|
|
|
return 0;
|
|
return 0;
|
|
|
- }" COMPILER_SUPPORTS_SSE4_1)
|
|
|
|
|
|
|
+ }]==] COMPILER_SUPPORTS_SSE4_1)
|
|
|
cmake_pop_check_state()
|
|
cmake_pop_check_state()
|
|
|
if(COMPILER_SUPPORTS_SSE4_1)
|
|
if(COMPILER_SUPPORTS_SSE4_1)
|
|
|
set(HAVE_SSE4_1 TRUE)
|
|
set(HAVE_SSE4_1 TRUE)
|
|
@@ -763,14 +763,14 @@ if(SDL_ASSEMBLY)
|
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -msse4.2")
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -msse4.2")
|
|
|
endif()
|
|
endif()
|
|
|
- check_c_source_compiles("
|
|
|
|
|
|
|
+ check_x86_source_compiles([==[
|
|
|
#include <nmmintrin.h>
|
|
#include <nmmintrin.h>
|
|
|
__m128i bitmask;
|
|
__m128i bitmask;
|
|
|
char data[16];
|
|
char data[16];
|
|
|
int main(int argc, char **argv) {
|
|
int main(int argc, char **argv) {
|
|
|
bitmask = _mm_cmpgt_epi64(_mm_set1_epi64x(0), _mm_loadu_si128((void*)data));
|
|
bitmask = _mm_cmpgt_epi64(_mm_set1_epi64x(0), _mm_loadu_si128((void*)data));
|
|
|
return 0;
|
|
return 0;
|
|
|
- }" COMPILER_SUPPORTS_SSE4_2)
|
|
|
|
|
|
|
+ }]==] COMPILER_SUPPORTS_SSE4_2)
|
|
|
cmake_pop_check_state()
|
|
cmake_pop_check_state()
|
|
|
if(COMPILER_SUPPORTS_SSE4_2)
|
|
if(COMPILER_SUPPORTS_SSE4_2)
|
|
|
set(HAVE_SSE4_2 TRUE)
|
|
set(HAVE_SSE4_2 TRUE)
|
|
@@ -781,7 +781,7 @@ if(SDL_ASSEMBLY)
|
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -mavx")
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -mavx")
|
|
|
endif()
|
|
endif()
|
|
|
- check_c_source_compiles("
|
|
|
|
|
|
|
+ check_x86_source_compiles([==[
|
|
|
#include <immintrin.h>
|
|
#include <immintrin.h>
|
|
|
void floats_add(float *dest, float *a, float *b, unsigned size) {
|
|
void floats_add(float *dest, float *a, float *b, unsigned size) {
|
|
|
for (; size >= 8; size -= 8, dest += 8, a += 8, b += 8) {
|
|
for (; size >= 8; size -= 8, dest += 8, a += 8, b += 8) {
|
|
@@ -791,7 +791,7 @@ if(SDL_ASSEMBLY)
|
|
|
int main(int argc, char **argv) {
|
|
int main(int argc, char **argv) {
|
|
|
floats_add((float*)0, (float*)0, (float*)0, 0);
|
|
floats_add((float*)0, (float*)0, (float*)0, 0);
|
|
|
return 0;
|
|
return 0;
|
|
|
- }" COMPILER_SUPPORTS_AVX)
|
|
|
|
|
|
|
+ }]==] COMPILER_SUPPORTS_AVX)
|
|
|
cmake_pop_check_state()
|
|
cmake_pop_check_state()
|
|
|
if(COMPILER_SUPPORTS_AVX)
|
|
if(COMPILER_SUPPORTS_AVX)
|
|
|
set(HAVE_AVX TRUE)
|
|
set(HAVE_AVX TRUE)
|
|
@@ -802,7 +802,7 @@ if(SDL_ASSEMBLY)
|
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -mavx2")
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -mavx2")
|
|
|
endif()
|
|
endif()
|
|
|
- check_c_source_compiles("
|
|
|
|
|
|
|
+ check_x86_source_compiles([==[
|
|
|
#include <immintrin.h>
|
|
#include <immintrin.h>
|
|
|
void ints_add(int *dest, int *a, int *b, unsigned size) {
|
|
void ints_add(int *dest, int *a, int *b, unsigned size) {
|
|
|
for (; size >= 8; size -= 8, dest += 8, a += 8, b += 8) {
|
|
for (; size >= 8; size -= 8, dest += 8, a += 8, b += 8) {
|
|
@@ -812,7 +812,7 @@ if(SDL_ASSEMBLY)
|
|
|
int main(int argc, char **argv) {
|
|
int main(int argc, char **argv) {
|
|
|
ints_add((int*)0, (int*)0, (int*)0, 0);
|
|
ints_add((int*)0, (int*)0, (int*)0, 0);
|
|
|
return 0;
|
|
return 0;
|
|
|
- }" COMPILER_SUPPORTS_AVX2)
|
|
|
|
|
|
|
+ }]==] COMPILER_SUPPORTS_AVX2)
|
|
|
cmake_pop_check_state()
|
|
cmake_pop_check_state()
|
|
|
if(COMPILER_SUPPORTS_AVX2)
|
|
if(COMPILER_SUPPORTS_AVX2)
|
|
|
set(HAVE_AVX2 TRUE)
|
|
set(HAVE_AVX2 TRUE)
|
|
@@ -823,7 +823,7 @@ if(SDL_ASSEMBLY)
|
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
if(USE_GCC OR USE_CLANG OR USE_INTELCC)
|
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -mavx512f")
|
|
string(APPEND CMAKE_REQUIRED_FLAGS " -mavx512f")
|
|
|
endif()
|
|
endif()
|
|
|
- check_c_source_compiles("
|
|
|
|
|
|
|
+ check_x86_source_compiles([==[
|
|
|
#include <immintrin.h>
|
|
#include <immintrin.h>
|
|
|
void floats_add(float *dest, float *a, float *b, unsigned size) {
|
|
void floats_add(float *dest, float *a, float *b, unsigned size) {
|
|
|
for (; size >= 16; size -= 16, dest += 16, a += 16, b += 16) {
|
|
for (; size >= 16; size -= 16, dest += 16, a += 16, b += 16) {
|
|
@@ -833,7 +833,7 @@ if(SDL_ASSEMBLY)
|
|
|
int main(int argc, char **argv) {
|
|
int main(int argc, char **argv) {
|
|
|
floats_add((float*)0, (float*)0, (float*)0, 0);
|
|
floats_add((float*)0, (float*)0, (float*)0, 0);
|
|
|
return 0;
|
|
return 0;
|
|
|
- }" COMPILER_SUPPORTS_AVX512F)
|
|
|
|
|
|
|
+ }]==] COMPILER_SUPPORTS_AVX512F)
|
|
|
cmake_pop_check_state()
|
|
cmake_pop_check_state()
|
|
|
if(COMPILER_SUPPORTS_AVX512F)
|
|
if(COMPILER_SUPPORTS_AVX512F)
|
|
|
set(HAVE_AVX512F TRUE)
|
|
set(HAVE_AVX512F TRUE)
|
|
@@ -841,18 +841,17 @@ if(SDL_ASSEMBLY)
|
|
|
endif()
|
|
endif()
|
|
|
|
|
|
|
|
if(SDL_ARMNEON)
|
|
if(SDL_ARMNEON)
|
|
|
- check_c_source_compiles("
|
|
|
|
|
- #include <arm_neon.h>
|
|
|
|
|
- void floats_add(float *dest, float *a, float *b, unsigned size) {
|
|
|
|
|
- for (; size >= 4; size -= 4, dest += 4, a += 4, b += 4) {
|
|
|
|
|
- vst1q_f32(dest, vaddq_f32(vld1q_f32(a), vld1q_f32(b)));
|
|
|
|
|
- }
|
|
|
|
|
|
|
+ check_arm_source_compiles([==[
|
|
|
|
|
+ #include <arm_neon.h>
|
|
|
|
|
+ void floats_add(float *dest, float *a, float *b, unsigned size) {
|
|
|
|
|
+ for (; size >= 4; size -= 4, dest += 4, a += 4, b += 4) {
|
|
|
|
|
+ vst1q_f32(dest, vaddq_f32(vld1q_f32(a), vld1q_f32(b)));
|
|
|
}
|
|
}
|
|
|
- int main(int argc, char *argv[]) {
|
|
|
|
|
- floats_add((float*)0, (float*)0, (float*)0, 0);
|
|
|
|
|
- return 0;
|
|
|
|
|
- }" COMPILER_SUPPORTS_ARMNEON)
|
|
|
|
|
-
|
|
|
|
|
|
|
+ }
|
|
|
|
|
+ int main(int argc, char *argv[]) {
|
|
|
|
|
+ floats_add((float*)0, (float*)0, (float*)0, 0);
|
|
|
|
|
+ return 0;
|
|
|
|
|
+ }]==] COMPILER_SUPPORTS_ARMNEON)
|
|
|
if(COMPILER_SUPPORTS_ARMNEON)
|
|
if(COMPILER_SUPPORTS_ARMNEON)
|
|
|
set(HAVE_ARMNEON TRUE)
|
|
set(HAVE_ARMNEON TRUE)
|
|
|
endif()
|
|
endif()
|