mirror of
https://github.com/TREX-CoE/qmckl.git
synced 2024-12-22 20:36:01 +01:00
Added AVX2 detection to autoconfig script.
Fixed minor SIMD bug in tests.
This commit is contained in:
parent
9a779f2a94
commit
2e45927e04
@ -223,6 +223,8 @@ AC_RUN_IFELSE(
|
|||||||
int simd=1;
|
int simd=1;
|
||||||
#if defined(__AVX512F__)
|
#if defined(__AVX512F__)
|
||||||
simd=8;
|
simd=8;
|
||||||
|
#elif defined(__AVX2__)
|
||||||
|
simd=4;
|
||||||
#elif defined(__AVX__)
|
#elif defined(__AVX__)
|
||||||
simd=4;
|
simd=4;
|
||||||
#elif defined(__SSE2__)
|
#elif defined(__SSE2__)
|
||||||
|
@ -418,7 +418,7 @@ The tests for the kernels are executed on datasets that are extracted from a run
|
|||||||
|
|
||||||
#+begin_src c :tangle (eval c_test)
|
#+begin_src c :tangle (eval c_test)
|
||||||
const uint64_t Dim = 21;
|
const uint64_t Dim = 21;
|
||||||
const uint64_t LDS = (1 + (Dim) / SIMD_LENGTH) * SIMD_LENGTH;
|
const uint64_t LDS = (1+(Dim-1)/SIMD_LENGTH)*SIMD_LENGTH;
|
||||||
const double breakdown = 1e-3;
|
const double breakdown = 1e-3;
|
||||||
const double tolerance = 1e-3;
|
const double tolerance = 1e-3;
|
||||||
double res[441];
|
double res[441];
|
||||||
|
Loading…
Reference in New Issue
Block a user