Merge pull request #408 from hiddenSymmetries/avx512

Disable Avx512
hiddenSymmetries · Apr 29, 2024 · fe1087e · fe1087e
2 parents 295ac65 + f595c3d
commit fe1087e
Show file tree

Hide file tree

Showing 2 changed files with 4 additions and 1 deletion.
diff --git a/LICENSE b/LICENSE
@@ -19,3 +19,4 @@ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
 SOFTWARE.
+
diff --git a/src/simsoptpp/simdhelpers.h b/src/simsoptpp/simdhelpers.h
@@ -129,6 +129,7 @@ using AlignedPaddedVec = std::vector<double, AlignedPaddedAllocator<double>>;
 #endif
 
 #if defined(USE_XSIMD)
+/*
 #if __AVX512F__ 
 // On skylake _mm512_sqrt_pd takes 24 CPI and _mm512_div_pd takes 16 CPI, so
 // 1/sqrt(vec) takes 40 CPI. Instead we can use the approximate inverse square
@@ -147,6 +148,7 @@ inline simd_t rsqrt(simd_t r2){
   return rinv;
 }
 #else
+*/
 inline simd_t rsqrt(const simd_t& r2){
     //On my avx2 machine, computing the sqrt and then the inverse is actually a
     //bit faster. just keeping this line here to remind myself how to compute
@@ -155,7 +157,7 @@ inline simd_t rsqrt(const simd_t& r2){
     return 1./sqrt(r2);
 }
 
-#endif
+//#endif
 #endif
 
 inline double rsqrt(const double& r2){