Use SIMDe for NEON acceleration

This commit is contained in:
Cameron Gutman
2026-02-19 00:05:29 -06:00
parent de364b6ecd
commit 5551d29ba2
5 changed files with 9 additions and 4 deletions

View File

@@ -8,8 +8,7 @@
#define OBLAS_SSE3
#else
#if defined(__aarch64__) || (defined(_MSC_VER) && defined(_M_ARM64))
// To be replaced with SIMDe
// #define OBLAS_NEON
#define OBLAS_NEON
#endif
#endif
#endif

View File

@@ -176,7 +176,8 @@ void obl_axpyb32_ref(u8 *a, u32 *b, u8 u, unsigned k)
#else
#if defined(OBLAS_SSE3) || defined(OBLAS_NEON)
#if defined(OBLAS_NEON)
#include "sse2neon/sse2neon.h"
#define SIMDE_ENABLE_NATIVE_ALIASES
#include <simde/x86/ssse3.h>
#else
#include <emmintrin.h>
#include <tmmintrin.h>

1
nanors/deps/simde Submodule

Submodule nanors/deps/simde added at 595b743dce