File tree 2 files changed +10
-0
lines changed
2 files changed +10
-0
lines changed Original file line number Diff line number Diff line change @@ -892,6 +892,14 @@ endif()
892
892
893
893
if (USE_SLEEF_FOR_ARM_VEC256)
894
894
string (APPEND CMAKE_CXX_FLAGS " -DAT_BUILD_ARM_VEC256_WITH_SLEEF" )
895
+ add_definitions (-DAT_BUILD_ARM_VEC256_WITH_SLEEF)
896
+ endif ()
897
+
898
+ # Enable sleef on macOS with Apple silicon by default
899
+ if ((${CMAKE_SYSTEM_NAME} STREQUAL "Darwin" ) AND (${CMAKE_SYSTEM_PROCESSOR} STREQUAL "arm64" ))
900
+ message (STATUS "Running on macOS with Apple silicon" )
901
+ string (APPEND CMAKE_CXX_FLAGS " -DAT_BUILD_ARM_VEC256_WITH_SLEEF" )
902
+ add_definitions (-DAT_BUILD_ARM_VEC256_WITH_SLEEF)
895
903
endif ()
896
904
897
905
if (USE_XNNPACK)
Original file line number Diff line number Diff line change @@ -1327,6 +1327,8 @@ def __bool__(self) -> bool:
1327
1327
class VecNEON (VecISA ):
1328
1328
_bit_width = 256 # This is required to leverage the compute implemented in aten/src/ATen/cpu/vec/vec256/vec256_float_neon.h
1329
1329
_macro = "-DCPU_CAPABILITY_NEON"
1330
+ if sys .platform == "darwin" and platform .processor () == "arm" :
1331
+ _macro += " -DAT_BUILD_ARM_VEC256_WITH_SLEEF"
1330
1332
_arch_flags = "" # Unused
1331
1333
_dtype_nelements = {torch .float : 8 , torch .bfloat16 : 16 , torch .float16 : 16 }
1332
1334
You can’t perform that action at this time.
0 commit comments