Add support for fast math compiler flags when building ArrayFire

umar456 · umar456 · commit 45b6a3f585e9 · 2022-11-22T12:27:57.000-05:00
diff --git a/CMakeLists.txt b/CMakeLists.txt
@@ -92,6 +92,7 @@ option(AF_WITH_STATIC_MKL "Link against static Intel MKL libraries" OFF)
 option(AF_WITH_STATIC_CUDA_NUMERIC_LIBS "Link libafcuda with static numeric libraries(cublas, cufft, etc.)" OFF)
 option(AF_WITH_SPDLOG_HEADER_ONLY "Build ArrayFire with header only version of spdlog" OFF)
 option(AF_WITH_FMT_HEADER_ONLY "Build ArrayFire with header only version of fmt" OFF)
+option(AF_WITH_FAST_MATH "Use lower precision but high performance numeric optimizations" OFF)
 
 if(AF_WITH_STATIC_CUDA_NUMERIC_LIBS)
   option(AF_WITH_PRUNE_STATIC_CUDA_NUMERIC_LIBS "Prune CUDA static libraries to reduce binary size.(WARNING: May break some libs on older CUDA toolkits for some compute arch)" OFF)
diff --git a/CMakeModules/InternalUtils.cmake b/CMakeModules/InternalUtils.cmake
@@ -25,6 +25,13 @@ if(WIN32)
   check_cxx_compiler_flag(/permissive- cxx_compliance)
 endif()
 
+check_cxx_compiler_flag(-ffast-math has_cxx_fast_math)
+check_cxx_compiler_flag("-fp-model fast" has_cxx_fp_model)
+check_cxx_compiler_flag(-fno-errno-math has_cxx_no_errno_math)
+check_cxx_compiler_flag(-fno-trapping-math  has_cxx_no_trapping_math)
+check_cxx_compiler_flag(-fno-signed-zeros  has_cxx_no_signed_zeros)
+check_cxx_compiler_flag(-mno-ieee-fp has_cxx_no_ieee_fp)
+
 function(arrayfire_set_default_cxx_flags target)
   target_compile_options(${target}
     PRIVATE
@@ -51,7 +58,19 @@ function(arrayfire_set_default_cxx_flags target)
               # ignored attribute warnings in the OpenCL
               # headers
               $<$<BOOL:${has_ignored_attributes_flag}>:-Wno-ignored-attributes>
-              $<$<BOOL:${has_all_warnings_flag}>:-Wall>>
+              $<$<BOOL:${has_all_warnings_flag}>:-Wall>
+
+              $<$<BOOL:${AF_WITH_FAST_MATH}>:
+                  $<$<BOOL:${has_cxx_fast_math}>:-ffast-math>
+                  $<$<BOOL:${has_cxx_no_errno_math}>:-fno-errno-math>
+                  $<$<BOOL:${has_cxx_no_trapping_math}>:-fno-trapping-math>
+                  $<$<BOOL:${has_cxx_no_signed_zeros}>:-fno-signed-zeros>
+                  $<$<BOOL:${has_cxx_no_ieee_fp}>:-mno-ieee-fp>
+                  >
+
+              $<$<NOT:$<BOOL:${AF_WITH_FAST_MATH}>>:
+                    $<$<BOOL:${has_cxx_fp_model}>:-fp-model precise>>
+                      >
     )
 
   target_compile_definitions(${target}
@@ -65,6 +84,7 @@ function(arrayfire_set_default_cxx_flags target)
 
       $<$<BOOL:${AF_WITH_LOGGING}>:           AF_WITH_LOGGING>
       $<$<BOOL:${AF_CACHE_KERNELS_TO_DISK}>:  AF_CACHE_KERNELS_TO_DISK>
+      $<$<BOOL:${AF_WITH_FAST_MATH}>:         AF_WITH_FAST_MATH>
   )
 endfunction()
 
diff --git a/test/CMakeLists.txt b/test/CMakeLists.txt
@@ -124,6 +124,10 @@ target_include_directories(arrayfire_test
 # The tautological-constant-compare warning is always thrown for std::nan
 # and std::info calls. Its unnecessarily verbose.
 target_compile_options(arrayfire_test
+  PUBLIC
+    # Intel compilers enable fast math by default, which ignores special
+    # floating-point values such as NaN and Inf; force the precise model here.
+    $<$<BOOL:${has_cxx_fp_model}>:-fp-model precise>
   PRIVATE
     $<$<BOOL:${has_tautological_constant_compare_flag}>:-Wno-tautological-constant-compare>
     $<$<CXX_COMPILER_ID:MSVC>: /bigobj
@@ -137,6 +141,8 @@ if(WIN32)
 endif()
 
 target_compile_definitions(arrayfire_test
+  PUBLIC
+    $<$<BOOL:${AF_WITH_FAST_MATH}>:AF_WITH_FAST_MATH>
   PRIVATE
     TEST_RESULT_IMAGE_DIR="${CMAKE_BINARY_DIR}/test/"
     USE_MTX)
diff --git a/test/approx1.cpp b/test/approx1.cpp
@@ -777,6 +777,9 @@ TEST(Approx1, CPPUniformInvalidStepSize) {
 // specified by the user, ArrayFire will assume a regular grid with a
 // starting index of 0 and a step value of 1.
 TEST(Approx1, CPPInfCheck) {
+#ifdef __INTEL_LLVM_COMPILER
+    SKIP_IF_FAST_MATH_ENABLED();
+#endif
     array sampled(seq(0.0, 5.0, 0.5));
     sampled(0) = af::Inf;
     seq xo(0.0, 2.0, 0.25);
@@ -799,6 +802,9 @@ TEST(Approx1, CPPInfCheck) {
 }
 
 TEST(Approx1, CPPUniformInfCheck) {
+#ifdef __INTEL_LLVM_COMPILER
+    SKIP_IF_FAST_MATH_ENABLED();
+#endif
     array sampled(seq(10.0, 50.0, 10.0));
     sampled(0) = af::Inf;
     seq xo(0.0, 8.0, 2.0);
diff --git a/test/half.cpp b/test/half.cpp
@@ -87,6 +87,7 @@ TEST(Half, arith) {
 
 TEST(Half, isInf) {
     SUPPORTED_TYPE_CHECK(af_half);
+    SKIP_IF_FAST_MATH_ENABLED();
     half_float::half hinf = std::numeric_limits<half_float::half>::infinity();
 
     vector<half_float::half> input(2, half_float::half(0));
@@ -105,6 +106,7 @@ TEST(Half, isInf) {
 
 TEST(Half, isNan) {
     SUPPORTED_TYPE_CHECK(af_half);
+    SKIP_IF_FAST_MATH_ENABLED();
     half_float::half hnan = std::numeric_limits<half_float::half>::quiet_NaN();
 
     vector<half_float::half> input(2, half_float::half(0));
diff --git a/test/imageio.cpp b/test/imageio.cpp
@@ -289,17 +289,17 @@ TEST(ImageIO, SaveImage16CPP) {
     dim4 dims(16, 24, 3);
 
     array input     = randu(dims, u16);
-    array input_255 = (input / 257).as(u16);
+    array input_255 = floor(input.as(f32) / 257);
 
     std::string testname  = getTestName() + "_" + getBackendName();
     std::string imagename = "saveImage16CPP_" + testname + ".png";
 
     saveImage(imagename.c_str(), input);
 
     array img = loadImage(imagename.c_str(), true);
-    ASSERT_EQ(img.type(), f32);  // loadImage should always return float
 
-    ASSERT_FALSE(anyTrue<bool>(abs(img - input_255)));
+    ASSERT_EQ(img.type(), f32);  // loadImage should always return float
+    ASSERT_IMAGES_NEAR(input_255, img, 0.001);
 }
 
 ////////////////////////////////////////////////////////////////////////////////
diff --git a/test/ireduce.cpp b/test/ireduce.cpp
@@ -192,6 +192,7 @@ TEST(IndexedReduce, MaxReduceDimensionHasSingleValue) {
 }
 
 TEST(IndexedReduce, MinNaN) {
+    SKIP_IF_FAST_MATH_ENABLED();
     float test_data[] = {1.f, NAN, 5.f, 0.1f, NAN, -0.5f, NAN, 0.f};
     int rows          = 4;
     int cols          = 2;
@@ -218,6 +219,7 @@ TEST(IndexedReduce, MinNaN) {
 }
 
 TEST(IndexedReduce, MaxNaN) {
+    SKIP_IF_FAST_MATH_ENABLED();
     float test_data[] = {1.f, NAN, 5.f, 0.1f, NAN, -0.5f, NAN, 0.f};
     int rows          = 4;
     int cols          = 2;
@@ -244,6 +246,7 @@ TEST(IndexedReduce, MaxNaN) {
 }
 
 TEST(IndexedReduce, MinCplxNaN) {
+    SKIP_IF_FAST_MATH_ENABLED();
     float real_wnan_data[] = {0.005f, NAN, -6.3f, NAN,      -0.5f,
                               NAN,    NAN, 0.2f,  -1205.4f, 8.9f};
 
@@ -279,6 +282,7 @@ TEST(IndexedReduce, MinCplxNaN) {
 }
 
 TEST(IndexedReduce, MaxCplxNaN) {
+    SKIP_IF_FAST_MATH_ENABLED();
     float real_wnan_data[] = {0.005f, NAN, -6.3f, NAN,      -0.5f,
                               NAN,    NAN, 0.2f,  -1205.4f, 8.9f};
 
diff --git a/test/meanvar.cpp b/test/meanvar.cpp
@@ -131,7 +131,7 @@ class MeanVarTyped : public ::testing::TestWithParam<meanvar_test<T>> {
             ASSERT_VEC_ARRAY_NEAR(test.variance_, outDim, var, 0.5f);
         } else if (is_same_type<float, outType<T>>::value ||
                    is_same_type<cfloat, outType<T>>::value) {
-            ASSERT_VEC_ARRAY_NEAR(test.mean_, outDim, mean, 0.001f);
+            ASSERT_VEC_ARRAY_NEAR(test.mean_, outDim, mean, 0.0016f);
             ASSERT_VEC_ARRAY_NEAR(test.variance_, outDim, var, 0.2f);
         } else {
             ASSERT_VEC_ARRAY_NEAR(test.mean_, outDim, mean, 0.00001f);
@@ -171,7 +171,7 @@ class MeanVarTyped : public ::testing::TestWithParam<meanvar_test<T>> {
             ASSERT_VEC_ARRAY_NEAR(test.variance_, outDim, var, 0.5f);
         } else if (is_same_type<float, outType<T>>::value ||
                    is_same_type<cfloat, outType<T>>::value) {
-            ASSERT_VEC_ARRAY_NEAR(test.mean_, outDim, mean, 0.001f);
+            ASSERT_VEC_ARRAY_NEAR(test.mean_, outDim, mean, 0.0016f);
             ASSERT_VEC_ARRAY_NEAR(test.variance_, outDim, var, 0.2f);
         } else {
             ASSERT_VEC_ARRAY_NEAR(test.mean_, outDim, mean, 0.00001f);
diff --git a/test/median.cpp b/test/median.cpp
@@ -93,20 +93,21 @@ void median_test(int nx, int ny = 1, int nz = 1, int nw = 1) {
 
     if (sa.dims(dim) % 2 == 1) {
         mSeq[dim] = mSeq[dim] - 1.0;
+        sa        = sa.as((af_dtype)dtype_traits<To>::af_type);
         verify    = sa(mSeq[0], mSeq[1], mSeq[2], mSeq[3]);
     } else {
         dim_t sdim[4] = {0};
         sdim[dim]     = 1;
         sa            = sa.as((af_dtype)dtype_traits<To>::af_type);
         array sas     = shift(sa, sdim[0], sdim[1], sdim[2], sdim[3]);
-        verify        = ((sa + sas) / 2)(mSeq[0], mSeq[1], mSeq[2], mSeq[3]);
+        verify = ((sa + sas) / To(2))(mSeq[0], mSeq[1], mSeq[2], mSeq[3]);
     }
 
     // Test Part
     array out = median(a, dim);
 
     ASSERT_EQ(out.dims() == verify.dims(), true);
-    ASSERT_NEAR(0, sum<double>(abs(out - verify)), 1e-5);
+    ASSERT_ARRAYS_EQ(verify, out);
 }
 
 #define MEDIAN_FLAT(To, Ti)                                                    \
diff --git a/test/reduce.cpp b/test/reduce.cpp
@@ -779,6 +779,7 @@ TEST(ReduceByKey, countReduceByKey) {
 }
 
 TEST(ReduceByKey, ReduceByKeyNans) {
+    SKIP_IF_FAST_MATH_ENABLED();
     const static int testSz      = 8;
     const int testKeys[testSz]   = {0, 2, 2, 9, 5, 5, 5, 8};
     const float testVals[testSz] = {0, 7, NAN, 6, 2, 5, 3, 4};
@@ -1072,6 +1073,7 @@ TYPED_TEST(Reduce, Test_Any_Global) {
 }
 
 TEST(MinMax, MinMaxNaN) {
+    SKIP_IF_FAST_MATH_ENABLED();
     const int num      = 10000;
     array A            = randu(num);
     A(where(A < 0.25)) = NaN;
@@ -1095,6 +1097,7 @@ TEST(MinMax, MinMaxNaN) {
 }
 
 TEST(MinMax, MinCplxNaN) {
+    SKIP_IF_FAST_MATH_ENABLED();
     float real_wnan_data[] = {0.005f, NAN, -6.3f, NAN,      -0.5f,
                               NAN,    NAN, 0.2f,  -1205.4f, 8.9f};
 
@@ -1122,6 +1125,7 @@ TEST(MinMax, MinCplxNaN) {
 }
 
 TEST(MinMax, MaxCplxNaN) {
+    SKIP_IF_FAST_MATH_ENABLED();
     // 4th element is unusually large to cover the case where
     //  one part holds the largest value among the array,
     //  and the other part is NaN.
@@ -1158,6 +1162,7 @@ TEST(MinMax, MaxCplxNaN) {
 }
 
 TEST(Count, NaN) {
+    SKIP_IF_FAST_MATH_ENABLED();
     const int num = 10000;
     array A       = round(5 * randu(num));
     array B       = A;
@@ -1168,6 +1173,7 @@ TEST(Count, NaN) {
 }
 
 TEST(Sum, NaN) {
+    SKIP_IF_FAST_MATH_ENABLED();
     const int num      = 10000;
     array A            = randu(num);
     A(where(A < 0.25)) = NaN;
@@ -1187,6 +1193,7 @@ TEST(Sum, NaN) {
 }
 
 TEST(Product, NaN) {
+    SKIP_IF_FAST_MATH_ENABLED();
     const int num = 5;
     array A       = randu(num);
     A(2)          = NaN;
@@ -1206,6 +1213,7 @@ TEST(Product, NaN) {
 }
 
 TEST(AnyAll, NaN) {
+    SKIP_IF_FAST_MATH_ENABLED();
     const int num = 10000;
     array A       = (randu(num) > 0.5).as(f32);
     array B       = A;
@@ -2263,6 +2271,7 @@ TYPED_TEST(Reduce, Test_Any_Global_Array) {
 
 
 TEST(Reduce, Test_Sum_Global_Array_nanval) {
+    SKIP_IF_FAST_MATH_ENABLED();
     const int num = 100000;
     array a = af::randn(num, 2, 34, 4);
     a(1, 0, 0, 0) = NAN;
diff --git a/test/replace.cpp b/test/replace.cpp
@@ -113,6 +113,7 @@ TYPED_TEST(Replace, Simple) { replaceTest<TypeParam>(dim4(1024, 1024)); }
 TYPED_TEST(Replace, Scalar) { replaceScalarTest<TypeParam>(dim4(5, 5)); }
 
 TEST(Replace, NaN) {
+    SKIP_IF_FAST_MATH_ENABLED();
     dim4 dims(1000, 1250);
     dtype ty = f32;
 
diff --git a/test/select.cpp b/test/select.cpp
@@ -130,6 +130,7 @@ TYPED_TEST(Select, LeftScalar) {
 }
 
 TEST(Select, NaN) {
+    SKIP_IF_FAST_MATH_ENABLED();
     dim4 dims(1000, 1250);
     dtype ty = f32;
 
diff --git a/test/testHelpers.hpp b/test/testHelpers.hpp
@@ -223,9 +223,18 @@ bool noDoubleTests(af::dtype ty);
 
 bool noHalfTests(af::dtype ty);
 
-#define SUPPORTED_TYPE_CHECK(type)                                        \
-    if (noDoubleTests((af_dtype)af::dtype_traits<type>::af_type)) return; \
-    if (noHalfTests((af_dtype)af::dtype_traits<type>::af_type)) return;
+#define SUPPORTED_TYPE_CHECK(type)                                \
+    if (noDoubleTests((af_dtype)af::dtype_traits<type>::af_type)) \
+        GTEST_SKIP() << "Device doesn't support Doubles";         \
+    if (noHalfTests((af_dtype)af::dtype_traits<type>::af_type))   \
+        GTEST_SKIP() << "Device doesn't support Half";
+
+#ifdef AF_WITH_FAST_MATH
+#define SKIP_IF_FAST_MATH_ENABLED() \
+    GTEST_SKIP() << "ArrayFire compiled with AF_WITH_FAST_MATH"
+#else
+#define SKIP_IF_FAST_MATH_ENABLED()
+#endif
 
 bool noImageIOTests();
 
diff --git a/test/threading.cpp b/test/threading.cpp
@@ -53,7 +53,7 @@ void calc(ArithOp opcode, array op1, array op2, float outValue,
     vector<float> out(res.elements());
     res.host((void*)out.data());
 
-    for (unsigned i = 0; i < out.size(); ++i) ASSERT_EQ(out[i], outValue);
+    for (unsigned i = 0; i < out.size(); ++i) ASSERT_FLOAT_EQ(out[i], outValue);
     af::sync();
 }
 

Original file line number	Diff line number	Diff line change
`@@ -192,6 +192,7 @@ TEST(IndexedReduce, MaxReduceDimensionHasSingleValue) {`
`192`	`192`	`}`
`193`	`193`
`194`	`194`	`TEST(IndexedReduce, MinNaN) {`
	`195`	`+ SKIP_IF_FAST_MATH_ENABLED();`
`195`	`196`	`float test_data[] = {1.f, NAN, 5.f, 0.1f, NAN, -0.5f, NAN, 0.f};`
`196`	`197`	`int rows = 4;`
`197`	`198`	`int cols = 2;`
`@@ -218,6 +219,7 @@ TEST(IndexedReduce, MinNaN) {`
`218`	`219`	`}`
`219`	`220`
`220`	`221`	`TEST(IndexedReduce, MaxNaN) {`
	`222`	`+ SKIP_IF_FAST_MATH_ENABLED();`
`221`	`223`	`float test_data[] = {1.f, NAN, 5.f, 0.1f, NAN, -0.5f, NAN, 0.f};`
`222`	`224`	`int rows = 4;`
`223`	`225`	`int cols = 2;`
`@@ -244,6 +246,7 @@ TEST(IndexedReduce, MaxNaN) {`
`244`	`246`	`}`
`245`	`247`
`246`	`248`	`TEST(IndexedReduce, MinCplxNaN) {`
	`249`	`+ SKIP_IF_FAST_MATH_ENABLED();`
`247`	`250`	`float real_wnan_data[] = {0.005f, NAN, -6.3f, NAN, -0.5f,`
`248`	`251`	`NAN, NAN, 0.2f, -1205.4f, 8.9f};`
`249`	`252`
`@@ -279,6 +282,7 @@ TEST(IndexedReduce, MinCplxNaN) {`
`279`	`282`	`}`
`280`	`283`
`281`	`284`	`TEST(IndexedReduce, MaxCplxNaN) {`
	`285`	`+ SKIP_IF_FAST_MATH_ENABLED();`
`282`	`286`	`float real_wnan_data[] = {0.005f, NAN, -6.3f, NAN, -0.5f,`
`283`	`287`	`NAN, NAN, 0.2f, -1205.4f, 8.9f};`
`284`	`288`