uxlfoundation · kala855 · Oct 9, 2024 · Sep 30, 2024 · mgouicem · Oct 10, 2024
@@ -84,9 +84,13 @@ status_t ref_batch_normalization_fwd_t::init(impl::engine_t *engine) {
                 = ::sycl::get_kernel_id<batch_normalization_fwd_kernel_vec_t>();
         CHECK(create_kernel(engine, kid, &kernel_));
     } else {
+        // Enable IEEE-compliant (correctly rounded) fp32 divide and sqrt.
+        setenv("SYCL_PROGRAM_COMPILE_OPTIONS",
+                "-cl-fp32-correctly-rounded-divide-sqrt", 1);
         const auto kid = ::sycl::get_kernel_id<
                 batch_normalization_fwd_kernel_vec_t1>();
         CHECK(create_kernel(engine, kid, &kernel_));
+        unsetenv("SYCL_PROGRAM_COMPILE_OPTIONS");
     }
     return status::success;
 }

@@ -82,9 +82,13 @@ status_t ref_layer_normalization_fwd_t::init(impl::engine_t *engine) {
                 = ::sycl::get_kernel_id<layer_normalization_fwd_kernel_vec_t>();
         CHECK(create_kernel(engine, kid, &kernel_));
     } else {
+        // Enable IEEE-compliant (correctly rounded) fp32 divide and sqrt.
+        setenv("SYCL_PROGRAM_COMPILE_OPTIONS",
+                "-cl-fp32-correctly-rounded-divide-sqrt", 1);
         const auto kid = ::sycl::get_kernel_id<
                 layer_normalization_fwd_kernel_vec1_t>();
         CHECK(create_kernel(engine, kid, &kernel_));
+        unsetenv("SYCL_PROGRAM_COMPILE_OPTIONS");
     }
     return status::success;
 }

@@ -450,7 +450,17 @@ void setup_cmp(compare::compare_t &cmp, const prb_t *prb, data_kind_t kind,
     // exceeds `digits_f32`.
     const int safe_digits = MAX2(0, digits_dt(dnnl_f32) - digits_dt(dt));
     const float trh_coeff = (1 << safe_digits);
+    // The following code is a workaround for a SYCL compiler bug
+    // that causes precision issues.
+#ifdef DNNL_WITH_SYCL
+    float trh = trh_coeff
+            * ((kind == SRC || kind == DST
+                       || (kind == VAR && prb->dir & FLAG_FWD))
+                            ? 5e-7
+                            : 0);
+#else
     float trh = trh_coeff * ((kind == SRC || kind == DST) ? 5e-7 : 0);
+#endif
     if ((kind == SC || kind == SH) && prb->dir & FLAG_BWD)
         trh = trh_coeff * 5e-6;
     cmp.set_threshold(trh);