oneapi-src
diff --git a/features/config/TEMPLATE_math_intel_specific.xml b/features/config/TEMPLATE_math_intel_specific.xml
Lines changed: 1 addition & 0 deletions
diff --git a/features/feature_case/math/intel_specific_math.yaml b/features/feature_case/math/intel_specific_math.yaml
Lines changed: 36 additions & 0 deletions
diff --git a/features/feature_case/math/math_intel_specific.cu b/features/feature_case/math/math_intel_specific.cu
Lines changed: 1 addition & 53 deletions
diff --git a/features/features.xml b/features/features.xml
Lines changed: 1 addition & 0 deletions
diff --git a/features/test_feature.py b/features/test_feature.py
Lines changed: 2 additions & 2 deletions
@@ -4,6 +4,7 @@
     <description>test</description>
     <files>
         <file path="feature_case/math/${testName}.cu" />
+        <file path="feature_case/math/intel_specific_math.yaml" />
     </files>
     <rules>
         <optlevelRule GPUFeature="NOT double" excludeOptlevelNameString="gpu" />
 
@@ -0,0 +1,36 @@
+# Copyright (C) Intel Corporation
+# SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
+# See https://llvm.org/LICENSE.txt for license information.
+
+# This file is installed to the folder:
+# {dpct_install_folder}/extensions/opt_rules.
+# The rules specified in this file can be imported with the command-line option:
+# --rule-file={dpct_install_folder}/extensions/opt_rules/intel_specific_math.yaml
+---
+- Rule: intel_specific_math_erfinv
+  Kind: API
+  Priority: Takeover
+  In: erfinv
+  Out: sycl::ext::intel::math::erfinv($1)
+  Includes: [<sycl/ext/intel/math.hpp>]
+
+- Rule: intel_specific_math_erfinvf
+  Kind: API
+  Priority: Takeover
+  In: erfinvf
+  Out: sycl::ext::intel::math::erfinv($1)
+  Includes: [<sycl/ext/intel/math.hpp>]
+
+- Rule: intel_specific_math_normcdff
+  Kind: API
+  Priority: Takeover
+  In: normcdff
+  Out: sycl::ext::intel::math::cdfnorm($1)
+  Includes: [<sycl/ext/intel/math.hpp>]
+
+- Rule: intel_specific_math_normcdf
+  Kind: API
+  Priority: Takeover
+  In: normcdf
+  Out: sycl::ext::intel::math::cdfnorm($1)
+  Includes: [<sycl/ext/intel/math.hpp>]
@@ -7,58 +7,24 @@
 //
 // ===----------------------------------------------------------------------===//
 // RUN: dpct --rule-file=%S/../../tools/dpct/DpctOptRules/intel_specific_math.yaml --format-range=none -out-root %T/math_specific_UDR_test %s --cuda-include-path="%cuda-path/include" -- -x cuda --cuda-host-only
-// RUN: FileCheck --input-file %T/math_specific_UDR_test/math_specific_UDR_test.dp.cpp --match-full-lines %s
-
-// CHECK: #include <CL/sycl.hpp>
-// CHECK: #include <dpct/dpct.hpp>
-
-// CHECK: #include <sycl/ext/intel/math.hpp>
 
 #include "cuda_fp16.h"
 #include <iostream>
-// CHECK: void kernelFunc(double *deviceArray) {
-// CHECK:   double &d0 = *deviceArray;
-// CHECK:   d0 = sycl::ext::intel::math::erfinv(d0);
-// CHECK:   d0 = sycl::ext::intel::math::cdfnorm(d0);
-// CHECK: }
+
 __global__ void kernelFunc(double *deviceArray) {
   double &d0 = *deviceArray;
   d0 = erfinv(d0);
   d0 = normcdf(d0);
 
 }
 
-// CHECK: void kernelFunc(float *deviceArray) {
-// CHECK:   float &f0 = *deviceArray;
-// CHECK:   f0 = sycl::ext::intel::math::erfinv(f0);
-// CHECK:   f0 = sycl::ext::intel::math::cdfnorm(f0);
-// CHECK: }
 __global__ void kernelFunc(float *deviceArray) {
   float &f0 = *deviceArray;
   f0 = erfinvf(f0);
   f0 = normcdff(f0);
 
 }
 
-
-// CHECK: void testDouble() {
-// CHECK:   dpct::device_ext &dev_ct1 = dpct::get_current_device();
-// CHECK:   sycl::queue &q_ct1 = dev_ct1.default_queue();
-// CHECK:   const unsigned int NUM = 1;
-// CHECK:   const unsigned int bytes = NUM * sizeof(double);
-// CHECK:   double *hostArrayDouble = (double *)malloc(bytes);
-// CHECK:   memset(hostArrayDouble, 0, bytes);
-// CHECK:   double *deviceArrayDouble;
-// CHECK:   deviceArrayDouble = (double *)sycl::malloc_device(bytes, q_ct1);
-// CHECK:   q_ct1.memcpy(deviceArrayDouble, hostArrayDouble, bytes).wait();
-// CHECK:   q_ct1.parallel_for(
-// CHECK:       sycl::nd_range<3>(sycl::range<3>(1, 1, 1), sycl::range<3>(1, 1, 1)),
-// CHECK:       [=](sycl::nd_item<3> item_ct1) {
-// CHECK:         kernelFunc(deviceArrayDouble);
-// CHECK:       });
-// CHECK:   q_ct1.memcpy(hostArrayDouble, deviceArrayDouble, bytes).wait();
-// CHECK:   sycl::free(deviceArrayDouble, q_ct1);
-// CHECK: }
 bool testDouble() {
   double *hostArrayDouble = (double *)malloc(sizeof(double));
   *hostArrayDouble = 0.956841;
@@ -76,24 +42,6 @@ bool testDouble() {
   return true;
 }
 
-// CHECK: void testFloat() {
-// CHECK:   dpct::device_ext &dev_ct1 = dpct::get_current_device();
-// CHECK:   sycl::queue &q_ct1 = dev_ct1.default_queue();
-// CHECK:   const unsigned int NUM = 1;
-// CHECK:   const unsigned int bytes = NUM * sizeof(float);
-// CHECK:   float *hostArrayFloat = (float *)malloc(bytes);
-// CHECK:   memset(hostArrayFloat, 0, bytes);
-// CHECK:   float *deviceArrayFloat;
-// CHECK:   deviceArrayFloat = (float *)sycl::malloc_device(bytes, q_ct1);
-// CHECK:   q_ct1.memcpy(deviceArrayFloat, hostArrayFloat, bytes).wait();
-// CHECK:   q_ct1.parallel_for(
-// CHECK:       sycl::nd_range<3>(sycl::range<3>(1, 1, 1), sycl::range<3>(1, 1, 1)),
-// CHECK:       [=](sycl::nd_item<3> item_ct1) {
-// CHECK:         kernelFunc(deviceArrayFloat);
-// CHECK:       });
-// CHECK:   q_ct1.memcpy(hostArrayFloat, deviceArrayFloat, bytes).wait();
-// CHECK:   sycl::free(deviceArrayFloat, q_ct1);
-// CHECK: }
 bool testFloat() {
   float *hostArrayFloat = (float *)malloc(sizeof(float));
   *hostArrayFloat = 0.1568541541f;
 
@@ -359,5 +359,6 @@
     <test testName="libcu_atomic" configFile="config/TEMPLATE_libcu.xml" />
     <test testName="pointer_attributes" configFile="config/TEMPLATE_pointer_attributes.xml" />
     <test testName="image" configFile="config/TEMPLATE_image.xml" />
+    <test testName="math_intel_specific" configFile="config/TEMPLATE_math_intel_specific.xml" />
   </tests>
 </suite>
@@ -64,7 +64,7 @@ def migrate_test():
     if test_config.current_test in logical_group_exper:
         src.append(' --use-experimental-features=logical-group ')
     if test_config.current_test == 'math_intel_specific':
-        src.append(' --rule-file=$(dirname $(which dpct))/../extensions/opt_rules/intel_specific_math.yaml ')
+        src.append(' --rule-file=./math_intel_specific/intel_specific_math.yaml')
 
     return do_migrate(src, in_root, test_config.out_root, extra_args)
 
@@ -125,6 +125,6 @@ def run_test():
         return True
     os.environ['SYCL_DEVICE_FILTER'] = test_config.device_filter
     if test_config.current_test == 'ccl':
-        return call_subprocess('mpirun -n 2 ' + os.path.join(os.path.curdir, test_config.current_test + '.run '));
+        return call_subprocess('mpirun -n 2 ' + os.path.join(os.path.curdir, test_config.current_test + '.run '))
     return run_binary_with_args()