IntelPython · vlad-perevezentsev · Feb 10, 2025 · Feb 10, 2025 · Feb 10, 2025 · Feb 11, 2025
@@ -71,31 +71,61 @@ option(DPNP_TARGET_CUDA
     "Build DPNP to target CUDA devices"
     OFF
 )
+option(DPNP_TARGET_HIP
+    "Build DPNP to target HIP devices"
+    OFF
+)
 option(DPNP_USE_ONEMKL_INTERFACES
     "Build DPNP with oneMKL Interfaces"
     OFF
 )
+set(HIP_TARGETS "" CACHE STRING "HIP architecture for target")
+
 set(_dpnp_sycl_targets)
+set(_dpnp_amd_targets)
+set(_use_onemkl_interfaces OFF)
 set(_use_onemkl_interfaces_cuda OFF)
+set(_use_onemkl_interfaces_hip OFF)
+
+set(_dpnp_sycl_target_compile_options)
+set(_dpnp_sycl_target_link_options)
+
 if ("x${DPNP_SYCL_TARGETS}" STREQUAL "x")
-   if(DPNP_TARGET_CUDA)
-      set(_dpnp_sycl_targets "nvptx64-nvidia-cuda,spir64-unknown-unknown")
-      set(_use_onemkl_interfaces_cuda ON)
-   else()
-      if(DEFINED ENV{DPNP_TARGET_CUDA})
-          set(_dpnp_sycl_targets "nvptx64-nvidia-cuda,spir64-unknown-unknown")
-          set(_use_onemkl_interfaces_cuda ON)
-      endif()
-   endif()
+    if(DPNP_TARGET_CUDA)
+        set(_dpnp_sycl_targets "nvptx64-nvidia-cuda,spir64-unknown-unknown")
+        set(_use_onemkl_interfaces_cuda ON)
+    endif()
+    if(DPNP_TARGET_HIP)
+        if (NOT "x${HIP_TARGETS}" STREQUAL "x")
+            set(_dpnp_amd_targets ${HIP_TARGETS})
+            set(_use_onemkl_interfaces_hip ON)
+            if(_dpnp_sycl_targets)
+                set(_dpnp_sycl_targets "amdgcn-amd-amdhsa,${_dpnp_sycl_targets}")
+            else()
+                set(_dpnp_sycl_targets "amdgcn-amd-amdhsa,spir64-unknown-unknown")
+            endif()
+        else()
+            message(FATAL_ERROR "HIP_TARGETS must be specified when using HIP backend")
+        endif()
+    endif()
 else()
-   set(_dpnp_sycl_targets ${DPNP_SYCL_TARGETS})
+    set(_dpnp_sycl_targets ${DPNP_SYCL_TARGETS})
+    if (NOT "x${HIP_TARGETS}" STREQUAL "x")
+        set(_dpnp_amd_targets ${HIP_TARGETS})
+        set(_use_onemkl_interfaces_hip ON)
+    endif()
 endif()
 
-if(_dpnp_sycl_targets)
+if (_dpnp_sycl_targets)
    message(STATUS "Compiling for -fsycl-targets=${_dpnp_sycl_targets}")
+   list(APPEND _dpnp_sycl_target_compile_options -fsycl-targets=${_dpnp_sycl_targets})
+   list(APPEND _dpnp_sycl_target_link_options -fsycl-targets=${_dpnp_sycl_targets})
+   if(_dpnp_amd_targets)
+      list(APPEND _dpnp_sycl_target_compile_options -Xsycl-target-backend=amdgcn-amd-amdhsa --offload-arch=${_dpnp_amd_targets})
+      list(APPEND _dpnp_sycl_target_link_options -Xsycl-target-backend=amdgcn-amd-amdhsa --offload-arch=${_dpnp_amd_targets})
+   endif()
 endif()
 
-set(_use_onemkl_interfaces OFF)
 if(DPNP_USE_ONEMKL_INTERFACES)
     set(_use_onemkl_interfaces ON)
 else()
@@ -107,13 +137,20 @@ endif()
 if(_use_onemkl_interfaces)
     set(BUILD_FUNCTIONAL_TESTS False)
     set(BUILD_EXAMPLES False)
+    set(ENABLE_MKLGPU_BACKEND True)
+    set(ENABLE_MKLCPU_BACKEND True)
+
     if(_use_onemkl_interfaces_cuda)
         set(ENABLE_CUBLAS_BACKEND True)
         set(ENABLE_CUSOLVER_BACKEND True)
         set(ENABLE_CUFFT_BACKEND True)
         # set(ENABLE_CURAND_BACKEND True)
-        set(ENABLE_MKLGPU_BACKEND True)
-        set(ENABLE_MKLCPU_BACKEND True)
+    endif()
+    if(_use_onemkl_interfaces_hip)
+        set(ENABLE_ROCBLAS_BACKEND True)
+        set(ENABLE_ROCSOLVER_BACKEND True)
+        set(ENABLE_ROCFFT_BACKEND True)
+        # set(ENABLE_ROCRAND_BACKEND True)
     endif()
 
     if(DPNP_ONEMKL_INTERFACES_DIR)

@@ -38,12 +38,12 @@ if(_dpnp_sycl_targets)
     target_compile_options(
         ${python_module_name}
         PRIVATE
-        -fsycl-targets=${_dpnp_sycl_targets}
+        ${_dpnp_sycl_target_compile_options}
     )
     target_link_options(
         ${python_module_name}
         PRIVATE
-        -fsycl-targets=${_dpnp_sycl_targets}
+        ${_dpnp_sycl_target_link_options}
     )
 endif()
 

@@ -45,12 +45,12 @@ if(_dpnp_sycl_targets)
     target_compile_options(
         ${python_module_name}
         PRIVATE
-        -fsycl-targets=${_dpnp_sycl_targets}
+        ${_dpnp_sycl_target_compile_options}
     )
     target_link_options(
         ${python_module_name}
         PRIVATE
-        -fsycl-targets=${_dpnp_sycl_targets}
+        ${_dpnp_sycl_target_link_options}
     )
 endif()
 

@@ -77,12 +77,12 @@ if(_dpnp_sycl_targets)
   target_compile_options(
     ${python_module_name}
     PRIVATE
-    -fsycl-targets=${_dpnp_sycl_targets}
+    ${_dpnp_sycl_target_compile_options}
   )
   target_link_options(
     ${python_module_name}
     PRIVATE
-    -fsycl-targets=${_dpnp_sycl_targets}
+    ${_dpnp_sycl_target_link_options}
   )
 endif()
 

@@ -39,6 +39,7 @@ def run(
     verbose=False,
     cmake_opts="",
     target="intel",
+    arch=None,
     onemkl_interfaces=False,
     onemkl_interfaces_dir=None,
 ):
@@ -104,6 +105,16 @@ def run(
         # Always builds using oneMKL interfaces for the cuda target
         onemkl_interfaces = True
 
+    if target == "hip":
+        if not arch:
+            raise ValueError("--arch is required when --target=hip")
+        cmake_args += [
+            "-DDPNP_TARGET_HIP=ON",
+            f"-DHIP_TARGETS={arch}",
+        ]
+        # Always builds using oneMKL interfaces for the hip target
+        onemkl_interfaces = True
+
     if onemkl_interfaces:
         cmake_args += [
             "-DDPNP_USE_ONEMKL_INTERFACES=ON",
@@ -177,6 +188,12 @@ def run(
         default="intel",
         type=str,
     )
+    driver.add_argument(
+        "--arch",
+        help="Architecture for HIP target",
+        dest="arch",
+        type=str,
+    )
     driver.add_argument(
         "--onemkl-interfaces",
         help="Build using oneMKL Interfaces",
@@ -244,6 +261,7 @@ def run(
         verbose=args.verbose,
         cmake_opts=args.cmake_opts,
         target=args.target,
+        arch=args.arch,
         onemkl_interfaces=args.onemkl_interfaces,
         onemkl_interfaces_dir=args.onemkl_interfaces_dir,
     )