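File rocprim-add-gfx11XX.patch of Package rocprim
Summary of the changes in this patch:
  CMakeLists.txt: appends gfx1103 to the default target list that is used when GPU_TARGETS is "all".
  rmake.py: changes the default of -a/--architecture to "gfx1100;gfx1101;gfx1102;gfx1103" (gfx906 and gfx1030 are no longer part of the default) and updates the help text to state the new default.
  rocprim/include/rocprim/device/config_types.hpp: get_target_arch_from_name now also recognises the names gfx1100, gfx1101 and gfx1103; together with gfx1102 they all map to target_arch::gfx1102.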
diff --git a/CMakeLists.txt b/CMakeLists.txt
index bdff5831..bb9fcc21 100644
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -91,7 +91,7 @@ if(NOT USE_HIP_CPU)
if(GPU_TARGETS STREQUAL "all")
rocm_check_target_ids(DEFAULT_AMDGPU_TARGETS
- TARGETS "gfx803;gfx900:xnack-;gfx906:xnack-;gfx908:xnack-;gfx90a:xnack-;gfx90a:xnack+;gfx940;gfx941;gfx942;gfx1030;gfx1100;gfx1101;gfx1102"
+ TARGETS "gfx803;gfx900:xnack-;gfx906:xnack-;gfx908:xnack-;gfx90a:xnack-;gfx90a:xnack+;gfx940;gfx941;gfx942;gfx1030;gfx1100;gfx1101;gfx1102;gfx1103"
)
set(GPU_TARGETS "${DEFAULT_AMDGPU_TARGETS}" CACHE STRING "GPU architectures to compile for" FORCE)
endif()
diff --git a/rmake.py b/rmake.py
index 265577f1..321367ca 100644
--- a/rmake.py
+++ b/rmake.py
@@ -37,8 +37,8 @@ def parse_args():
help='Install after build (default: False)')
parser.add_argument( '--cmake-darg', required=False, dest='cmake_dargs', action='append', default=[],
help='List of additional cmake defines for builds (e.g. CMAKE_CXX_COMPILER_LAUNCHER=ccache)')
- parser.add_argument('-a', '--architecture', dest='gpu_architecture', required=False, default="gfx906;gfx1030;gfx1100;gfx1101;gfx1102", #:sramecc+:xnack-" ) #gfx1030" ) #gfx906" ) # gfx1030" )
- help='Set GPU architectures, e.g. all, gfx000, gfx803, gfx906:xnack-;gfx1030;gfx1100 (optional, default: all)')
+ parser.add_argument('-a', '--architecture', dest='gpu_architecture', required=False, default="gfx1100;gfx1101;gfx1102;gfx1103",
+ help='Set GPU architectures, e.g. all, gfx000, gfx803, gfx906:xnack-;gfx1030;gfx1100 (optional, default: gfx1100;gfx1101;gfx1102;gfx1103)')
parser.add_argument('-v', '--verbose', required=False, default=False, action='store_true',
help='Verbose build (default: False)')
return parser.parse_args()
diff --git a/rocprim/include/rocprim/device/config_types.hpp b/rocprim/include/rocprim/device/config_types.hpp
index 484db834..906e72c6 100644
--- a/rocprim/include/rocprim/device/config_types.hpp
+++ b/rocprim/include/rocprim/device/config_types.hpp
@@ -203,7 +203,8 @@ constexpr bool prefix_equals(const char* lhs, const char* rhs, std::size_t n)
constexpr target_arch get_target_arch_from_name(const char* const arch_name, const std::size_t n)
{
constexpr const char* target_names[]
- = {"gfx803", "gfx900", "gfx906", "gfx908", "gfx90a", "gfx1030", "gfx1102"};
+ = {"gfx803", "gfx900", "gfx906", "gfx908", "gfx90a", "gfx1030", "gfx1100",
+ "gfx1101", "gfx1102", "gfx1103"};
constexpr target_arch target_architectures[] = {
target_arch::gfx803,
target_arch::gfx900,
@@ -212,6 +213,9 @@ constexpr target_arch get_target_arch_from_name(const char* const arch_name, con
target_arch::gfx90a,
target_arch::gfx1030,
target_arch::gfx1102,
+ target_arch::gfx1102,
+ target_arch::gfx1102,
+ target_arch::gfx1102,
};
static_assert(sizeof(target_names) / sizeof(target_names[0])
== sizeof(target_architectures) / sizeof(target_architectures[0]),