Perf: Add NO_COMPRESS option to disable slow offload-compress

Tento commit je obsažen v:
Donato Capitella
2026-02-01 11:14:25 +00:00
rodič 3bd4e81a8b
revize 54de8024d3
+2 -2
Zobrazit soubor
@@ -1217,12 +1217,12 @@ if (HAVE_PARALLEL_JOBS)
target_compile_options(rccl PRIVATE -parallel-jobs=12)
endif()
# Compress the GPU code embedded in rccl with --offload-compress.
# Compression is applied only when both conditions hold:
#   * ROCM_VERSION is at least 60200 (ROCm 6.2.0), and
#   * NO_COMPRESS is not set to a true value.
# Configure with -DNO_COMPRESS=ON to skip the (slow) compression step.
# NOTE(review): target_link_options() would be the more idiomatic home for the
# link-time flag -- confirm the project's minimum CMake version before switching.
if (ROCM_VERSION VERSION_GREATER_EQUAL "60200" AND NOT NO_COMPRESS)
  target_compile_options(rccl PRIVATE --offload-compress) # Compress GPU code at compile time.
  target_link_libraries(rccl PRIVATE --offload-compress) # Compress GPU code at link time.
  message(STATUS "--offload-compress enabled - ROCm version >= 6.2.0")
else()
  # Either the toolchain is too old or the user opted out; the message covers both.
  message(STATUS "--offload-compress disabled (ROCM < 6.2.0 or NO_COMPRESS=ON)")
endif()
# Treat use-of-uninitialized-variable diagnostics as hard errors when compiling rccl.
target_compile_options(rccl PRIVATE -Werror=uninitialized)