Performance tuning for inter-node communication (#66)
This PR addresses two issues: - reduces the default number of contexts supported by the host interface to 1; we are not using them at the moment, and hence we now create fewer MPI_Win objects at startup - introduces a micro-sleep in the RO progress engine when there are no pending requests. This leads to significant performance improvements, observed for inter-node communication with Thor2 NICs.
This commit is contained in:
@@ -155,6 +155,12 @@ void rocshmem_env_config_init(void) {
|
||||
if (NULL != env_value) {
|
||||
rocshmem_env_config.ro_disable_ipc = atoi(env_value);
|
||||
}
|
||||
|
||||
env_value = getenv("ROCSHMEM_RO_PROGRESS_DELAY");
|
||||
if (nullptr != env_value) {
|
||||
rocshmem_env_config.ro_progress_delay = atoi(env_value);
|
||||
}
|
||||
|
||||
}
|
||||
|
||||
} // namespace rocshmem
|
||||
|
||||
Reference in New Issue
Block a user