c87e69e522
* Submitting jobs to cdash
* Fail on submit
* submit url env
* submit url env
* try passing submit url as arg
* fix submit url
* Updated default URL
* Add submissions for remaining ubuntu focal workflow jobs
* Replace g++ with gcc in dashboard build name
* Add --ctest-args to run-ci.sh
* Add cdash support for bionic, jammy, and opensuse workflows
* Decrease CTEST_CUSTOM_MAXIMUM_PASSED_TEST_OUTPUT_SIZE
* OMNITRACE_BUILD_CODECOV option
* Support code coverage in CDash script
* CI dyninst built with debug info
* Update ci-containers
- cron schedule moved 4 hours later to UTC+5
* Update implementation of config::configure_signal_handler
- using lambdas failed to compile with codecov flags
* Add codecov job to ubuntu focal workflow
* Fix support for --ctest-args in run-ci script
* Fix ubuntu workflows
* Fix quotation handling in run-ci script
* git safe directory for codecov
* New MPI examples
* Remove --stop-on-failure
* dynamic_library update
- find_library_path checks procfs maps
- invoke find_library_path with no additional args to resolve to mapped file
* RCCLP uses dynamic_library
* check if file exists for memory_map_files metadata
* Testing updates
- include new mpi examples in tests
- fix test labels
- test critical-trace exe
* Update MPI C examples tests (needed arg)
* Remove try/catch block from critical-trace
* Fix sampling max wait when shutting down
* Fix test env for critical-trace
* Fix settings for critical-trace
- disable time output: data is deterministic
- disable PID suffixes: not multiprocess
* Update critical-trace ctest
* Update critical-trace exe
- throw error if input cannot be opened
- throw error if input has no data
* Update lulesh example with more kokkos tools usage
* Fix tasking issue with critical_trace and roctracer
- were not setting pools to active
- also sync before critical_trace::get_entries
* Increase verbosity of critical-trace tests
* Update code coverage tests
- skip code coverage + preload
- code-coverage python example and test
* Remove duplicated omnitrace.initialize function
* Skip python3.6 for ubuntu jammy
* Update MPI examples
- use MPI_Isend and MPI_Irecv
- explicitly use MPI_Bcast
* Update Formatting.cmake
- include C files in examples
* run-ci script does not check return of coverage
* mpi-allreduce link to libm
* Update ctest args in run-ci script
* Update dyninst submodule
- safety improvements in BinaryEdit::openResolvedLibraryName
* capture cmake error for ctest_coverage
[ROCm/rocprofiler-systems commit: 46b6db1a4c]
135 lines
3.9 KiB
C
135 lines
3.9 KiB
C
// Author: Wes Kendall
|
|
// Copyright 2011 www.mpitutorial.com
|
|
// This code is provided freely with the tutorials on mpitutorial.com. Feel
|
|
// free to modify it for your own use. Any distribution of the code must
|
|
// either provide a link to www.mpitutorial.com or keep this header intact.
|
|
//
|
|
// Comparison of MPI_Bcast with the my_bcast function
|
|
//
|
|
#include <assert.h>
#include <errno.h>
#include <limits.h>
#include <mpi.h>
#include <stdio.h>
#include <stdlib.h>
|
|
|
|
void
|
|
my_bcast(void* data, int count, MPI_Datatype datatype, int root, MPI_Comm communicator)
|
|
{
|
|
int world_rank;
|
|
MPI_Comm_rank(communicator, &world_rank);
|
|
int world_size;
|
|
MPI_Comm_size(communicator, &world_size);
|
|
|
|
if(world_rank == root)
|
|
{
|
|
// If we are the root process, send our data to everyone
|
|
int i;
|
|
for(i = 0; i < world_size; i++)
|
|
{
|
|
if(i != world_rank)
|
|
{
|
|
MPI_Send(data, count, datatype, i, 0, communicator);
|
|
}
|
|
}
|
|
}
|
|
else
|
|
{
|
|
// If we are a receiver process, receive the data from the root
|
|
MPI_Recv(data, count, datatype, root, 0, communicator, MPI_STATUS_IGNORE);
|
|
}
|
|
}
|
|
|
|
void
|
|
my_ibcast(void* data, int count, MPI_Datatype datatype, int root, MPI_Comm communicator)
|
|
{
|
|
int world_rank;
|
|
MPI_Comm_rank(communicator, &world_rank);
|
|
int world_size;
|
|
MPI_Comm_size(communicator, &world_size);
|
|
MPI_Request request = MPI_REQUEST_NULL;
|
|
|
|
if(world_rank == root)
|
|
{
|
|
// If we are the root process, send our data to everyone
|
|
int i;
|
|
for(i = 0; i < world_size; i++)
|
|
{
|
|
if(i != world_rank)
|
|
{
|
|
MPI_Isend(data, count, datatype, i, 0, communicator, &request);
|
|
}
|
|
}
|
|
}
|
|
else
|
|
{
|
|
// If we are a receiver process, receive the data from the root
|
|
MPI_Irecv(data, count, datatype, root, 0, communicator, &request);
|
|
}
|
|
|
|
MPI_Status status;
|
|
// bloks and waits for destination process to receive data
|
|
MPI_Wait(&request, &status);
|
|
}
|
|
|
|
int
|
|
main(int argc, char** argv)
|
|
{
|
|
int num_elements = 30;
|
|
int num_trials = 50;
|
|
|
|
if(argc != 3) fprintf(stderr, "Usage: compare_bcast [num_elements] [num_trials]\n");
|
|
|
|
if(argc > 1) num_elements = atoi(argv[1]);
|
|
if(argc > 2) num_trials = atoi(argv[2]);
|
|
|
|
MPI_Init(NULL, NULL);
|
|
|
|
int world_rank;
|
|
MPI_Comm_rank(MPI_COMM_WORLD, &world_rank);
|
|
|
|
double total_my_bcast_time = 0.0;
|
|
double total_my_ibcast_time = 0.0;
|
|
double total_mpi_bcast_time = 0.0;
|
|
int i;
|
|
int* data = (int*) malloc(sizeof(int) * num_elements);
|
|
assert(data != NULL);
|
|
|
|
for(i = 0; i < num_trials; i++)
|
|
{
|
|
// Time my_bcast
|
|
// Synchronize before starting timing
|
|
MPI_Barrier(MPI_COMM_WORLD);
|
|
total_my_bcast_time -= MPI_Wtime();
|
|
my_bcast(data, num_elements, MPI_INT, 0, MPI_COMM_WORLD);
|
|
// Synchronize again before obtaining final time
|
|
MPI_Barrier(MPI_COMM_WORLD);
|
|
total_my_bcast_time += MPI_Wtime();
|
|
|
|
MPI_Barrier(MPI_COMM_WORLD);
|
|
total_my_ibcast_time -= MPI_Wtime();
|
|
my_ibcast(data, num_elements, MPI_INT, 0, MPI_COMM_WORLD);
|
|
// Synchronize again before obtaining final time
|
|
MPI_Barrier(MPI_COMM_WORLD);
|
|
total_my_ibcast_time += MPI_Wtime();
|
|
|
|
// Time MPI_Bcast
|
|
MPI_Barrier(MPI_COMM_WORLD);
|
|
total_mpi_bcast_time -= MPI_Wtime();
|
|
MPI_Bcast(data, num_elements, MPI_INT, 0, MPI_COMM_WORLD);
|
|
MPI_Barrier(MPI_COMM_WORLD);
|
|
total_mpi_bcast_time += MPI_Wtime();
|
|
}
|
|
|
|
// Print off timing information
|
|
if(world_rank == 0)
|
|
{
|
|
printf("Data size = %d, Trials = %d\n", num_elements * (int) sizeof(int),
|
|
num_trials);
|
|
printf("Avg my_bcast time = %lf\n", total_my_bcast_time / num_trials);
|
|
printf("Avg my_ibcast time = %lf\n", total_my_ibcast_time / num_trials);
|
|
printf("Avg MPI_Bcast time = %lf\n", total_mpi_bcast_time / num_trials);
|
|
}
|
|
|
|
free(data);
|
|
MPI_Finalize();
|
|
}
|