/* * Copyright (c) 2017 Intel Corporation. All rights reserved. * This software is available to you under the BSD license below: * * Redistribution and use in source and binary forms, with or * without modification, are permitted provided that the following * conditions are met: * * - Redistributions of source code must retain the above * copyright notice, this list of conditions and the following * disclaimer. * * - Redistributions in binary form must reproduce the above * copyright notice, this list of conditions and the following * disclaimer in the documentation and/or other materials * provided with the distribution. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE * SOFTWARE. */ /* Multithreaded All-to-All Test * James Dinan * January, 2014 */ #include #include #include #include #include using namespace rocshmem; #define T 8 long *dest; long *flag; int me, npes; int errors = 0; pthread_barrier_t fencebar; pthread_mutex_t mutex = PTHREAD_MUTEX_INITIALIZER; static void *thread_main(void *arg) { int tid = *(int *)arg; int i, expected; long val; /* TEST CONCURRENT ATOMICS */ val = me; for (i = 1; i <= npes; i++) roc_shmem_int64_atomic_add(&dest[tid], val, (me + i) % npes); /* Ensure that fence does not overlap with communication calls */ pthread_barrier_wait(&fencebar); if (tid == 0) roc_shmem_fence(); pthread_barrier_wait(&fencebar); for (i = 1; i <= npes; i++) roc_shmem_int64_atomic_inc(&flag[tid], (me + i) % npes); roc_shmem_long_wait_until(&flag[tid], ROC_SHMEM_CMP_EQ, npes); expected = (npes - 1) * npes / 2; if (dest[tid] != expected || flag[tid] != npes) { printf( "Atomic test error: [PE = %d | TID = %d] -- " "dest = %ld (expected %d), flag = %ld (expected %d)\n", me, tid, dest[tid], expected, flag[tid], npes); pthread_mutex_lock(&mutex); ++errors; pthread_mutex_unlock(&mutex); } pthread_barrier_wait(&fencebar); if (0 == tid) roc_shmem_barrier_all(); pthread_barrier_wait(&fencebar); /* TEST CONCURRENT PUTS */ val = -1; roc_shmem_long_put(&dest[tid], &val, 1, (me + 1) % npes); /* Ensure that all puts are issued before the shmem barrier is called. */ pthread_barrier_wait(&fencebar); if (0 == tid) roc_shmem_barrier_all(); pthread_barrier_wait(&fencebar); /* TEST CONCURRENT GETS */ for (i = 1; i <= npes; i++) { roc_shmem_long_get(&val, &dest[tid], 1, (me + i) % npes); expected = -1; if (val != expected) { printf( "Put/get test error: [PE = %d | TID = %d] -- From PE %d, got %ld " "expected %d\n", me, tid, (me + i) % npes, val, expected); pthread_mutex_lock(&mutex); ++errors; pthread_mutex_unlock(&mutex); } } pthread_barrier_wait(&fencebar); if (0 == tid) roc_shmem_barrier_all(); return NULL; } int main(int argc, char **argv) { int tl, i, ret; pthread_t threads[T]; int t_arg[T]; roc_shmem_init_thread(ROC_SHMEM_THREAD_MULTIPLE, &tl); if (tl != ROC_SHMEM_THREAD_MULTIPLE) { printf("Init failed (requested thread level %d, got %d)\n", ROC_SHMEM_THREAD_MULTIPLE, tl); roc_shmem_global_exit(1); } me = roc_shmem_my_pe(); npes = roc_shmem_n_pes(); pthread_barrier_init(&fencebar, NULL, T); dest = (long *)roc_shmem_malloc(sizeof(long) * T); flag = (long *)roc_shmem_malloc(sizeof(long) * T); if (me == 0) printf("Starting multithreaded test on %d PEs, %d threads/PE\n", npes, T); for (i = 0; i < T; i++) { int err; dest[i] = 0; flag[i] = 0; t_arg[i] = i; err = pthread_create(&threads[i], NULL, thread_main, (void *)&t_arg[i]); assert(0 == err); } for (i = 0; i < T; i++) { int err; err = pthread_join(threads[i], NULL); assert(0 == err); } pthread_barrier_destroy(&fencebar); if (me == 0) { if (errors) printf("Encountered %d errors\n", errors); else printf("Success\n"); } roc_shmem_free(dest); roc_shmem_free(flag); roc_shmem_finalize(); return (errors == 0) ? 0 : 1; }