From bddb9850de2d82e514ced4e83d0ff1a0bef354c2 Mon Sep 17 00:00:00 2001 From: Laurent Morichetti Date: Fri, 19 Aug 2022 10:31:16 -0700 Subject: [PATCH] Remove roctracer_mark This function has been deprecated since ROCm-2.9, use ROCTX's roctxMark(const char* message) as a replacement for roctracer_mark. Change-Id: Ie4aeae1db238453fc4451746cc9a338032ba817f --- src/roctracer/backward_compat.cpp | 9 +- src/roctracer/roctracer.cpp | 29 +-- src/tracer_tool/tracer_tool.cpp | 27 +-- .../MatrixTranspose_hip_flush_trace.txt | 200 ------------------ .../MatrixTranspose_hip_input_trace.txt | 200 ------------------ .../MatrixTranspose_hip_period_trace.txt | 200 ------------------ .../MatrixTranspose_sys_hsa_trace.txt | 200 ------------------ .../MatrixTranspose_sys_trace.txt | 200 ------------------ test/hip/MatrixTranspose.cpp | 5 - 9 files changed, 14 insertions(+), 1056 deletions(-) diff --git a/src/roctracer/backward_compat.cpp b/src/roctracer/backward_compat.cpp index 2fa761b9e4..3d8d22c905 100644 --- a/src/roctracer/backward_compat.cpp +++ b/src/roctracer/backward_compat.cpp @@ -20,9 +20,8 @@ #include "roctracer.h" -#define PUBLIC_API __attribute__((visibility("default"))) - // Deprecated functions: -extern "C" PUBLIC_API int roctracer_load() { return 1; } -extern "C" PUBLIC_API void roctracer_unload() {} -extern "C" PUBLIC_API void roctracer_flush_buf() {} +extern "C" ROCTRACER_API int roctracer_load() { return 1; } +extern "C" ROCTRACER_API void roctracer_unload() {} +extern "C" ROCTRACER_API void roctracer_flush_buf() {} +extern "C" ROCTRACER_API void roctracer_mark(const char*) {} diff --git a/src/roctracer/roctracer.cpp b/src/roctracer/roctracer.cpp index 30bf49283b..2526b8f62c 100644 --- a/src/roctracer/roctracer.cpp +++ b/src/roctracer/roctracer.cpp @@ -93,13 +93,6 @@ static inline uint32_t GetPid() { return syscall(__NR_getpid); } -/////////////////////////////////////////////////////////////////////////////////////////////////// -// Mark callback -// -typedef void(mark_api_callback_t)(uint32_t domain, uint32_t cid, const void* callback_data, - void* arg); -mark_api_callback_t* mark_api_callback_ptr = nullptr; - /////////////////////////////////////////////////////////////////////////////////////////////////// // Internal library methods // @@ -1134,15 +1127,6 @@ roctracer_activity_pop_external_correlation_id(activity_correlation_id_t* last_i API_METHOD_SUFFIX } -// Mark API (FIXME: why isn't it in the roctracer_ext.h header?) -extern "C" ROCTRACER_API void roctracer_mark(const char* str) { - if (mark_api_callback_ptr) { - mark_api_callback_ptr(ACTIVITY_DOMAIN_EXT_API, ACTIVITY_EXT_OP_MARK, str, nullptr); - NextCorrelationId(); // account for user-defined markers when tracking - // correlation id - } -} - // Start API ROCTRACER_API void roctracer_start() { if (set_stopped(0)) { @@ -1187,18 +1171,11 @@ ROCTRACER_API roctracer_status_t roctracer_set_properties(roctracer_domain_t dom void* properties) { API_METHOD_PREFIX switch (domain) { - case ACTIVITY_DOMAIN_HSA_OPS: { - break; - } - case ACTIVITY_DOMAIN_HSA_EVT: { - break; - } - case ACTIVITY_DOMAIN_HSA_API: { - break; - } + case ACTIVITY_DOMAIN_HSA_OPS: + case ACTIVITY_DOMAIN_HSA_EVT: + case ACTIVITY_DOMAIN_HSA_API: case ACTIVITY_DOMAIN_HIP_OPS: case ACTIVITY_DOMAIN_HIP_API: { - mark_api_callback_ptr = reinterpret_cast(properties); break; } case ACTIVITY_DOMAIN_EXT_API: { diff --git a/src/tracer_tool/tracer_tool.cpp b/src/tracer_tool/tracer_tool.cpp index 79fbde8d96..a1dc81a2ef 100644 --- a/src/tracer_tool/tracer_tool.cpp +++ b/src/tracer_tool/tracer_tool.cpp @@ -295,11 +295,11 @@ struct hip_api_trace_entry_t { hip_api_data_t data; }; - hip_api_trace_entry_t(activity_domain_t domain, uint32_t cid, roctracer_timestamp_t begin, - roctracer_timestamp_t end, uint32_t pid, uint32_t tid, - const hip_api_data_t& hip_api_data, const char* name) + hip_api_trace_entry_t(uint32_t cid, roctracer_timestamp_t begin, roctracer_timestamp_t end, + uint32_t pid, uint32_t tid, const hip_api_data_t& hip_api_data, + const char* name) : valid(roctracer::TRACE_ENTRY_INIT) { - record.domain = domain; + record.domain = ACTIVITY_DOMAIN_HIP_API; record.op = cid; record.kind = 0; record.begin_ns = begin; @@ -417,24 +417,13 @@ void hip_api_callback(uint32_t domain, uint32_t cid, const void* callback_data, // Post init of HIP APU args hipApiArgsInit((hip_api_id_t)cid, const_cast(data)); kernel_name = getKernelName(cid, data); - hip_api_trace_entry_t& entry = hip_api_trace_buffer.Emplace( - static_cast(domain), cid, hip_begin_timestamp, timestamp, GetPid(), - GetTid(), *data, kernel_name ? kernel_name->c_str() : nullptr); + hip_api_trace_entry_t& entry = + hip_api_trace_buffer.Emplace(cid, hip_begin_timestamp, timestamp, GetPid(), GetTid(), *data, + kernel_name ? kernel_name->c_str() : nullptr); entry.valid.store(roctracer::TRACE_ENTRY_COMPLETE, std::memory_order_release); } } -void mark_api_callback(uint32_t domain, uint32_t cid, const void* callback_data, void* arg) { - (void)arg; - const char* name = reinterpret_cast(callback_data); - - const roctracer_timestamp_t timestamp = timestamp_ns(); - hip_api_trace_entry_t& entry = - hip_api_trace_buffer.Emplace(static_cast(domain), cid, timestamp, - timestamp + 1, GetPid(), GetTid(), hip_api_data_t{}, name); - entry.valid.store(roctracer::TRACE_ENTRY_COMPLETE, std::memory_order_release); -} - /////////////////////////////////////////////////////////////////////////////////////////////////////// // Input parser std::string normalize_token(const std::string& token, bool not_empty, const std::string& label) { @@ -757,8 +746,6 @@ ROCTRACER_EXPORT bool OnLoad(HsaApiTable* table, uint64_t runtime_version, if (trace_hip_api || trace_hip_activity) { fprintf(stdout, " HIP-trace()\n"); fflush(stdout); - // roctracer properties - roctracer_set_properties(ACTIVITY_DOMAIN_HIP_API, (void*)mark_api_callback); // Allocating tracing pool open_tracing_pool(); diff --git a/test/golden_traces/MatrixTranspose_hip_flush_trace.txt b/test/golden_traces/MatrixTranspose_hip_flush_trace.txt index 6f0c4d17aa..051d58b27b 100644 --- a/test/golden_traces/MatrixTranspose_hip_flush_trace.txt +++ b/test/golden_traces/MatrixTranspose_hip_flush_trace.txt @@ -26,32 +26,24 @@ PASSED! 129855989696159:129855990920319 0:0 KernelExecution:29:14696 129855989668256:129855991384209 0:0 CopyDeviceToHost:31:14696 129855605540988:129855957443403 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :4 -129855957456260:129855957456261 14696:14696 MARK(name(before HIP LaunchKernel)) 129855957507034:129855957514510 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :6 129855957521000:129855957523014 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :7 129855957529950:129855958671150 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :8 -129855958701410:129855958701411 14696:14696 MARK(name(after HIP LaunchKernel)) 129855958708321:129855961719221 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :10 129855971408776:129855972257972 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :11 -129855972261515:129855972261516 14696:14696 MARK(name(before HIP LaunchKernel)) 129855972266736:129855972268234 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :13 129855972271629:129855972272780 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :14 129855972276181:129855972282118 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :15 -129855972663504:129855972663505 14696:14696 MARK(name(after HIP LaunchKernel)) 129855972666015:129855974143463 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :17 129855980222888:129855981023250 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :18 -129855981025473:129855981025474 14696:14696 MARK(name(before HIP LaunchKernel)) 129855981028834:129855981029831 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :20 129855981032043:129855981032913 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :21 129855981035237:129855981038997 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :22 -129855981041265:129855981041266 14696:14696 MARK(name(after HIP LaunchKernel)) 129855981043695:129855982796928 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :24 129855988764565:129855989615901 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :25 -129855989618073:129855989618074 14696:14696 MARK(name(before HIP LaunchKernel)) 129855989621096:129855989622129 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :27 129855989624243:129855989625087 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :28 129855989627271:129855989630934 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :29 -129855989632959:129855989632960 14696:14696 MARK(name(after HIP LaunchKernel)) 129855989635351:129855991396402 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :31 PASSED! ## Iteration (95) ################# @@ -114,88 +106,64 @@ PASSED! 129856094767987:129856095991348 0:0 KernelExecution:113:14696 129856094739044:129856096520182 0:0 CopyDeviceToHost:115:14696 129855997303698:129855998134058 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :32 -129855998136242:129855998136243 14696:14696 MARK(name(before HIP LaunchKernel)) 129855998138933:129855998139817 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :34 129855998141918:129855998142773 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :35 129855998144935:129855998149221 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :36 -129855998151431:129855998151432 14696:14696 MARK(name(after HIP LaunchKernel)) 129855998153828:129855999937506 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :38 129856005829520:129856006665192 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :39 -129856006667396:129856006667397 14696:14696 MARK(name(before HIP LaunchKernel)) 129856006670307:129856006671160 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :41 129856006673376:129856006674209 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :42 129856006676323:129856006679651 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :43 -129856006681635:129856006681636 14696:14696 MARK(name(after HIP LaunchKernel)) 129856006683967:129856008469471 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :45 129856014360174:129856015191285 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :46 -129856015193489:129856015193490 14696:14696 MARK(name(before HIP LaunchKernel)) 129856015196342:129856015197217 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :48 129856015199400:129856015200221 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :49 129856015202314:129856015205930 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :50 -129856015208058:129856015208059 14696:14696 MARK(name(after HIP LaunchKernel)) 129856015210764:129856017001555 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :52 129856022908053:129856023733985 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :53 -129856023736320:129856023736321 14696:14696 MARK(name(before HIP LaunchKernel)) 129856023739178:129856023740063 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :55 129856023742240:129856023743090 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :56 129856023745309:129856023748845 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :57 -129856023750891:129856023750892 14696:14696 MARK(name(after HIP LaunchKernel)) 129856023753396:129856025556257 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :59 129856031530409:129856032503170 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :60 -129856032505392:129856032505393 14696:14696 MARK(name(before HIP LaunchKernel)) 129856032508345:129856032509226 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :62 129856032511486:129856032512316 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :63 129856032514599:129856032518036 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :64 -129856032520150:129856032520151 14696:14696 MARK(name(after HIP LaunchKernel)) 129856032522410:129856034373111 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :66 129856040397979:129856041130687 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :67 -129856041132973:129856041132974 14696:14696 MARK(name(before HIP LaunchKernel)) 129856041136399:129856041137389 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :69 129856041139653:129856041140500 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :70 129856041142893:129856041146663 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :71 -129856041148645:129856041148646 14696:14696 MARK(name(after HIP LaunchKernel)) 129856041151128:129856042953843 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :73 129856048994841:129856049829566 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :74 -129856049831724:129856049831725 14696:14696 MARK(name(before HIP LaunchKernel)) 129856049834527:129856049835413 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :76 129856049837759:129856049838585 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :77 129856049840796:129856049844487 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :78 -129856049846529:129856049846530 14696:14696 MARK(name(after HIP LaunchKernel)) 129856049848934:129856051663797 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :80 129856057798518:129856058633464 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :81 -129856058635650:129856058635651 14696:14696 MARK(name(before HIP LaunchKernel)) 129856058638530:129856058639560 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :83 129856058641994:129856058642826 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :84 129856058645125:129856058648721 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :85 -129856058650749:129856058650750 14696:14696 MARK(name(after HIP LaunchKernel)) 129856058653478:129856060466863 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :87 129856066704603:129856067541502 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :88 -129856067543802:129856067543803 14696:14696 MARK(name(before HIP LaunchKernel)) 129856067546791:129856067547681 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :90 129856067550027:129856067550854 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :91 129856067553125:129856067556952 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :92 -129856067559149:129856067559150 14696:14696 MARK(name(after HIP LaunchKernel)) 129856067561903:129856069442958 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :94 129856075719215:129856076572398 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :95 -129856076574828:129856076574829 14696:14696 MARK(name(before HIP LaunchKernel)) 129856076578071:129856076578997 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :97 129856076581286:129856076582119 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :98 129856076584498:129856076588395 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :99 -129856076590554:129856076590555 14696:14696 MARK(name(after HIP LaunchKernel)) 129856076592857:129856078406672 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :101 129856084768530:129856085607081 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :102 -129856085609437:129856085609438 14696:14696 MARK(name(before HIP LaunchKernel)) 129856085612528:129856085613498 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :104 129856085615751:129856085616602 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :105 129856085618831:129856085623039 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :106 -129856085625178:129856085625179 14696:14696 MARK(name(after HIP LaunchKernel)) 129856085627731:129856087451206 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :108 129856093846767:129856094686797 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :109 -129856094689153:129856094689154 14696:14696 MARK(name(before HIP LaunchKernel)) 129856094692497:129856094693485 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :111 129856094695727:129856094696598 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :112 129856094698884:129856094702856 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :113 -129856094705178:129856094705179 14696:14696 MARK(name(after HIP LaunchKernel)) 129856094707931:129856096534639 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :115 PASSED! ## Iteration (83) ################# @@ -253,83 +221,61 @@ PASSED! 129856192345329:129856193569809 0:0 KernelExecution:190:14696 129856192317767:129856194105080 0:0 CopyDeviceToHost:192:14696 129856103003811:129856103844379 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :116 -129856103846787:129856103846788 14696:14696 MARK(name(before HIP LaunchKernel)) 129856103849922:129856103850838 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :118 129856103853240:129856103854136 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :119 129856103856444:129856103860149 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :120 -129856103862386:129856103862387 14696:14696 MARK(name(after HIP LaunchKernel)) 129856103864691:129856105741098 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :122 129856112200226:129856113019342 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :123 -129856113021598:129856113021599 14696:14696 MARK(name(before HIP LaunchKernel)) 129856113024595:129856113025504 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :125 129856113027902:129856113028756 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :126 129856113031010:129856113034968 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :127 -129856113037098:129856113037099 14696:14696 MARK(name(after HIP LaunchKernel)) 129856113039452:129856114918382 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :129 129856121536590:129856122377686 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :130 -129856122380177:129856122380178 14696:14696 MARK(name(before HIP LaunchKernel)) 129856122383242:129856122384157 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :132 129856122386562:129856122387438 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :133 129856122389743:129856122393887 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :134 -129856122395917:129856122395918 14696:14696 MARK(name(after HIP LaunchKernel)) 129856122398705:129856124236553 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :136 129856130930250:129856131721919 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :137 -129856131724534:129856131724535 14696:14696 MARK(name(before HIP LaunchKernel)) 129856131727544:129856131728453 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :139 129856131730840:129856131731718 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :140 129856131734248:129856131738338 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :141 -129856131740508:129856131740509 14696:14696 MARK(name(after HIP LaunchKernel)) 129856131742956:129856133633762 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :143 129856140484642:129856141289559 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :144 -129856141292040:129856141292041 14696:14696 MARK(name(before HIP LaunchKernel)) 129856141295360:129856141296366 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :146 129856141298705:129856141299584 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :147 129856141301885:129856141305904 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :148 -129856141308287:129856141308288 14696:14696 MARK(name(after HIP LaunchKernel)) 129856141310745:129856143207185 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :150 129856150167842:129856151019519 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :151 -129856151021903:129856151021904 14696:14696 MARK(name(before HIP LaunchKernel)) 129856151025430:129856151026339 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :153 129856151028846:129856151029731 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :154 129856151032070:129856151036399 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :155 -129856151038525:129856151038526 14696:14696 MARK(name(after HIP LaunchKernel)) 129856151041204:129856152887054 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :157 129856159416500:129856160257922 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :158 -129856160260251:129856160260252 14696:14696 MARK(name(before HIP LaunchKernel)) 129856160263327:129856160264253 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :160 129856160266588:129856160267551 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :161 129856160269815:129856160273583 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :162 -129856160275639:129856160275640 14696:14696 MARK(name(after HIP LaunchKernel)) 129856160277873:129856162154856 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :164 129856167989129:129856168794954 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :165 -129856168796817:129856168796818 14696:14696 MARK(name(before HIP LaunchKernel)) 129856168799680:129856168800356 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :167 129856168802336:129856168803043 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :168 129856168804923:129856168808196 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :169 -129856168810026:129856168810027 14696:14696 MARK(name(after HIP LaunchKernel)) 129856168811889:129856170642148 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :171 129856175935119:129856176727698 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :172 -129856176729573:129856176729574 14696:14696 MARK(name(before HIP LaunchKernel)) 129856176732312:129856176733001 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :174 129856176734764:129856176735517 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :175 129856176737306:129856176740961 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :176 -129856176742551:129856176742552 14696:14696 MARK(name(after HIP LaunchKernel)) 129856176744384:129856178576608 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :178 129856183733862:129856184521359 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :179 PASSED! ## Iteration (72) ################# -129856184523202:129856184523203 14696:14696 MARK(name(before HIP LaunchKernel)) 129856184526239:129856184526918 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :181 129856184528695:129856184529339 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :182 129856184531203:129856184534819 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :183 -129856184536444:129856184536445 14696:14696 MARK(name(after HIP LaunchKernel)) 129856184538159:129856186381152 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :185 129856191471466:129856192258965 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :186 -129856192260887:129856192260888 14696:14696 MARK(name(before HIP LaunchKernel)) 129856192264565:129856192265231 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :188 129856192266936:129856192267582 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :189 129856192269493:129856192272647 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :190 -129856192274238:129856192274239 14696:14696 MARK(name(after HIP LaunchKernel)) 129856192276014:129856194117333 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :192 PASSED! ## Iteration (71) ################# @@ -400,102 +346,74 @@ PASSED! 129856297157310:129856298378111 0:0 KernelExecution:288:14696 129856297129589:129856298914568 0:0 CopyDeviceToHost:290:14696 129856199220209:129856199993256 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :193 -129856199995165:129856199995166 14696:14696 MARK(name(before HIP LaunchKernel)) 129856199998331:129856199999016 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :195 129856200000971:129856200001630 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :196 129856200003348:129856200006409 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :197 -129856200007997:129856200007998 14696:14696 MARK(name(after HIP LaunchKernel)) 129856200009781:129856201864796 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :199 129856206828954:129856207617612 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :200 -129856207619342:129856207619343 14696:14696 MARK(name(before HIP LaunchKernel)) 129856207633427:129856207634203 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :202 129856207635929:129856207636565 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :203 129856207638289:129856207641619 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :204 -129856207643379:129856207643380 14696:14696 MARK(name(after HIP LaunchKernel)) 129856207645338:129856209486625 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :206 129856214367871:129856215199634 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :207 -129856215201421:129856215201422 14696:14696 MARK(name(before HIP LaunchKernel)) 129856215205034:129856215205701 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :209 129856215207421:129856215208068 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :210 129856215209926:129856215213001 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :211 -129856215214576:129856215214577 14696:14696 MARK(name(after HIP LaunchKernel)) 129856215216591:129856217062762 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :213 129856221865656:129856222702390 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :214 -129856222704143:129856222704144 14696:14696 MARK(name(before HIP LaunchKernel)) 129856222707593:129856222708263 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :216 129856222709907:129856222710533 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :217 129856222712408:129856222715305 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :218 -129856222716820:129856222716821 14696:14696 MARK(name(after HIP LaunchKernel)) 129856222718703:129856224572291 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :220 129856229369321:129856230206171 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :221 -129856230207933:129856230207934 14696:14696 MARK(name(before HIP LaunchKernel)) 129856230211408:129856230212070 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :223 129856230213729:129856230214356 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :224 129856230216306:129856230219552 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :225 -129856230221084:129856230221085 14696:14696 MARK(name(after HIP LaunchKernel)) 129856230222856:129856232061167 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :227 129856236820359:129856237552651 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :228 -129856237554349:129856237554350 14696:14696 MARK(name(before HIP LaunchKernel)) 129856237557958:129856237558615 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :230 129856237560382:129856237561016 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :231 129856237562876:129856237566063 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :232 -129856237567608:129856237567609 14696:14696 MARK(name(after HIP LaunchKernel)) 129856237569296:129856239419101 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :234 129856244174381:129856245010977 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :235 -129856245012718:129856245012719 14696:14696 MARK(name(before HIP LaunchKernel)) 129856245025693:129856245026451 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :237 129856245028210:129856245028855 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :238 129856245030730:129856245034177 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :239 -129856245035805:129856245035806 14696:14696 MARK(name(after HIP LaunchKernel)) 129856245038122:129856246876538 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :241 129856251653109:129856252435896 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :242 -129856252437833:129856252437834 14696:14696 MARK(name(before HIP LaunchKernel)) 129856252441362:129856252442017 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :244 129856252443660:129856252444296 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :245 129856252446165:129856252449155 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :246 -129856252450809:129856252450810 14696:14696 MARK(name(after HIP LaunchKernel)) 129856252452579:129856254303055 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :248 129856259101952:129856259882749 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :249 -129856259884515:129856259884516 14696:14696 MARK(name(before HIP LaunchKernel)) 129856259886742:129856259887392 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :251 129856259889040:129856259889671 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :252 129856259891415:129856259894919 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :253 -129856259896631:129856259896632 14696:14696 MARK(name(after HIP LaunchKernel)) 129856259898324:129856261743974 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :255 129856266541050:129856267374498 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :256 -129856267376266:129856267376267 14696:14696 MARK(name(before HIP LaunchKernel)) 129856267379647:129856267380320 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :258 129856267381929:129856267382540 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :259 129856267384409:129856267387474 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :260 -129856267389033:129856267389034 14696:14696 MARK(name(after HIP LaunchKernel)) 129856267390764:129856269239563 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :262 129856274008890:129856274843415 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :263 -129856274845095:129856274845096 14696:14696 MARK(name(before HIP LaunchKernel)) 129856274847806:129856274848470 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :265 129856274850117:129856274850733 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :266 129856274852427:129856274855749 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :267 -129856274857358:129856274857359 14696:14696 MARK(name(after HIP LaunchKernel)) 129856274859228:129856276707873 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :269 129856281498759:129856282330118 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :270 -129856282332044:129856282332045 14696:14696 MARK(name(before HIP LaunchKernel)) 129856282335358:129856282336015 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :272 129856282338029:129856282338668 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :273 129856282340644:129856282343485 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :274 -129856282345028:129856282345029 14696:14696 MARK(name(after HIP LaunchKernel)) 129856282347024:129856284203838 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :276 129856288978096:129856289708673 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :277 -129856289710414:129856289710415 14696:14696 MARK(name(before HIP LaunchKernel)) 129856289714250:129856289714924 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :279 129856289716689:129856289717305 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :280 129856289719150:129856289722057 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :281 -129856289723677:129856289723678 14696:14696 MARK(name(after HIP LaunchKernel)) 129856289725380:129856291571314 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :283 129856296341271:129856297072486 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :284 -129856297074313:129856297074314 14696:14696 MARK(name(before HIP LaunchKernel)) 129856297077733:129856297078380 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :286 129856297080109:129856297080733 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :287 129856297082729:129856297085646 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :288 -129856297087184:129856297087185 14696:14696 MARK(name(after HIP LaunchKernel)) 129856297089004:129856298926004 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :290 PASSED! ## Iteration (58) ################# @@ -565,95 +483,69 @@ PASSED! 129856394339138:129856395561058 0:0 KernelExecution:379:14696 129856394311639:129856396103600 0:0 CopyDeviceToHost:381:14696 129856303774990:129856304626161 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :291 -129856304627884:129856304627885 14696:14696 MARK(name(before HIP LaunchKernel)) 129856304631072:129856304631723 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :293 129856304633373:129856304634007 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :294 129856304635811:129856304639104 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :295 -129856304640848:129856304640849 14696:14696 MARK(name(after HIP LaunchKernel)) 129856304642651:129856306501959 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :297 129856311264292:129856312048766 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :298 -129856312050539:129856312050540 14696:14696 MARK(name(before HIP LaunchKernel)) 129856312053498:129856312054174 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :300 129856312055946:129856312056653 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :301 129856312058397:129856312061589 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :302 -129856312063201:129856312063202 14696:14696 MARK(name(after HIP LaunchKernel)) 129856312065053:129856313904746 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :304 129856318704110:129856319483869 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :305 -129856319485543:129856319485544 14696:14696 MARK(name(before HIP LaunchKernel)) 129856319499258:129856319500048 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :307 129856319501759:129856319502401 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :308 129856319504307:129856319507787 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :309 -129856319509535:129856319509536 14696:14696 MARK(name(after HIP LaunchKernel)) 129856319511552:129856321356021 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :311 129856326144210:129856326980680 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :312 -129856326982483:129856326982484 14696:14696 MARK(name(before HIP LaunchKernel)) 129856326986163:129856326986815 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :314 129856326988581:129856326989210 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :315 129856326991095:129856326994082 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :316 -129856326995650:129856326995651 14696:14696 MARK(name(after HIP LaunchKernel)) 129856326997461:129856328838450 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :318 129856333608209:129856334440902 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :319 -129856334442697:129856334442698 14696:14696 MARK(name(before HIP LaunchKernel)) 129856334446427:129856334447095 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :321 129856334448793:129856334449426 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :322 129856334451308:129856334454120 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :323 -129856334455718:129856334455719 14696:14696 MARK(name(after HIP LaunchKernel)) 129856334457508:129856336307654 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :325 129856341084552:129856341987761 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :326 -129856341989501:129856341989502 14696:14696 MARK(name(before HIP LaunchKernel)) 129856341992961:129856341993616 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :328 129856341995311:129856341995915 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :329 129856341997784:129856342000844 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :330 -129856342002457:129856342002458 14696:14696 MARK(name(after HIP LaunchKernel)) 129856342004209:129856343852827 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :332 129856348628207:129856349358297 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :333 -129856349360014:129856349360015 14696:14696 MARK(name(before HIP LaunchKernel)) 129856349363641:129856349364301 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :335 129856349365955:129856349366590 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :336 129856349368410:129856349371392 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :337 -129856349373001:129856349373002 14696:14696 MARK(name(after HIP LaunchKernel)) 129856349374736:129856351215163 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :339 129856356026231:129856356823939 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :340 -129856356825939:129856356825940 14696:14696 MARK(name(before HIP LaunchKernel)) 129856356829316:129856356829967 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :342 129856356831607:129856356832235 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :343 129856356834103:129856356837300 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :344 -129856356838880:129856356838881 14696:14696 MARK(name(after HIP LaunchKernel)) 129856356840997:129856358683474 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :346 129856363457621:129856364292098 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :347 -129856364293909:129856364293910 14696:14696 MARK(name(before HIP LaunchKernel)) 129856364296242:129856364296921 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :349 129856364298665:129856364299325 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :350 129856364301137:129856364304805 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :351 -129856364306614:129856364306615 14696:14696 MARK(name(after HIP LaunchKernel)) 129856364308432:129856366185192 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :353 129856371019019:129856371802348 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :354 -129856371804072:129856371804073 14696:14696 MARK(name(before HIP LaunchKernel)) 129856371807407:129856371808089 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :356 129856371809769:129856371810408 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :357 129856371812409:129856371815399 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :358 -129856371816938:129856371816939 14696:14696 MARK(name(after HIP LaunchKernel)) 129856371818730:129856373668223 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :360 129856378427685:129856379260530 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :361 -129856379262413:129856379262414 14696:14696 MARK(name(before HIP LaunchKernel)) 129856379266028:129856379266680 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :363 129856379268334:129856379268974 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :364 129856379270951:129856379274011 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :365 -129856379275576:129856379275577 14696:14696 MARK(name(after HIP LaunchKernel)) 129856379277516:129856381125442 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :367 129856385912709:129856386747747 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :368 -129856386749617:129856386749618 14696:14696 MARK(name(before HIP LaunchKernel)) 129856386753015:129856386753700 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :370 129856386755603:129856386756230 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :371 129856386758107:129856386761145 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :372 -129856386762828:129856386762829 14696:14696 MARK(name(after HIP LaunchKernel)) 129856386764527:129856388613300 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :374 129856393418103:129856394255127 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :375 -129856394257084:129856394257085 14696:14696 MARK(name(before HIP LaunchKernel)) 129856394260727:129856394261393 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :377 129856394263117:129856394263752 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :378 129856394266100:129856394269007 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :379 -129856394270594:129856394270595 14696:14696 MARK(name(after HIP LaunchKernel)) 129856394272528:129856396115719 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :381 PASSED! ## Iteration (44) ################# @@ -724,102 +616,74 @@ PASSED! 129856498583201:129856499806882 0:0 KernelExecution:477:14696 129856498555486:129856500349740 0:0 CopyDeviceToHost:479:14696 129856400931528:129856401693841 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :382 -129856401695697:129856401695698 14696:14696 MARK(name(before HIP LaunchKernel)) 129856401698086:129856401698763 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :384 129856401700644:129856401701356 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :385 129856401703387:129856401706670 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :386 -129856401708283:129856401708284 14696:14696 MARK(name(after HIP LaunchKernel)) 129856401710202:129856403550731 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :388 129856408346178:129856409079144 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :389 -129856409080946:129856409080947 14696:14696 MARK(name(before HIP LaunchKernel)) 129856409119575:129856409120361 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :391 129856409122350:129856409122982 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :392 129856409124716:129856409127974 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :393 -129856409129722:129856409129723 14696:14696 MARK(name(after HIP LaunchKernel)) 129856409131595:129856410958682 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :395 129856415764088:129856416549283 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :396 -129856416551147:129856416551148 14696:14696 MARK(name(before HIP LaunchKernel)) 129856416554753:129856416555457 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :398 129856416557440:129856416558065 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :399 129856416560077:129856416563543 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :400 -129856416565220:129856416565221 14696:14696 MARK(name(after HIP LaunchKernel)) 129856416567086:129856418410890 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :402 129856423185992:129856423965984 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :403 -129856423967686:129856423967687 14696:14696 MARK(name(before HIP LaunchKernel)) 129856423971156:129856423971813 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :405 129856423973453:129856423974058 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :406 129856423975959:129856423979023 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :407 -129856423980620:129856423980621 14696:14696 MARK(name(after HIP LaunchKernel)) 129856423982481:129856425851437 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :409 129856430649566:129856431446819 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :410 -129856431448647:129856431448648 14696:14696 MARK(name(before HIP LaunchKernel)) 129856431451980:129856431452627 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :412 129856431454467:129856431455103 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :413 129856431457061:129856431460021 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :414 -129856431461633:129856431461634 14696:14696 MARK(name(after HIP LaunchKernel)) 129856431463427:129856433305223 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :416 129856438060199:129856438896337 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :417 -129856438898056:129856438898057 14696:14696 MARK(name(before HIP LaunchKernel)) 129856438901614:129856438902293 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :419 129856438903944:129856438904582 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :420 129856438906471:129856438909460 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :421 -129856438910995:129856438910996 14696:14696 MARK(name(after HIP LaunchKernel)) 129856438913099:129856440770029 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :423 129856445589904:129856446428787 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :424 -129856446430525:129856446430526 14696:14696 MARK(name(before HIP LaunchKernel)) 129856446434097:129856446434755 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :426 129856446436446:129856446437074 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :427 129856446438958:129856446442103 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :428 -129856446443705:129856446443706 14696:14696 MARK(name(after HIP LaunchKernel)) 129856446445611:129856448319675 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :430 129856453113306:129856453898651 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :431 -129856453900443:129856453900444 14696:14696 MARK(name(before HIP LaunchKernel)) 129856453903924:129856453904588 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :433 129856453906239:129856453906854 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :434 129856453908740:129856453911874 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :435 -129856453913486:129856453913487 14696:14696 MARK(name(after HIP LaunchKernel)) 129856453915356:129856455761272 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :437 129856460531599:129856461270590 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :438 -129856461272368:129856461272369 14696:14696 MARK(name(before HIP LaunchKernel)) 129856461275845:129856461276515 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :440 129856461278198:129856461278850 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :441 129856461280791:129856461283899 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :442 -129856461285595:129856461285596 14696:14696 MARK(name(after HIP LaunchKernel)) 129856461287388:129856463133280 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :444 129856467884995:129856468668564 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :445 -129856468670291:129856468670292 14696:14696 MARK(name(before HIP LaunchKernel)) 129856468673055:129856468673710 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :447 129856468675408:129856468676048 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :448 129856468677942:129856468681455 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :449 -129856468683148:129856468683149 14696:14696 MARK(name(after HIP LaunchKernel)) 129856468685101:129856470532724 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :451 129856475326269:129856476110399 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :452 -129856476112220:129856476112221 14696:14696 MARK(name(before HIP LaunchKernel)) 129856476115691:129856476116355 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :454 129856476118083:129856476118692 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :455 129856476120553:129856476123478 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :456 -129856476125144:129856476125145 14696:14696 MARK(name(after HIP LaunchKernel)) 129856476126929:129856477993159 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :458 129856482771986:129856483553655 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :459 -129856483555435:129856483555436 14696:14696 MARK(name(before HIP LaunchKernel)) 129856483559048:129856483559715 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :461 129856483561368:129856483561995 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :462 129856483563875:129856483567045 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :463 -129856483569037:129856483569038 14696:14696 MARK(name(after HIP LaunchKernel)) 129856483570875:129856485418803 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :465 129856490199703:129856491039451 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :466 -129856491041225:129856491041226 14696:14696 MARK(name(before HIP LaunchKernel)) 129856491044551:129856491045204 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :468 129856491046844:129856491047481 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :469 129856491049291:129856491052245 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :470 -129856491053805:129856491053806 14696:14696 MARK(name(after HIP LaunchKernel)) 129856491055528:129856492907612 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :472 129856497665310:129856498500405 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :473 -129856498502066:129856498502067 14696:14696 MARK(name(before HIP LaunchKernel)) 129856498505506:129856498506141 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :475 129856498507858:129856498508491 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :476 129856498510523:129856498513554 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :477 -129856498515137:129856498515138 14696:14696 MARK(name(after HIP LaunchKernel)) 129856498517011:129856500365762 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :479 PASSED! ## Iteration (31) ################# @@ -890,102 +754,74 @@ PASSED! 129856595328424:129856597128257 0:0 CopyDeviceToHost:570:14696 129856601984341:129856602751266 0:0 CopyHostToDevice:571:14696 129856505180003:129856505975222 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :480 -129856505976980:129856505976981 14696:14696 MARK(name(before HIP LaunchKernel)) 129856505980587:129856505981234 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :482 129856505982935:129856505983566 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :483 129856505985434:129856505988514 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :484 -129856505990096:129856505990097 14696:14696 MARK(name(after HIP LaunchKernel)) 129856505991997:129856507832334 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :486 129856512649603:129856513382084 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :487 -129856513384599:129856513384600 14696:14696 MARK(name(before HIP LaunchKernel)) 129856513388119:129856513389080 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :489 129856513391435:129856513392275 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :490 129856513394697:129856513399367 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :491 -129856513401523:129856513401524 14696:14696 MARK(name(after HIP LaunchKernel)) 129856513404257:129856515239416 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :493 129856519992571:129856520793180 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :494 -129856520794974:129856520794975 14696:14696 MARK(name(before HIP LaunchKernel)) 129856520798420:129856520799070 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :496 129856520800911:129856520801530 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :497 129856520803611:129856520806841 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :498 -129856520808737:129856520808738 14696:14696 MARK(name(after HIP LaunchKernel)) 129856520810545:129856522657358 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :500 129856527425346:129856528218117 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :501 -129856528219874:129856528219875 14696:14696 MARK(name(before HIP LaunchKernel)) 129856528221975:129856528222627 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :503 129856528224439:129856528225291 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :504 129856528227108:129856528230172 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :505 -129856528231752:129856528231753 14696:14696 MARK(name(after HIP LaunchKernel)) 129856528233473:129856530074548 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :507 129856534899214:129856535681957 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :508 -129856535683676:129856535683677 14696:14696 MARK(name(before HIP LaunchKernel)) 129856535686401:129856535687061 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :510 129856535688790:129856535689423 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :511 129856535691153:129856535694294 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :512 -129856535695868:129856535695869 14696:14696 MARK(name(after HIP LaunchKernel)) 129856535697671:129856537541753 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :514 129856542387175:129856543225418 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :515 -129856543227192:129856543227193 14696:14696 MARK(name(before HIP LaunchKernel)) 129856543230911:129856543231570 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :517 129856543233243:129856543233871 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :518 129856543235930:129856543238762 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :519 -129856543240359:129856543240360 14696:14696 MARK(name(after HIP LaunchKernel)) 129856543242179:129856545084137 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :521 129856549857104:129856550696919 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :522 -129856550698874:129856550698875 14696:14696 MARK(name(before HIP LaunchKernel)) 129856550702196:129856550702852 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :524 129856550704612:129856550705254 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :525 129856550707079:129856550709869 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :526 -129856550711442:129856550711443 14696:14696 MARK(name(after HIP LaunchKernel)) 129856550713182:129856552568840 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :528 129856557336788:129856558182426 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :529 -129856558184195:129856558184196 14696:14696 MARK(name(before HIP LaunchKernel)) 129856558187727:129856558188380 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :531 129856558190122:129856558190752 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :532 129856558192774:129856558195554 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :533 -129856558197324:129856558197325 14696:14696 MARK(name(after HIP LaunchKernel)) 129856558199234:129856560041419 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :535 129856564809360:129856565545640 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :536 -129856565547393:129856565547394 14696:14696 MARK(name(before HIP LaunchKernel)) 129856565549636:129856565550299 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :538 129856565551969:129856565552581 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :539 129856565554301:129856565557438 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :540 -129856565559047:129856565559048 14696:14696 MARK(name(after HIP LaunchKernel)) 129856565560847:129856567411065 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :542 129856572215770:129856572957492 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :543 -129856572959234:129856572959235 14696:14696 MARK(name(before HIP LaunchKernel)) 129856572962526:129856572963184 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :545 129856572964912:129856572965546 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :546 129856572967421:129856572970453 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :547 -129856572972097:129856572972098 14696:14696 MARK(name(after HIP LaunchKernel)) 129856572974076:129856574823083 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :549 129856579588261:129856580372449 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :550 -129856580374262:129856580374263 14696:14696 MARK(name(before HIP LaunchKernel)) 129856580376547:129856580377227 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :552 129856580378975:129856580379619 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :553 129856580381546:129856580384467 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :554 -129856580386225:129856580386226 14696:14696 MARK(name(after HIP LaunchKernel)) 129856580388205:129856582240020 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :556 129856587022783:129856587805709 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :557 -129856587807440:129856587807441 14696:14696 MARK(name(before HIP LaunchKernel)) 129856587811171:129856587811825 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :559 129856587813530:129856587814170 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :560 129856587816040:129856587819243 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :561 -129856587820912:129856587820913 14696:14696 MARK(name(after HIP LaunchKernel)) 129856587822927:129856589666874 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :563 129856594433516:129856595273993 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :564 -129856595275800:129856595275801 14696:14696 MARK(name(before HIP LaunchKernel)) 129856595278990:129856595279652 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :566 129856595281384:129856595282018 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :567 129856595283991:129856595287449 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :568 -129856595289101:129856595289102 14696:14696 MARK(name(after HIP LaunchKernel)) 129856595291045:129856597140491 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :570 129856601919460:129856602754655 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :571 -129856602756445:129856602756446 14696:14696 MARK(name(before HIP LaunchKernel)) 129856602769740:129856602770661 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :573 129856602772396:129856602773016 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :574 129856602775079:129856602778192 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :575 -129856602779755:129856602779756 14696:14696 MARK(name(after HIP LaunchKernel)) PASSED! ## Iteration (17) ################# PASSED! @@ -1055,97 +891,71 @@ PASSED! 129856699769937:129856701569372 0:0 CopyDeviceToHost:668:14696 129856602781709:129856604636152 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :577 129856609479851:129856610321075 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :578 -129856610323078:129856610323079 14696:14696 MARK(name(before HIP LaunchKernel)) 129856610326500:129856610327162 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :580 129856610328857:129856610329498 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :581 129856610331492:129856610334664 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :582 -129856610336290:129856610336291 14696:14696 MARK(name(after HIP LaunchKernel)) 129856610338048:129856612222255 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :584 129856616969217:129856617705105 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :585 -129856617706989:129856617706990 14696:14696 MARK(name(before HIP LaunchKernel)) 129856617710485:129856617711142 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :587 129856617712846:129856617713491 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :588 129856617715518:129856617718644 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :589 -129856617720274:129856617720275 14696:14696 MARK(name(after HIP LaunchKernel)) 129856617722118:129856619570993 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :591 129856624331436:129856625292310 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :592 -129856625294207:129856625294208 14696:14696 MARK(name(before HIP LaunchKernel)) 129856625297113:129856625297761 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :594 129856625299459:129856625300093 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :595 129856625301835:129856625305409 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :596 -129856625307116:129856625307117 14696:14696 MARK(name(after HIP LaunchKernel)) 129856625309051:129856627159676 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :598 129856631962417:129856632745795 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :599 -129856632747622:129856632747623 14696:14696 MARK(name(before HIP LaunchKernel)) 129856632761013:129856632761762 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :601 129856632763565:129856632764219 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :602 129856632766094:129856632769110 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :603 -129856632770707:129856632770708 14696:14696 MARK(name(after HIP LaunchKernel)) 129856632772662:129856634610068 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :605 129856639375744:129856640154106 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :606 -129856640155933:129856640155934 14696:14696 MARK(name(before HIP LaunchKernel)) 129856640159565:129856640160216 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :608 129856640161841:129856640162476 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :609 129856640164410:129856640167293 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :610 -129856640168886:129856640168887 14696:14696 MARK(name(after HIP LaunchKernel)) 129856640170703:129856642054780 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :612 129856646841774:129856647623131 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :613 -129856647624849:129856647624850 14696:14696 MARK(name(before HIP LaunchKernel)) 129856647628076:129856647628742 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :615 129856647630426:129856647631050 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :616 129856647632957:129856647636281 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :617 -129856647637872:129856647637873 14696:14696 MARK(name(after HIP LaunchKernel)) 129856647639599:129856649488719 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :619 129856654273909:129856655105030 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :620 -129856655106878:129856655106879 14696:14696 MARK(name(before HIP LaunchKernel)) 129856655109847:129856655110497 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :622 129856655112292:129856655112914 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :623 129856655114757:129856655118162 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :624 -129856655119835:129856655119836 14696:14696 MARK(name(after HIP LaunchKernel)) 129856655121792:129856656973292 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :626 PASSED! ## Iteration (4) ################# 129856661755424:129856662589447 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :627 -129856662591236:129856662591237 14696:14696 MARK(name(before HIP LaunchKernel)) 129856662604066:129856662604831 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :629 129856662606611:129856662607261 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :630 129856662608995:129856662611988 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :631 -129856662613644:129856662613645 14696:14696 MARK(name(after HIP LaunchKernel)) 129856662615584:129856664462467 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :633 129856669256336:129856670039683 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :634 -129856670041634:129856670041635 14696:14696 MARK(name(before HIP LaunchKernel)) 129856670054499:129856670055254 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :636 129856670056982:129856670057615 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :637 129856670059351:129856670062513 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :638 -129856670064113:129856670064114 14696:14696 MARK(name(after HIP LaunchKernel)) 129856670066200:129856671906923 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :640 129856676668791:129856677404223 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :641 -129856677406068:129856677406069 14696:14696 MARK(name(before HIP LaunchKernel)) 129856677408812:129856677409484 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :643 129856677411095:129856677411722 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :644 129856677413461:129856677416941 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :645 -129856677418503:129856677418504 14696:14696 MARK(name(after HIP LaunchKernel)) 129856677420242:129856679269939 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :647 129856684019418:129856684826552 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :648 -129856684828363:129856684828364 14696:14696 MARK(name(before HIP LaunchKernel)) 129856684832034:129856684832695 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :650 129856684834368:129856684834970 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :651 129856684836877:129856684839963 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :652 -129856684841560:129856684841561 14696:14696 MARK(name(after HIP LaunchKernel)) 129856684843320:129856686688518 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :654 129856691504696:129856692288950 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :655 -129856692290798:129856692290799 14696:14696 MARK(name(before HIP LaunchKernel)) 129856692292859:129856692293513 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :657 129856692295227:129856692295860 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :658 129856692297819:129856692300821 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :659 -129856692302355:129856692302356 14696:14696 MARK(name(after HIP LaunchKernel)) 129856692304530:129856694153679 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :661 129856698928289:129856699716162 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :662 -129856699717890:129856699717891 14696:14696 MARK(name(before HIP LaunchKernel)) 129856699720061:129856699720715 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :664 129856699722330:129856699722941 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :665 129856699724836:129856699728198 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :666 -129856699729953:129856699729954 14696:14696 MARK(name(after HIP LaunchKernel)) 129856699731887:129856701581422 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :668 PASSED! ## Iteration (3) ################# @@ -1172,39 +982,29 @@ PASSED! 129856737053267:129856738276147 0:0 KernelExecution:701:14696 129856737025461:129856738822547 0:0 CopyDeviceToHost:703:14696 129856706409352:129856707238410 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :669 -129856707240341:129856707240342 14696:14696 MARK(name(before HIP LaunchKernel)) 129856707253495:129856707254390 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :671 129856707256214:129856707256878 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :672 129856707258659:129856707261885 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :673 -129856707263518:129856707263519 14696:14696 MARK(name(after HIP LaunchKernel)) 129856707265698:129856709110388 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :675 129856713891418:129856714734007 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :676 -129856714735794:129856714735795 14696:14696 MARK(name(before HIP LaunchKernel)) 129856714739058:129856714739715 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :678 129856714741339:129856714741972 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :679 129856714743986:129856714747316 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :680 -129856714748993:129856714748994 14696:14696 MARK(name(after HIP LaunchKernel)) 129856714750976:129856716607126 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :682 129856721364192:129856722196489 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :683 -129856722198322:129856722198323 14696:14696 MARK(name(before HIP LaunchKernel)) 129856722202102:129856722202759 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :685 129856722204452:129856722205080 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :686 129856722207098:129856722210100 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :687 -129856722211652:129856722211653 14696:14696 MARK(name(after HIP LaunchKernel)) 129856722213452:129856724068250 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :689 129856728873958:129856729610520 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :690 -129856729612474:129856729612475 14696:14696 MARK(name(before HIP LaunchKernel)) 129856729615953:129856729616618 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :692 129856729618275:129856729618880 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :693 129856729620844:129856729623983 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :694 -129856729625525:129856729625526 14696:14696 MARK(name(after HIP LaunchKernel)) 129856729627363:129856731472859 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :696 129856736212718:129856736966611 14696:14696 hipMemcpy(dst=0x7fd65ce00000, src=0x7fd7781ff010, sizeBytes=4194304, kind=1) :697 -129856736968384:129856736968385 14696:14696 MARK(name(before HIP LaunchKernel)) 129856736971498:129856736972186 14696:14696 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :699 129856736973934:129856736974581 14696:14696 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :700 129856736976433:129856736979849 14696:14696 hipLaunchKernel(function_address=0x4010c0, numBlocks={}, dimBlocks={}, args=0x7ffe6d9cea08, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :701 -129856736981559:129856736981560 14696:14696 MARK(name(after HIP LaunchKernel)) 129856736983603:129856738834349 14696:14696 hipMemcpy(dst=0x7fd65d707010, src=0x7fd65c800000, sizeBytes=4194304, kind=2) :703 129856743571751:129856743607276 14696:14696 hipFree(ptr=0x7fd65ce00000) :704 129856743609591:129856743621235 14696:14696 hipFree(ptr=0x7fd65c800000) :705 diff --git a/test/golden_traces/MatrixTranspose_hip_input_trace.txt b/test/golden_traces/MatrixTranspose_hip_input_trace.txt index 8f68254c5b..261381618b 100644 --- a/test/golden_traces/MatrixTranspose_hip_input_trace.txt +++ b/test/golden_traces/MatrixTranspose_hip_input_trace.txt @@ -408,404 +408,204 @@ PASSED! 4496524903280142:4496524903426608 880592:880592 hipMalloc(ptr=0x7f14c3000000, size=4194304) :1 4496524903446365:4496524903573365 880592:880592 hipMalloc(ptr=0x7f14c2800000, size=4194304) :2 4496524903588203:4496525133627902 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :3 -4496525133635787:4496525133635788 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525134199640:4496525134199641 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525134207305:4496525140607184 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :6 4496525154755917:4496525158532879 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :7 -4496525158535584:4496525158535585 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525158550863:4496525158550864 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525158552125:4496525163335997 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :10 4496525175814741:4496525179506102 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :11 -4496525179507855:4496525179507856 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525179517513:4496525179517514 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525179519266:4496525184300123 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :14 4496525196393148:4496525200179318 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :15 -4496525200180801:4496525200180802 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525200188466:4496525200188467 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525200189638:4496525204936449 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :18 4496525216744046:4496525220425409 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :19 -4496525220430760:4496525220430761 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525220437733:4496525220437734 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525220438995:4496525225172542 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :22 4496525236900238:4496525240619832 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :23 -4496525240621355:4496525240621356 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525240632276:4496525240632277 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525240633478:4496525245363489 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :26 4496525257076899:4496525260752009 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :27 -4496525260753792:4496525260753793 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525260764202:4496525260764203 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525260765474:4496525265528037 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :30 4496525278601381:4496525282344690 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :31 -4496525282346172:4496525282346173 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525282352745:4496525282352746 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525282356923:4496525287062988 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :34 4496525298199228:4496525301976453 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :35 -4496525301977805:4496525301977806 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525301985179:4496525301985180 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525301989357:4496525306701493 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :38 4496525319442590:4496525323149401 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :39 -4496525323150894:4496525323150895 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525323157957:4496525323157958 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525323159049:4496525327878419 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :42 4496525340212129:4496525343964345 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :43 -4496525343965688:4496525343965689 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525343972501:4496525343972502 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525343973583:4496525348741845 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :46 4496525360729852:4496525364398150 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :47 -4496525364403590:4496525364403591 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525364410854:4496525364410855 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525364412076:4496525369144271 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :50 4496525381014837:4496525384667765 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :51 -4496525384672134:4496525384672135 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525384679758:4496525384679759 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525384680900:4496525389438431 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :54 4496525401191155:4496525404934986 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :55 -4496525404936389:4496525404936390 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525404945757:4496525404945758 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525404946919:4496525410298471 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :58 4496525423502872:4496525427227196 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :59 -4496525427228929:4496525427228930 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525427240851:4496525427240852 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525427242074:4496525431931367 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :62 4496525444940650:4496525448596826 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :63 -4496525448598570:4496525448598571 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525448605503:4496525448605504 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525448609119:4496525453319692 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :66 4496525464825952:4496525468507253 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :67 -4496525468508586:4496525468508587 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525468515599:4496525468515600 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525468516811:4496525473221545 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :70 4496525484776165:4496525488428212 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :71 -4496525488429845:4496525488429846 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525488437419:4496525488437420 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525488438561:4496525493128415 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :74 4496525504724173:4496525508381501 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :75 -4496525508383023:4496525508383024 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525508389967:4496525508389968 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525508391049:4496525513111039 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :78 4496525524703772:4496525528368253 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :79 -4496525528373653:4496525528373654 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525528380236:4496525528380237 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525528381448:4496525533087222 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :82 4496525544743344:4496525548393326 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :83 -4496525548394819:4496525548394820 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525548404588:4496525548404589 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525548405820:4496525553108910 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :86 4496525564776353:4496525568419633 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :87 -4496525568421026:4496525568421027 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525568430434:4496525568430435 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525568431526:4496525573146797 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :90 4496525584773363:4496525588428076 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :91 -4496525588429449:4496525588429450 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525588436592:4496525588436593 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525588441251:4496525593151694 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :94 4496525604951276:4496525608612772 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :95 -4496525608614626:4496525608614627 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525608621939:4496525608621940 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525608626318:4496525613335408 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :98 4496525624925244:4496525628593993 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :99 -4496525628595485:4496525628595486 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525628603070:4496525628603071 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525628604623:4496525633324024 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :102 4496525644955148:4496525648653793 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :103 -4496525648655416:4496525648655417 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525648662599:4496525648662600 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525648663752:4496525653416343 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :106 4496525665022200:4496525668655764 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :107 -4496525668661865:4496525668661866 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525668668568:4496525668668569 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525668669820:4496525673415239 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :110 4496525685021526:4496525688656242 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :111 -4496525688661842:4496525688661843 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525688668305:4496525688668306 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525688669547:4496525693410117 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :114 4496525705048605:4496525708697446 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :115 -4496525708698938:4496525708698939 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525708709679:4496525708709680 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525708710921:4496525713450741 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :118 4496525725057529:4496525728701911 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :119 -4496525728703444:4496525728703445 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525728713643:4496525728713644 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525728714956:4496525733453982 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :122 4496525745101558:4496525748716245 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :123 -4496525748717458:4496525748717459 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525748724611:4496525748724612 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525748728729:4496525753469559 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :126 4496525765097578:4496525768729748 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :127 -4496525768730961:4496525768730962 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525768738184:4496525768738185 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525768739346:4496525773486869 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :130 4496525785153981:4496525788889836 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :131 -4496525788891139:4496525788891140 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525788898142:4496525788898143 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525788899334:4496525793625478 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :134 4496525806694594:4496525810379663 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :135 -4496525810381096:4496525810381097 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525810388580:4496525810388581 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525810389762:4496525815062083 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :138 4496525829025717:4496525832652416 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :139 -4496525832657686:4496525832657687 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525832664930:4496525832664931 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525832666232:4496525838020960 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :142 4496525851335449:4496525855079079 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :143 -4496525855085421:4496525855085422 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525855093967:4496525855093968 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525855095120:4496525859768263 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :146 4496525873262060:4496525876972367 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :147 -4496525876974080:4496525876974081 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525876984951:4496525876984952 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525876986173:4496525881732493 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :150 4496525894813432:4496525898344842 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :151 -4496525898346185:4496525898346186 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525898353449:4496525898353450 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525898357967:4496525903025769 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :154 4496525914049899:4496525917708138 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :155 -4496525917709640:4496525917709641 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525917717645:4496525917717646 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525917721533:4496525922419974 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :158 4496525933083213:4496525936861418 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :159 -4496525936863392:4496525936863393 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525936870265:4496525936870266 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525936871808:4496525941569528 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :162 4496525952271099:4496525956051338 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :163 -4496525956052891:4496525956052892 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525956060355:4496525956060356 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525956061647:4496525960747143 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :166 4496525973345872:4496525977113719 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :167 -4496525977118778:4496525977118779 880592:880592 MARK(name(before HIP LaunchKernel)) -4496525977126052:4496525977126053 880592:880592 MARK(name(after HIP LaunchKernel)) 4496525977127134:4496525981829511 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :170 4496525996273891:4496525999995089 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :171 -4496526000000189:4496526000000190 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526000007312:4496526000007313 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526000008564:4496526004736400 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :174 4496526016480127:4496526020175927 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :175 -4496526020177280:4496526020177281 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526020187950:4496526020187951 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526020189152:4496526024907620 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :178 4496526036737941:4496526040392402 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :179 -4496526040393895:4496526040393896 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526040404845:4496526040404846 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526040406088:4496526045126310 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :182 4496526056750972:4496526060387640 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :183 -4496526060388933:4496526060388934 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526060396076:4496526060396077 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526060400274:4496526065106138 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :186 4496526076767389:4496526080447340 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :187 -4496526080448782:4496526080448783 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526080455275:4496526080455276 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526080456357:4496526085186276 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :190 4496526096786342:4496526100434311 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :191 -4496526100435814:4496526100435815 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526100442497:4496526100442498 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526100443629:4496526105161156 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :194 4496526116801218:4496526120501776 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :195 -4496526120503329:4496526120503330 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526120510072:4496526120510073 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526120511514:4496526125217650 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :198 4496526136832464:4496526140494920 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :199 -4496526140500110:4496526140500111 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526140507885:4496526140507886 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526140509047:4496526145220241 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :202 4496526156843100:4496526160502872 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :203 -4496526160507441:4496526160507442 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526160514635:4496526160514636 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526160515847:4496526165229165 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :206 4496526176867433:4496526180510052 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :207 -4496526180511384:4496526180511385 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526180521073:4496526180521074 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526180522345:4496526185229233 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :210 4496526196882068:4496526200511312 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :211 -4496526200512644:4496526200512645 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526200519086:4496526200519087 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526200522904:4496526205229030 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :214 4496526216885692:4496526220532459 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :215 -4496526220533741:4496526220533742 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526220540234:4496526220540235 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526220544051:4496526225248913 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :218 4496526236953526:4496526240608640 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :219 -4496526240610032:4496526240610033 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526240617316:4496526240617317 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526240618608:4496526245336946 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :222 4496526257032562:4496526260697764 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :223 -4496526260699086:4496526260699087 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526260705799:4496526260705800 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526260706901:4496526266068673 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :226 4496526279332747:4496526283108167 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :227 -4496526283114379:4496526283114380 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526283122765:4496526283122766 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526283124067:4496526287796549 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :230 4496526301304112:4496526305009459 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :231 -4496526305014168:4496526305014169 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526305022153:4496526305022154 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526305023315:4496526309749930 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :234 4496526322801743:4496526326516899 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :235 -4496526326518893:4496526326518894 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526326533039:4496526326533040 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526326534903:4496526331245847 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :238 4496526340107579:4496526343906984 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :239 -4496526343908958:4496526343908959 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526343922443:4496526343922444 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526343924247:4496526348732695 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :242 4496526360672632:4496526364342794 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :243 -4496526364344246:4496526364344247 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526364351580:4496526364351581 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526364356309:4496526369073956 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :246 4496526380921729:4496526384554339 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :247 -4496526384555681:4496526384555682 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526384563015:4496526384563016 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526384564297:4496526389280813 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :250 4496526401055448:4496526404706814 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :251 -4496526404708236:4496526404708237 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526404715179:4496526404715180 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526404716291:4496526409453775 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :254 4496526421231786:4496526424938237 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :255 -4496526424939570:4496526424939571 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526424946152:4496526424946153 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526424947284:4496526429644452 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :258 4496526442708689:4496526446413777 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :259 -4496526446418566:4496526446418567 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526446425690:4496526446425691 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526446426842:4496526451217265 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :262 4496526463698402:4496526467373874 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :263 -4496526467379615:4496526467379616 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526467388151:4496526467388152 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526467389634:4496526472081051 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :266 4496526484017822:4496526487658527 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :267 -4496526487660120:4496526487660121 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526487671221:4496526487671222 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526487672484:4496526492365545 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :270 4496526504217596:4496526507940206 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :271 -4496526507941599:4496526507941600 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526507948341:4496526507948342 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526507952269:4496526512732904 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :274 4496526524481750:4496526528181919 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :275 -4496526528183281:4496526528183282 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526528190385:4496526528190386 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526528194643:4496526532912630 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :278 4496526544545337:4496526548219016 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :279 -4496526548220469:4496526548220470 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526548227472:4496526548227473 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526548228644:4496526552953164 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :282 4496526564603244:4496526568298141 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :283 -4496526568300125:4496526568300126 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526568306718:4496526568306719 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526568308411:4496526573022752 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :286 4496526584675307:4496526588335099 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :287 -4496526588336581:4496526588336582 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526588343565:4496526588343566 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526588344907:4496526593063886 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :290 4496526604685893:4496526608347148 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :291 -4496526608352378:4496526608352379 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526608359341:4496526608359342 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526608360543:4496526613066458 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :294 4496526624712120:4496526628367043 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :295 -4496526628368456:4496526628368457 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526628378575:4496526628378576 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526628379787:4496526633084449 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :298 4496526644736553:4496526648383901 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :299 -4496526648385494:4496526648385495 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526648394792:4496526648394793 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526648395974:4496526653098974 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :302 4496526664769242:4496526668420808 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :303 -4496526668422211:4496526668422212 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526668428923:4496526668428924 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526668433191:4496526673144235 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :306 4496526684807961:4496526689128249 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :307 -4496526689129702:4496526689129703 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526689136916:4496526689136917 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526689138038:4496526693842629 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :310 4496526706935721:4496526710671858 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :311 -4496526710673421:4496526710673422 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526710680895:4496526710680896 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526710682528:4496526715357624 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :314 4496526728844507:4496526732497026 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :315 -4496526732498649:4496526732498650 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526732506164:4496526732506165 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526732507246:4496526737198843 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :318 4496526748886113:4496526752517561 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :319 -4496526752522671:4496526752522672 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526752529534:4496526752529535 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526752530505:4496526757248855 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :322 4496526768940533:4496526772608911 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :323 -4496526772614301:4496526772614302 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526772620994:4496526772620995 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526772622196:4496526777347416 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :326 4496526789025531:4496526792698958 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :327 -4496526792700511:4496526792700512 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526792710941:4496526792710942 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526792712093:4496526797464554 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :330 4496526809125575:4496526812718051 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :331 -4496526812719434:4496526812719435 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526812727048:4496526812727049 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526812731336:4496526817481033 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :334 4496526829138567:4496526832879692 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :335 -4496526832880944:4496526832880945 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526832887747:4496526832887748 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526832891444:4496526837636884 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :338 4496526849206473:4496526852946255 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :339 -4496526852947527:4496526852947528 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526852953829:4496526852953830 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526852954871:4496526857658531 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :342 4496526869245494:4496526873593022 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :343 -4496526873594705:4496526873594706 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526873602520:4496526873602521 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526873604183:4496526878299818 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :346 4496526891597135:4496526895318503 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :347 -4496526895320266:4496526895320267 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526895328381:4496526895328382 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526895329664:4496526900009158 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :350 4496526913485803:4496526917173899 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :351 -4496526917179309:4496526917179310 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526917186683:4496526917186684 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526917187725:4496526921890463 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :354 4496526934966763:4496526938716654 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :355 -4496526938717977:4496526938717978 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526938728427:4496526938728428 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526938729629:4496526943439361 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :358 4496526957411730:4496526961125205 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :359 -4496526961126547:4496526961126548 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526961136536:4496526961136537 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526961138059:4496526965826390 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :362 4496526978879125:4496526982620470 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :363 -4496526982621833:4496526982621834 880592:880592 MARK(name(before HIP LaunchKernel)) -4496526982628466:4496526982628467 880592:880592 MARK(name(after HIP LaunchKernel)) 4496526982632643:4496526987311768 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :366 4496527000778785:4496527004436191 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :367 -4496527004437654:4496527004437655 880592:880592 MARK(name(before HIP LaunchKernel)) -4496527004445078:4496527004445079 880592:880592 MARK(name(after HIP LaunchKernel)) 4496527004448955:4496527009161343 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :370 4496527020723638:4496527024395191 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :371 -4496527024396794:4496527024396795 880592:880592 MARK(name(before HIP LaunchKernel)) -4496527024403457:4496527024403458 880592:880592 MARK(name(after HIP LaunchKernel)) 4496527024404639:4496527029129138 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :374 4496527040699580:4496527044353630 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :375 -4496527044355043:4496527044355044 880592:880592 MARK(name(before HIP LaunchKernel)) -4496527044361916:4496527044361917 880592:880592 MARK(name(after HIP LaunchKernel)) 4496527044363048:4496527049060306 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :378 4496527060632609:4496527064307921 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :379 -4496527064313732:4496527064313733 880592:880592 MARK(name(before HIP LaunchKernel)) -4496527064320805:4496527064320806 880592:880592 MARK(name(after HIP LaunchKernel)) 4496527064321907:4496527069027702 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :382 4496527080621436:4496527084288380 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :383 -4496527084292949:4496527084292950 880592:880592 MARK(name(before HIP LaunchKernel)) -4496527084299932:4496527084299933 880592:880592 MARK(name(after HIP LaunchKernel)) 4496527084301195:4496527089011037 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :386 4496527100657080:4496527104315719 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :387 -4496527104317693:4496527104317694 880592:880592 MARK(name(before HIP LaunchKernel)) -4496527104327251:4496527104327252 880592:880592 MARK(name(after HIP LaunchKernel)) 4496527104328433:4496527109036020 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :390 4496527120665231:4496527125002391 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :391 -4496527125004065:4496527125004066 880592:880592 MARK(name(before HIP LaunchKernel)) -4496527125011499:4496527125011500 880592:880592 MARK(name(after HIP LaunchKernel)) 4496527125016488:4496527129737942 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :394 4496527143046309:4496527146717213 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :395 -4496527146718826:4496527146718827 880592:880592 MARK(name(before HIP LaunchKernel)) -4496527146726520:4496527146726521 880592:880592 MARK(name(after HIP LaunchKernel)) 4496527146730868:4496527151451590 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :398 4496527163132549:4496527166937384 880592:880592 hipMemcpy(dst=0x7f14c3000000, src=0x7f14c3cff010, sizeBytes=4194304, kind=1) :399 -4496527166938797:4496527166938798 880592:880592 MARK(name(before HIP LaunchKernel)) -4496527166946050:4496527166946051 880592:880592 MARK(name(after HIP LaunchKernel)) 4496527166947223:4496527171616068 880592:880592 hipMemcpy(dst=0x7f14c38fe010, src=0x7f14c2800000, sizeBytes=4194304, kind=2) :402 4496527185123250:4496527185153196 880592:880592 hipFree(ptr=0x7f14c3000000) :403 4496527185154519:4496527185168716 880592:880592 hipFree(ptr=0x7f14c2800000) :404 diff --git a/test/golden_traces/MatrixTranspose_hip_period_trace.txt b/test/golden_traces/MatrixTranspose_hip_period_trace.txt index caa2d63885..249eceda88 100644 --- a/test/golden_traces/MatrixTranspose_hip_period_trace.txt +++ b/test/golden_traces/MatrixTranspose_hip_period_trace.txt @@ -208,251 +208,51 @@ PASSED! 3802699752571489:3802699752686289 1983:1983 hipMalloc(ptr=0x7f6c121ff010, size=4194304) 3802699752688639:3802699752749390 1983:1983 hipMalloc(ptr=0x7fffefcadf28, size=4194304) 3802699752763840:3802700027958750 1983:1983 hipMemcpy(dst=0x7f6c11400000, src=0x7f6c121ff010, sizeBytes=4194304, kind=1) -3802700027966800:3802700027966801 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700028567724:3802700028567725 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700041950374:3802700041950375 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700041963674:3802700041963675 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700054151914:3802700054151915 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700054162714:3802700054162715 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700066165433:3802700066165434 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700066176343:3802700066176344 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700078181322:3802700078181323 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700078192012:3802700078192013 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700090220561:3802700090220562 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700090239211:3802700090239212 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700102271721:3802700102271722 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700102282171:3802700102282172 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700114144958:3802700114144959 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700114162049:3802700114162050 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700126128128:3802700126128129 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700126138758:3802700126138759 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700138129156:3802700138129157 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700138139446:3802700138139447 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700150136865:3802700150136866 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700150148016:3802700150148017 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700162246915:3802700162246916 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700162258105:3802700162258106 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700174131823:3802700174131824 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700174149233:3802700174149234 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700186413294:3802700186413295 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700186424475:3802700186424476 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700198692895:3802700198692896 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700198703415:3802700198703416 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700210532173:3802700210532174 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700210542783:3802700210542784 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700222880184:3802700222880185 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700222891274:3802700222891275 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700234962094:3802700234962095 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700234972984:3802700234972985 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700247111934:3802700247111935 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700247122294:3802700247122295 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700259114883:3802700259114884 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700259131593:3802700259131594 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700270919381:3802700270919382 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700270930441:3802700270930442 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700282944209:3802700282944210 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700282954850:3802700282954851 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700294960369:3802700294960370 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700294970439:3802700294970440 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700306951068:3802700306951069 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700306963188:3802700306963189 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700318935636:3802700318935637 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700318952436:3802700318952437 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700330939575:3802700330939576 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700330957096:3802700330957097 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700342957675:3802700342957676 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700342976555:3802700342976556 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700354958353:3802700354958354 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700354969733:3802700354969734 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700367116224:3802700367116225 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700367127874:3802700367127875 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700378910551:3802700378910552 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700378921781:3802700378921782 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700391300403:3802700391300404 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700391311253:3802700391311254 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700403119421:3802700403119422 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700403149901:3802700403149902 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700414928588:3802700414928589 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700414939088:3802700414939089 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700426957197:3802700426957198 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700426969607:3802700426969608 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700438945256:3802700438945257 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700438956156:3802700438956157 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700450955785:3802700450955786 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700450966535:3802700450966536 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700462947734:3802700462947735 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700462958494:3802700462958495 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700475120764:3802700475120765 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700475133244:3802700475133245 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700486943952:3802700486943953 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700486963842:3802700486963843 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700498936501:3802700498936502 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700498947611:3802700498947612 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700510957970:3802700510957971 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700510969340:3802700510969341 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700522956379:3802700522956380 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700522968409:3802700522968410 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700534942538:3802700534942539 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700534953908:3802700534953909 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700546789315:3802700546789316 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700546806236:3802700546806237 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700558559853:3802700558559854 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700558571313:3802700558571314 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700570153708:3802700570153709 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700570176129:3802700570176130 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700581726404:3802700581726405 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700581741565:3802700581741566 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700593057879:3802700593057880 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700593070449:3802700593070450 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700604400132:3802700604400133 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700604413112:3802700604413113 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700615730637:3802700615730638 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700615743157:3802700615743158 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700627079061:3802700627079062 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700627101981:3802700627101982 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700638410875:3802700638410876 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700638425755:3802700638425756 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700649752129:3802700649752130 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700649766079:3802700649766080 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700661088702:3802700661088703 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700661101353:3802700661101354 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700672436427:3802700672436428 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700672449997:3802700672449998 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700683973653:3802700683973654 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700683987193:3802700683987194 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700695366597:3802700695366598 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700695379007:3802700695379008 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700706708861:3802700706708862 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700706735151:3802700706735152 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700718019795:3802700718019796 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700718034725:3802700718034726 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700729346979:3802700729346980 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700729360039:3802700729360040 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700740688063:3802700740688064 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700740702553:3802700740702554 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700752045097:3802700752045098 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700752060217:3802700752060218 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700763470772:3802700763470773 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700763485762:3802700763485763 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700774801006:3802700774801007 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700774813776:3802700774813777 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700786122470:3802700786122471 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700786147830:3802700786147831 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700797490594:3802700797490595 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700797504834:3802700797504835 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700808806748:3802700808806749 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700808822388:3802700808822389 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700820150282:3802700820150283 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700820163482:3802700820163483 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700831687737:3802700831687738 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700831701867:3802700831701868 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700843073042:3802700843073043 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700843096032:3802700843096033 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700854417226:3802700854417227 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700854429236:3802700854429237 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700865753490:3802700865753491 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700865775180:3802700865775181 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700877105074:3802700877105075 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700877120554:3802700877120555 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700888576349:3802700888576350 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700888589579:3802700888589580 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700900086965:3802700900086966 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700900101025:3802700900101026 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700911461388:3802700911461389 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700911474589:3802700911474590 1983:1983 MARK(name(after HIP LaunchKernel)) -3802700922810673:3802700922810674 1983:1983 MARK(name(before HIP LaunchKernel)) -3802700922833153:3802700922833154 1983:1983 MARK(name(after HIP LaunchKernel)) 3802700932447414:3802700934135107 1983:1983 hipMemcpy(dst=0x7f6c11400000, src=0x7f6c121ff010, sizeBytes=4194304, kind=1) -3802700934139057:3802700934139058 1983:1983 MARK(name(before HIP LaunchKernel)) 3802700934143817:3802700934144527 1983:1983 __hipPushCallConfiguration(gridDim=, blockDim=, sharedMem=0, stream=0) 3802700934146607:3802700934147267 1983:1983 __hipPopCallConfiguration(gridDim=, blockDim=, sharedMem=140106682958042, stream=0xd8282e03f3099) 3802700934158787:3802700934164967 1983:1983 hipLaunchKernel(function_address=0x401030, numBlocks=, dimBlocks=, args=0x3b9aca00, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) -3802700934191267:3802700934191268 1983:1983 MARK(name(after HIP LaunchKernel)) 3802700934192847:3802700936775947 1983:1983 hipMemcpy(dst=0x7f6c11dfe010, src=0x7f6c10e00000, sizeBytes=4194304, kind=2) 3802700943795998:3802700945501111 1983:1983 hipMemcpy(dst=0x7f6c11400000, src=0x7f6c121ff010, sizeBytes=4194304, kind=1) -3802700945513191:3802700945513192 1983:1983 MARK(name(before HIP LaunchKernel)) 3802700945517031:3802700945517901 1983:1983 __hipPushCallConfiguration(gridDim=, blockDim=, sharedMem=0, stream=0) 3802700945519841:3802700945520521 1983:1983 __hipPopCallConfiguration(gridDim=, blockDim=, sharedMem=140106682958042, stream=0xd8282e0ecbb86) 3802700945522671:3802700945530171 1983:1983 hipLaunchKernel(function_address=0x401030, numBlocks=, dimBlocks=, args=0x3b9aca00, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) -3802700945531971:3802700945531972 1983:1983 MARK(name(after HIP LaunchKernel)) 3802700945534701:3802700948131020 1983:1983 hipMemcpy(dst=0x7f6c11dfe010, src=0x7f6c10e00000, sizeBytes=4194304, kind=2) 3802700955136442:3802700956839355 1983:1983 hipMemcpy(dst=0x7f6c11400000, src=0x7f6c121ff010, sizeBytes=4194304, kind=1) -3802700956843375:3802700956843376 1983:1983 MARK(name(before HIP LaunchKernel)) 3802700956847725:3802700956848495 1983:1983 __hipPushCallConfiguration(gridDim=, blockDim=, sharedMem=0, stream=0) 3802700956850235:3802700956850825 1983:1983 __hipPopCallConfiguration(gridDim=, blockDim=, sharedMem=140106682958042, stream=0xd8282e1999f61) 3802700956860545:3802700956868795 1983:1983 hipLaunchKernel(function_address=0x401030, numBlocks=, dimBlocks=, args=0x3b9aca00, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) -3802700956870695:3802700956870696 1983:1983 MARK(name(after HIP LaunchKernel)) 3802700956872065:3802700959479235 1983:1983 hipMemcpy(dst=0x7f6c11dfe010, src=0x7f6c10e00000, sizeBytes=4194304, kind=2) 3802700966505397:3802700968203670 1983:1983 hipMemcpy(dst=0x7f6c11400000, src=0x7f6c121ff010, sizeBytes=4194304, kind=1) -3802700968207780:3802700968207781 1983:1983 MARK(name(before HIP LaunchKernel)) 3802700968219030:3802700968219770 1983:1983 __hipPushCallConfiguration(gridDim=, blockDim=, sharedMem=0, stream=0) 3802700968221700:3802700968222280 1983:1983 __hipPopCallConfiguration(gridDim=, blockDim=, sharedMem=140106682958042, stream=0xd8282e247222e) 3802700968225090:3802700968233560 1983:1983 hipLaunchKernel(function_address=0x401030, numBlocks=, dimBlocks=, args=0x3b9aca00, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) -3802700968235360:3802700968235361 1983:1983 MARK(name(after HIP LaunchKernel)) 3802700968241120:3802700970853059 1983:1983 hipMemcpy(dst=0x7f6c11dfe010, src=0x7f6c10e00000, sizeBytes=4194304, kind=2) 3802700977859821:3802700979559833 1983:1983 hipMemcpy(dst=0x7f6c11400000, src=0x7f6c121ff010, sizeBytes=4194304, kind=1) -3802700979563253:3802700979563254 1983:1983 MARK(name(before HIP LaunchKernel)) 3802700979567803:3802700979568553 1983:1983 __hipPushCallConfiguration(gridDim=, blockDim=, sharedMem=0, stream=0) 3802700979570433:3802700979571073 1983:1983 __hipPopCallConfiguration(gridDim=, blockDim=, sharedMem=140106682958042, stream=0xd8282e2f44d18) 3802700979581243:3802700979589274 1983:1983 hipLaunchKernel(function_address=0x401030, numBlocks=, dimBlocks=, args=0x3b9aca00, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) -3802700979590674:3802700979590675 1983:1983 MARK(name(after HIP LaunchKernel)) 3802700979592044:3802700982222943 1983:1983 hipMemcpy(dst=0x7f6c11dfe010, src=0x7f6c10e00000, sizeBytes=4194304, kind=2) 3802700989239045:3802700990944838 1983:1983 hipMemcpy(dst=0x7f6c11400000, src=0x7f6c121ff010, sizeBytes=4194304, kind=1) -3802700990948338:3802700990948339 1983:1983 MARK(name(before HIP LaunchKernel)) 3802700990960008:3802700990960828 1983:1983 __hipPushCallConfiguration(gridDim=, blockDim=, sharedMem=0, stream=0) 3802700990963068:3802700990963638 1983:1983 __hipPopCallConfiguration(gridDim=, blockDim=, sharedMem=140106682958042, stream=0xd8282e3a221d9) 3802700990966328:3802700990975628 1983:1983 hipLaunchKernel(function_address=0x401030, numBlocks=, dimBlocks=, args=0x3b9aca00, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) -3802700990977238:3802700990977239 1983:1983 MARK(name(after HIP LaunchKernel)) 3802700990978718:3802700993694078 1983:1983 hipMemcpy(dst=0x7f6c11dfe010, src=0x7f6c10e00000, sizeBytes=4194304, kind=2) 3802701000919212:3802701002625515 1983:1983 hipMemcpy(dst=0x7f6c11400000, src=0x7f6c121ff010, sizeBytes=4194304, kind=1) -3802701002628745:3802701002628746 1983:1983 MARK(name(before HIP LaunchKernel)) 3802701002633405:3802701002634215 1983:1983 __hipPushCallConfiguration(gridDim=, blockDim=, sharedMem=0, stream=0) 3802701002635935:3802701002636515 1983:1983 __hipPopCallConfiguration(gridDim=, blockDim=, sharedMem=140106682958042, stream=0xd8282e45440c4) 3802701002649885:3802701002657855 1983:1983 hipLaunchKernel(function_address=0x401030, numBlocks=, dimBlocks=, args=0x3b9aca00, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) -3802701002659335:3802701002659336 1983:1983 MARK(name(after HIP LaunchKernel)) 3802701002660835:3802701005267024 1983:1983 hipMemcpy(dst=0x7f6c11dfe010, src=0x7f6c10e00000, sizeBytes=4194304, kind=2) 3802701012322026:3802701014008789 1983:1983 hipMemcpy(dst=0x7f6c11400000, src=0x7f6c121ff010, sizeBytes=4194304, kind=1) -3802701014011999:3802701014012000 1983:1983 MARK(name(before HIP LaunchKernel)) 3802701014023469:3802701014024239 1983:1983 __hipPushCallConfiguration(gridDim=, blockDim=, sharedMem=0, stream=0) 3802701014028089:3802701014028669 1983:1983 __hipPopCallConfiguration(gridDim=, blockDim=, sharedMem=140106682958042, stream=0xd8282e5020cc5) 3802701014031569:3802701014039849 1983:1983 hipLaunchKernel(function_address=0x401030, numBlocks=, dimBlocks=, args=0x3b9aca00, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) -3802701014041409:3802701014041410 1983:1983 MARK(name(after HIP LaunchKernel)) 3802701014042919:3802701016640288 1983:1983 hipMemcpy(dst=0x7f6c11dfe010, src=0x7f6c10e00000, sizeBytes=4194304, kind=2) 3802701023688501:3802701025398903 1983:1983 hipMemcpy(dst=0x7f6c11400000, src=0x7f6c121ff010, sizeBytes=4194304, kind=1) -3802701025402873:3802701025402874 1983:1983 MARK(name(before HIP LaunchKernel)) 3802701025407454:3802701025408214 1983:1983 __hipPushCallConfiguration(gridDim=, blockDim=, sharedMem=0, stream=0) 3802701025410224:3802701025411104 1983:1983 __hipPopCallConfiguration(gridDim=, blockDim=, sharedMem=140106682958042, stream=0xd8282e5afc125) 3802701025412944:3802701025420534 1983:1983 hipLaunchKernel(function_address=0x401030, numBlocks=, dimBlocks=, args=0x3b9aca00, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) -3802701025429704:3802701025429705 1983:1983 MARK(name(after HIP LaunchKernel)) 3802701025431374:3802701028050563 1983:1983 hipMemcpy(dst=0x7f6c11dfe010, src=0x7f6c10e00000, sizeBytes=4194304, kind=2) -3802701036808678:3802701036808679 1983:1983 MARK(name(before HIP LaunchKernel)) -3802701036822078:3802701036822079 1983:1983 MARK(name(after HIP LaunchKernel)) -3802701048170132:3802701048170133 1983:1983 MARK(name(before HIP LaunchKernel)) -3802701048184912:3802701048184913 1983:1983 MARK(name(after HIP LaunchKernel)) -3802701059593377:3802701059593378 1983:1983 MARK(name(before HIP LaunchKernel)) -3802701059607287:3802701059607288 1983:1983 MARK(name(after HIP LaunchKernel)) -3802701070985111:3802701070985112 1983:1983 MARK(name(before HIP LaunchKernel)) -3802701071008911:3802701071008912 1983:1983 MARK(name(after HIP LaunchKernel)) -3802701082354665:3802701082354666 1983:1983 MARK(name(before HIP LaunchKernel)) -3802701082369396:3802701082369397 1983:1983 MARK(name(after HIP LaunchKernel)) -3802701093751910:3802701093751911 1983:1983 MARK(name(before HIP LaunchKernel)) -3802701093766810:3802701093766811 1983:1983 MARK(name(after HIP LaunchKernel)) -3802701105308045:3802701105308046 1983:1983 MARK(name(before HIP LaunchKernel)) -3802701105323296:3802701105323297 1983:1983 MARK(name(after HIP LaunchKernel)) -3802701116675540:3802701116675541 1983:1983 MARK(name(before HIP LaunchKernel)) -3802701116689570:3802701116689571 1983:1983 MARK(name(after HIP LaunchKernel)) -3802701128156035:3802701128156036 1983:1983 MARK(name(before HIP LaunchKernel)) -3802701128181736:3802701128181737 1983:1983 MARK(name(after HIP LaunchKernel)) -3802701139551739:3802701139551740 1983:1983 MARK(name(before HIP LaunchKernel)) -3802701139565579:3802701139565580 1983:1983 MARK(name(after HIP LaunchKernel)) -3802701150939144:3802701150939145 1983:1983 MARK(name(before HIP LaunchKernel)) -3802701150961354:3802701150961355 1983:1983 MARK(name(after HIP LaunchKernel)) -3802701162295078:3802701162295079 1983:1983 MARK(name(before HIP LaunchKernel)) -3802701162308528:3802701162308529 1983:1983 MARK(name(after HIP LaunchKernel)) -3802701173678182:3802701173678183 1983:1983 MARK(name(before HIP LaunchKernel)) -3802701173692162:3802701173692163 1983:1983 MARK(name(after HIP LaunchKernel)) -3802701185053367:3802701185053368 1983:1983 MARK(name(before HIP LaunchKernel)) -3802701185066667:3802701185066668 1983:1983 MARK(name(after HIP LaunchKernel)) 3802700025923715:3802700027953920 0:0 CopyHostToDevice:4:1983 3802700932468645:3802700934131397 0:0 CopyHostToDevice:159:1983 3802700934227596:3802700935424394 0:0 KernelExecution:163:1983 diff --git a/test/golden_traces/MatrixTranspose_sys_hsa_trace.txt b/test/golden_traces/MatrixTranspose_sys_hsa_trace.txt index 136cf1488d..a92b7d58a9 100644 --- a/test/golden_traces/MatrixTranspose_sys_hsa_trace.txt +++ b/test/golden_traces/MatrixTranspose_sys_hsa_trace.txt @@ -5144,704 +5144,504 @@ ROCTracer (pid=158131): 337766975606005:337766975727544 158131:158131 hipMalloc(ptr=0x7f3e43000000, size=4194304) :2 337766975729067:337766975854995 158131:158131 hipMalloc(ptr=0x7f3e42800000, size=4194304) :3 337766975868801:337767194313754 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :4 -337767194318883:337767194318884 158131:158131 MARK(name(before HIP LaunchKernel)) 337767194342478:337767194343830 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :6 337767194346004:337767194346485 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :7 337767194348239:337767194857128 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :8 -337767194872548:337767194872549 158131:158131 MARK(name(after HIP LaunchKernel)) 337767194877096:337767198600589 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :10 337767211443633:337767213698847 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :11 -337767213700460:337767213700461 158131:158131 MARK(name(before HIP LaunchKernel)) 337767213705559:337767213706150 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :13 337767213707283:337767213707753 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :14 337767213709958:337767213724806 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :15 -337767213726569:337767213726570 158131:158131 MARK(name(after HIP LaunchKernel)) 337767213728493:337767215930456 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :17 337767228387752:337767230638347 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :18 -337767230639619:337767230639620 158131:158131 MARK(name(before HIP LaunchKernel)) 337767230645540:337767230646081 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :20 337767230647023:337767230647865 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :21 337767230648726:337767230660429 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :22 -337767230661911:337767230661912 158131:158131 MARK(name(after HIP LaunchKernel)) 337767230664256:337767232863504 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :24 337767243411499:337767245697039 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :25 -337767245698882:337767245698883 158131:158131 MARK(name(before HIP LaunchKernel)) 337767245705184:337767245705765 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :27 337767245707098:337767245707689 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :28 337767245711677:337767245727186 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :29 -337767245729220:337767245729221 158131:158131 MARK(name(after HIP LaunchKernel)) 337767245733127:337767247954105 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :31 337767256142289:337767258320928 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :32 -337767258322752:337767258322753 158131:158131 MARK(name(before HIP LaunchKernel)) 337767258328102:337767258328503 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :34 337767258329374:337767258330206 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :35 337767258330987:337767258342148 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :36 -337767258343721:337767258343722 158131:158131 MARK(name(after HIP LaunchKernel)) 337767258346667:337767260513855 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :38 337767270817268:337767273062733 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :39 -337767273064547:337767273064548 158131:158131 MARK(name(before HIP LaunchKernel)) 337767273070348:337767273070919 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :41 337767273072292:337767273072913 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :42 337767273077181:337767273093912 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :43 -337767273095986:337767273095987 158131:158131 MARK(name(after HIP LaunchKernel)) 337767273099132:337767275379964 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :45 337767283563870:337767285732370 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :46 -337767285733633:337767285733634 158131:158131 MARK(name(before HIP LaunchKernel)) 337767285739734:337767285740285 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :48 337767285741207:337767285741668 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :49 337767285742469:337767285753019 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :50 -337767285755083:337767285755084 158131:158131 MARK(name(after HIP LaunchKernel)) 337767285757818:337767287927761 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :52 337767297920088:337767300172035 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :53 -337767300173809:337767300173810 158131:158131 MARK(name(before HIP LaunchKernel)) 337767300179620:337767300180261 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :55 337767300181513:337767300182285 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :56 337767300186312:337767300202703 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :57 -337767300204958:337767300204959 158131:158131 MARK(name(after HIP LaunchKernel)) 337767300208164:337767302399998 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :59 337767310566371:337767312698212 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :60 -337767312701368:337767312701369 158131:158131 MARK(name(before HIP LaunchKernel)) 337767312705676:337767312706147 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :62 337767312707008:337767312707459 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :63 337767312708261:337767312720814 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :64 -337767312722297:337767312722298 158131:158131 MARK(name(after HIP LaunchKernel)) 337767312725162:337767314905485 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :66 337767324225302:337767326630218 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :67 -337767326632171:337767326632172 158131:158131 MARK(name(before HIP LaunchKernel)) 337767326638293:337767326639004 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :69 337767326640347:337767326641088 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :70 337767326644284:337767326659503 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :71 -337767326662058:337767326662059 158131:158131 MARK(name(after HIP LaunchKernel)) 337767326665324:337767328874220 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :73 337767341730008:337767343889150 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :74 -337767343891364:337767343891365 158131:158131 MARK(name(before HIP LaunchKernel)) 337767343895582:337767343895963 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :76 337767343896855:337767343897276 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :77 337767343898067:337767343909118 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :78 -337767343910821:337767343910822 158131:158131 MARK(name(after HIP LaunchKernel)) 337767343914097:337767346149393 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :80 337767357340201:337767359602798 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :81 -337767359604041:337767359604042 158131:158131 MARK(name(before HIP LaunchKernel)) 337767359607898:337767359608229 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :83 337767359609191:337767359609641 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :84 337767359612637:337767359624790 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :85 -337767359626142:337767359626143 158131:158131 MARK(name(after HIP LaunchKernel)) 337767359628226:337767362392901 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :87 337767370583520:337767372727504 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :88 -337767372729918:337767372729919 158131:158131 MARK(name(before HIP LaunchKernel)) 337767372734026:337767372734597 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :90 337767372735338:337767372736060 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :91 337767372736931:337767372748102 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :92 -337767372750006:337767372750007 158131:158131 MARK(name(after HIP LaunchKernel)) 337767372753082:337767374911783 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :94 337767386842927:337767389026054 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :95 -337767389027407:337767389027408 158131:158131 MARK(name(before HIP LaunchKernel)) 337767389032176:337767389032757 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :97 337767389034631:337767389035061 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :98 337767389035893:337767389047835 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :99 -337767389049208:337767389049209 158131:158131 MARK(name(after HIP LaunchKernel)) 337767389051653:337767391262963 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :101 337767401302348:337767403625540 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :102 -337767403631150:337767403631151 158131:158131 MARK(name(before HIP LaunchKernel)) 337767403636711:337767403637442 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :104 337767403638775:337767403639406 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :105 337767403640658:337767403655196 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :106 -337767403657119:337767403657120 158131:158131 MARK(name(after HIP LaunchKernel)) 337767403661508:337767405850096 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :108 337767414038200:337767416155293 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :109 -337767416157006:337767416157007 158131:158131 MARK(name(before HIP LaunchKernel)) 337767416161023:337767416161414 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :111 337767416164199:337767416164761 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :112 337767416165562:337767416175861 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :113 -337767416177174:337767416177175 158131:158131 MARK(name(after HIP LaunchKernel)) 337767416179899:337767418323041 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :115 337767426540801:337767428694984 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :116 -337767428697219:337767428697220 158131:158131 MARK(name(before HIP LaunchKernel)) 337767428701006:337767428701396 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :118 337767428702178:337767428702759 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :119 337767428703530:337767428713249 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :120 -337767428715854:337767428715855 158131:158131 MARK(name(after HIP LaunchKernel)) 337767428718048:337767430853946 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :122 337767442974988:337767445133299 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :123 -337767445134602:337767445134603 158131:158131 MARK(name(before HIP LaunchKernel)) 337767445138419:337767445138820 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :125 337767445141455:337767445141895 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :126 337767445142757:337767445153267 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :127 -337767445154730:337767445154731 158131:158131 MARK(name(after HIP LaunchKernel)) 337767445156874:337767447277203 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :129 337767457262296:337767459631826 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :130 -337767459635052:337767459635053 158131:158131 MARK(name(before HIP LaunchKernel)) 337767459640913:337767459641674 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :132 337767459643007:337767459643618 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :133 337767459644880:337767459659969 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :134 -337767459663044:337767459663045 158131:158131 MARK(name(after HIP LaunchKernel)) 337767459666571:337767461850200 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :136 337767470021230:337767472126100 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :137 -337767472127232:337767472127233 158131:158131 MARK(name(before HIP LaunchKernel)) 337767472131229:337767472131680 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :139 337767472133854:337767472134395 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :140 337767472135177:337767472145406 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :141 -337767472147189:337767472147190 158131:158131 MARK(name(after HIP LaunchKernel)) 337767472149313:337767474294991 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :143 337767482547276:337767484700437 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :144 -337767484701639:337767484701640 158131:158131 MARK(name(before HIP LaunchKernel)) 337767484705637:337767484706107 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :146 337767484707009:337767484707460 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :147 337767484708231:337767484717819 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :148 -337767484721026:337767484721027 158131:158131 MARK(name(after HIP LaunchKernel)) 337767484723540:337767486915875 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :150 337767498181053:337767500271376 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :151 -337767500272478:337767500272479 158131:158131 MARK(name(before HIP LaunchKernel)) 337767500276305:337767500276836 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :153 337767500279020:337767500279471 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :154 337767500280313:337767500290712 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :155 -337767500292085:337767500292086 158131:158131 MARK(name(after HIP LaunchKernel)) 337767500294219:337767502424908 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :157 337767514185079:337767516608650 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :158 -337767516609902:337767516609903 158131:158131 MARK(name(before HIP LaunchKernel)) 337767516613960:337767516614401 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :160 337767516615273:337767516615693 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :161 337767516616465:337767516625923 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :162 -337767516628097:337767516628098 158131:158131 MARK(name(after HIP LaunchKernel)) 337767516630201:337767518783622 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :164 337767528416742:337767530629065 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :165 -337767530630918:337767530630919 158131:158131 MARK(name(before HIP LaunchKernel)) 337767530636539:337767530637591 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :167 337767530641548:337767530642310 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :168 337767530643622:337767530657498 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :169 -337767530659362:337767530659363 158131:158131 MARK(name(after HIP LaunchKernel)) 337767530662688:337767532867857 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :171 337767545437393:337767547614971 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :172 -337767547616493:337767547616494 158131:158131 MARK(name(before HIP LaunchKernel)) 337767547621162:337767547621713 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :174 337767547622695:337767547623116 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :175 337767547623907:337767547635189 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :176 -337767547638194:337767547638195 158131:158131 MARK(name(after HIP LaunchKernel)) 337767547640258:337767549833144 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :178 337767561223869:337767563606182 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :179 -337767563607365:337767563607366 158131:158131 MARK(name(before HIP LaunchKernel)) 337767563613396:337767563613977 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :181 337767563614849:337767563615299 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :182 337767563616141:337767563627482 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :183 -337767563628835:337767563628836 158131:158131 MARK(name(after HIP LaunchKernel)) 337767563631961:337767565791204 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :185 337767574231283:337767576611813 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :186 -337767576613155:337767576613156 158131:158131 MARK(name(before HIP LaunchKernel)) 337767576617123:337767576617614 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :188 337767576618505:337767576618946 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :189 337767576619868:337767576630779 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :190 -337767576634506:337767576634507 158131:158131 MARK(name(after HIP LaunchKernel)) 337767576636640:337767578794640 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :192 337767590051562:337767592160019 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :193 -337767592161472:337767592161473 158131:158131 MARK(name(before HIP LaunchKernel)) 337767592166561:337767592166952 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :195 337767592167914:337767592168345 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :196 337767592169216:337767592179626 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :197 -337767592180968:337767592180969 158131:158131 MARK(name(after HIP LaunchKernel)) 337767592183203:337767594314973 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :199 337767605936183:337767608091408 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :200 -337767608092600:337767608092601 158131:158131 MARK(name(before HIP LaunchKernel)) 337767608096537:337767608096988 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :202 337767608097750:337767608098311 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :203 337767608101026:337767608112738 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :204 -337767608114020:337767608114021 158131:158131 MARK(name(after HIP LaunchKernel)) 337767608116084:337767610323438 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :206 337767618518844:337767620683096 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :207 -337767620684288:337767620684289 158131:158131 MARK(name(before HIP LaunchKernel)) 337767620689798:337767620690259 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :209 337767620691031:337767620691481 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :210 337767620692273:337767620702853 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :211 -337767620704055:337767620704056 158131:158131 MARK(name(after HIP LaunchKernel)) 337767620706219:337767622841567 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :213 337767634728658:337767636912607 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :214 -337767636913829:337767636913830 158131:158131 MARK(name(before HIP LaunchKernel)) 337767636917446:337767636917907 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :216 337767636918768:337767636919219 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :217 337767636922566:337767636933456 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :218 -337767636934718:337767636934719 158131:158131 MARK(name(after HIP LaunchKernel)) 337767636936953:337767639147723 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :220 337767648806150:337767651012391 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :221 -337767651014295:337767651014296 158131:158131 MARK(name(before HIP LaunchKernel)) 337767651022560:337767651023131 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :223 337767651024564:337767651025175 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :224 337767651026508:337767651042107 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :225 -337767651044301:337767651044302 158131:158131 MARK(name(after HIP LaunchKernel)) 337767651047637:337767653313171 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :227 337767661488300:337767663643385 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :228 -337767663644467:337767663644468 158131:158131 MARK(name(before HIP LaunchKernel)) 337767663648374:337767663648785 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :230 337767663649857:337767663650298 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :231 337767663652402:337767663662471 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :232 -337767663663723:337767663663724 158131:158131 MARK(name(after HIP LaunchKernel)) 337767663665907:337767665806926 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :234 337767673986283:337767676162668 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :235 -337767676163920:337767676163921 158131:158131 MARK(name(before HIP LaunchKernel)) 337767676170162:337767676170573 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :237 337767676171475:337767676171915 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :238 337767676172757:337767676183457 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :239 -337767676184780:337767676184781 158131:158131 MARK(name(after HIP LaunchKernel)) 337767676188406:337767678326950 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :241 337767689596174:337767691883598 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :242 -337767691884750:337767691884751 158131:158131 MARK(name(before HIP LaunchKernel)) 337767691889128:337767691889539 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :244 337767691890451:337767691890882 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :245 337767691893787:337767691905870 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :246 -337767691906972:337767691906973 158131:158131 MARK(name(after HIP LaunchKernel)) 337767691909086:337767694152087 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :248 337767705566316:337767707738723 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :249 -337767707739965:337767707739966 158131:158131 MARK(name(before HIP LaunchKernel)) 337767707745015:337767707745466 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :251 337767707746347:337767707746788 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :252 337767707747540:337767707757609 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :253 -337767707758841:337767707758842 158131:158131 MARK(name(after HIP LaunchKernel)) 337767707762127:337767709917513 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :255 337767718100777:337767720221597 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :256 -337767720222760:337767720222761 158131:158131 MARK(name(before HIP LaunchKernel)) 337767720226607:337767720227148 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :258 337767720228020:337767720228460 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :259 337767720231025:337767720241485 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :260 -337767720242727:337767720242728 158131:158131 MARK(name(after HIP LaunchKernel)) 337767720244851:337767722379548 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :262 337767733662679:337767735850947 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :263 -337767735855846:337767735855847 158131:158131 MARK(name(before HIP LaunchKernel)) 337767735859793:337767735860264 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :265 337767735861136:337767735861567 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :266 337767735862328:337767735872968 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :267 -337767735874281:337767735874282 158131:158131 MARK(name(after HIP LaunchKernel)) 337767735877266:337767738154572 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :269 337767749496464:337767751689019 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :270 -337767751690242:337767751690243 158131:158131 MARK(name(before HIP LaunchKernel)) 337767751695231:337767751695752 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :272 337767751696614:337767751697055 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :273 337767751699119:337767751709298 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :274 -337767751710520:337767751710521 158131:158131 MARK(name(after HIP LaunchKernel)) 337767751712754:337767753849585 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :276 337767762008121:337767764124393 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :277 -337767764127208:337767764127209 158131:158131 MARK(name(before HIP LaunchKernel)) 337767764130875:337767764131336 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :279 337767764132227:337767764133149 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :280 337767764133941:337767764144380 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :281 -337767764145683:337767764145684 158131:158131 MARK(name(after HIP LaunchKernel)) 337767764148638:337767766289286 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :283 337767777579200:337767779697586 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :284 -337767779698878:337767779698879 158131:158131 MARK(name(before HIP LaunchKernel)) 337767779702736:337767779703196 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :286 337767779705741:337767779706352 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :287 337767779707164:337767779717423 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :288 -337767779718676:337767779718677 158131:158131 MARK(name(after HIP LaunchKernel)) 337767779720840:337767781914698 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :290 337767793066662:337767795230303 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :291 -337767795232837:337767795232838 158131:158131 MARK(name(before HIP LaunchKernel)) 337767795236725:337767795237186 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :293 337767795238047:337767795238799 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :294 337767795239580:337767795250210 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :295 -337767795251523:337767795251524 158131:158131 MARK(name(after HIP LaunchKernel)) 337767795254298:337767797393343 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :297 337767805564384:337767807730991 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :298 -337767807732183:337767807732184 158131:158131 MARK(name(before HIP LaunchKernel)) 337767807736431:337767807736832 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :300 337767807738886:337767807739326 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :301 337767807740128:337767807750718 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :302 -337767807752381:337767807752382 158131:158131 MARK(name(after HIP LaunchKernel)) 337767807754445:337767809910952 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :304 337767821070741:337767823217330 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :305 -337767823220606:337767823220607 158131:158131 MARK(name(before HIP LaunchKernel)) 337767823224113:337767823224584 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :307 337767823225435:337767823226117 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :308 337767823226888:337767823237809 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :309 -337767823239061:337767823239062 158131:158131 MARK(name(after HIP LaunchKernel)) 337767823242508:337767825378306 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :311 337767836186891:337767838611975 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :312 -337767838613157:337767838613158 158131:158131 MARK(name(before HIP LaunchKernel)) 337767838616974:337767838617435 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :314 337767838619529:337767838619980 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :315 337767838620751:337767838631151 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :316 -337767838632373:337767838632374 158131:158131 MARK(name(after HIP LaunchKernel)) 337767838634497:337767841389975 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :318 337767849602334:337767851741900 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :319 -337767851744665:337767851744666 158131:158131 MARK(name(before HIP LaunchKernel)) 337767851748422:337767851748953 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :321 337767851749865:337767851750326 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :322 337767851751257:337767851762939 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :323 -337767851765164:337767851765165 158131:158131 MARK(name(after HIP LaunchKernel)) 337767851767288:337767853916672 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :325 337767865022429:337767867180790 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :326 -337767867182052:337767867182053 158131:158131 MARK(name(before HIP LaunchKernel)) 337767867186040:337767867186581 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :328 337767867189446:337767867189897 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :329 337767867190779:337767867201489 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :330 -337767867202901:337767867202902 158131:158131 MARK(name(after HIP LaunchKernel)) 337767867204965:337767869336385 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :332 337767877529990:337767879695264 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :333 -337767879697488:337767879697489 158131:158131 MARK(name(before HIP LaunchKernel)) 337767879701245:337767879701716 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :335 337767879702618:337767879703058 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :336 337767879703930:337767879713799 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :337 -337767879715792:337767879715793 158131:158131 MARK(name(after HIP LaunchKernel)) 337767879717967:337767881913167 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :339 337767892995540:337767895138812 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :340 -337767895140095:337767895140096 158131:158131 MARK(name(before HIP LaunchKernel)) 337767895143782:337767895144343 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :342 337767895147399:337767895147850 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :343 337767895148741:337767895159992 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :344 -337767895161385:337767895161386 158131:158131 MARK(name(after HIP LaunchKernel)) 337767895163479:337767897306631 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :346 337767905491088:337767907644809 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :347 -337767907645981:337767907645982 158131:158131 MARK(name(before HIP LaunchKernel)) 337767907649959:337767907650369 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :349 337767907651271:337767907651702 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :350 337767907652503:337767907662182 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :351 -337767907665338:337767907665339 158131:158131 MARK(name(after HIP LaunchKernel)) 337767907667542:337767909844217 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :353 337767920834587:337767923015841 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :354 -337767923016993:337767923016994 158131:158131 MARK(name(before HIP LaunchKernel)) 337767923020860:337767923021301 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :356 337767923023625:337767923024216 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :357 337767923025018:337767923034997 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :358 -337767923036169:337767923036170 158131:158131 MARK(name(after HIP LaunchKernel)) 337767923038564:337767925257779 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :360 337767933415867:337767935607120 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :361 -337767935608392:337767935608393 158131:158131 MARK(name(before HIP LaunchKernel)) 337767935614504:337767935614894 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :363 337767935615796:337767935616227 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :364 337767935617028:337767935628791 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :365 -337767935630814:337767935630815 158131:158131 MARK(name(after HIP LaunchKernel)) 337767935633069:337767937795447 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :367 337767949313502:337767951612979 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :368 -337767951614161:337767951614162 158131:158131 MARK(name(before HIP LaunchKernel)) 337767951619331:337767951619782 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :370 337767951620653:337767951621084 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :371 337767951621866:337767951631975 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :372 -337767951633117:337767951633118 158131:158131 MARK(name(after HIP LaunchKernel)) 337767951635461:337767953790546 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :374 337767961974873:337767964090794 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :375 -337767964091946:337767964091947 158131:158131 MARK(name(before HIP LaunchKernel)) 337767964095883:337767964096334 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :377 337767964097106:337767964097537 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :378 337767964098328:337767964109599 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :379 -337767964112976:337767964112977 158131:158131 MARK(name(after HIP LaunchKernel)) 337767964115200:337767966322082 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :381 337767978141735:337767980312048 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :382 -337767980313270:337767980313271 158131:158131 MARK(name(before HIP LaunchKernel)) 337767980318530:337767980318991 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :384 337767980319862:337767980320283 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :385 337767980321075:337767980333218 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :386 -337767980334370:337767980334371 158131:158131 MARK(name(after HIP LaunchKernel)) 337767980336434:337767982463225 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :388 337767990643965:337767992831180 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :389 -337767992832242:337767992832243 158131:158131 MARK(name(before HIP LaunchKernel)) 337767992835949:337767992836400 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :391 337767992837272:337767992838023 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :392 337767992838895:337767992849154 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :393 -337767992852671:337767992852672 158131:158131 MARK(name(after HIP LaunchKernel)) 337767992854985:337767995170302 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :395 337768006421925:337768008620131 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :396 -337768008621293:337768008621294 158131:158131 MARK(name(before HIP LaunchKernel)) 337768008627004:337768008627585 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :398 337768008628486:337768008628917 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :399 337768008629709:337768008640940 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :400 -337768008642232:337768008642233 158131:158131 MARK(name(after HIP LaunchKernel)) 337768008644336:337768010807607 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :402 337768022826035:337768025034360 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :403 -337768025035673:337768025035674 158131:158131 MARK(name(before HIP LaunchKernel)) 337768025040201:337768025040742 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :405 337768025041624:337768025042085 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :406 337768025045702:337768025059588 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :407 -337768025061241:337768025061242 158131:158131 MARK(name(after HIP LaunchKernel)) 337768025063405:337768027279074 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :409 337768035511752:337768037677757 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :410 -337768037679060:337768037679061 158131:158131 MARK(name(before HIP LaunchKernel)) 337768037684300:337768037684831 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :412 337768037685733:337768037686173 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :413 337768037687045:337768037698837 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :414 -337768037700029:337768037700030 158131:158131 MARK(name(after HIP LaunchKernel)) 337768037702123:337768039835918 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :416 337768052464758:337768054677029 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :417 -337768054678492:337768054678493 158131:158131 MARK(name(before HIP LaunchKernel)) 337768054682209:337768054682760 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :419 337768054683682:337768054684123 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :420 337768054687028:337768054699391 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :421 -337768054700824:337768054700825 158131:158131 MARK(name(after HIP LaunchKernel)) 337768054702888:337768056852582 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :423 337768067696706:337768069885404 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :424 -337768069886696:337768069886697 158131:158131 MARK(name(before HIP LaunchKernel)) 337768069892627:337768069893168 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :426 337768069894090:337768069894531 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :427 337768069895333:337768069906854 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :428 -337768069908016:337768069908017 158131:158131 MARK(name(after HIP LaunchKernel)) 337768069910862:337768072170173 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :430 337768080351174:337768082619121 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :431 -337768082620604:337768082620605 158131:158131 MARK(name(before HIP LaunchKernel)) 337768082624071:337768082624542 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :433 337768082625433:337768082625864 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :434 337768082627908:337768082637987 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :435 -337768082639350:337768082639351 158131:158131 MARK(name(after HIP LaunchKernel)) 337768082641434:337768084796047 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :437 337768095528300:337768097722809 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :438 -337768097724172:337768097724173 158131:158131 MARK(name(before HIP LaunchKernel)) 337768097729221:337768097729712 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :440 337768097730584:337768097731155 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :441 337768097732016:337768097741915 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :442 -337768097743117:337768097743118 158131:158131 MARK(name(after HIP LaunchKernel)) 337768097746354:337768099921176 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :444 337768108134717:337768110237323 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :445 -337768110238696:337768110238697 158131:158131 MARK(name(before HIP LaunchKernel)) 337768110242483:337768110242954 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :447 337768110243806:337768110244246 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :448 337768110246992:337768110258072 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :449 -337768110259235:337768110259236 158131:158131 MARK(name(after HIP LaunchKernel)) 337768110261339:337768112386066 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :451 337768122890659:337768125074838 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :452 -337768125076772:337768125076773 158131:158131 MARK(name(before HIP LaunchKernel)) 337768125081792:337768125082333 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :454 337768125083224:337768125083976 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :455 337768125084777:337768125095507 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :456 -337768125096680:337768125096681 158131:158131 MARK(name(after HIP LaunchKernel)) 337768125100236:337768127306697 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :458 337768135501804:337768137646259 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :459 -337768137647451:337768137647452 158131:158131 MARK(name(before HIP LaunchKernel)) 337768137651519:337768137651969 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :461 337768137652901:337768137653332 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :462 337768137655256:337768137665595 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :463 -337768137667489:337768137667490 158131:158131 MARK(name(after HIP LaunchKernel)) 337768137669593:337768139840788 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :465 337768150007965:337768152183808 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :466 -337768152188658:337768152188659 158131:158131 MARK(name(before HIP LaunchKernel)) 337768152194328:337768152195040 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :468 337768152196402:337768152197013 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :469 337768152198296:337768152212402 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :470 -337768152214216:337768152214217 158131:158131 MARK(name(after HIP LaunchKernel)) 337768152219596:337768154397694 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :472 337768162580378:337768164727518 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :473 -337768164728680:337768164728681 158131:158131 MARK(name(before HIP LaunchKernel)) 337768164733259:337768164733719 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :475 337768164734801:337768164735282 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :476 337768164737577:337768164748748 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :477 -337768164750000:337768164750001 158131:158131 MARK(name(after HIP LaunchKernel)) 337768164752154:337768166918771 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :479 337768176494672:337768178718727 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :480 -337768178721673:337768178721674 158131:158131 MARK(name(before HIP LaunchKernel)) 337768178727373:337768178727954 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :482 337768178729638:337768178730259 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :483 337768178731531:337768178746109 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :484 -337768178747892:337768178747893 158131:158131 MARK(name(after HIP LaunchKernel)) 337768178752310:337768180959564 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :486 337768193581480:337768195710897 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :487 -337768195712069:337768195712070 158131:158131 MARK(name(before HIP LaunchKernel)) 337768195716056:337768195716457 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :489 337768195719553:337768195720294 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :490 337768195721106:337768195731295 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :491 -337768195732517:337768195732518 158131:158131 MARK(name(after HIP LaunchKernel)) 337768195735303:337768197924692 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :493 337768209190018:337768211608961 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :494 -337768211611596:337768211611597 158131:158131 MARK(name(before HIP LaunchKernel)) 337768211615473:337768211615864 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :496 337768211617006:337768211617567 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :497 337768211618379:337768211629159 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :498 -337768211630471:337768211630472 158131:158131 MARK(name(after HIP LaunchKernel)) 337768211633337:337768213792179 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :500 337768221985442:337768224096274 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :501 -337768224097586:337768224097587 158131:158131 MARK(name(before HIP LaunchKernel)) 337768224101524:337768224101924 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :503 337768224104630:337768224105050 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :504 337768224105842:337768224116632 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :505 -337768224117704:337768224117705 158131:158131 MARK(name(after HIP LaunchKernel)) 337768224119818:337768226336920 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :507 337768237853602:337768240033864 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :508 -337768240036840:337768240036841 158131:158131 MARK(name(before HIP LaunchKernel)) 337768240040687:337768240041078 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :510 337768240042400:337768240042821 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :511 337768240043613:337768240053391 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :512 -337768240055445:337768240055446 158131:158131 MARK(name(after HIP LaunchKernel)) 337768240057689:337768242274030 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :514 337768250469578:337768252848905 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :515 -337768252855277:337768252855278 158131:158131 MARK(name(before HIP LaunchKernel)) 337768252869364:337768252870586 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :517 337768252876868:337768252877830 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :518 337768252880114:337768252911774 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :519 -337768252915411:337768252915412 158131:158131 MARK(name(after HIP LaunchKernel)) 337768252920370:337768255347979 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :521 337768268551523:337768270751402 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :522 -337768270755650:337768270755651 158131:158131 MARK(name(before HIP LaunchKernel)) 337768270761180:337768270761641 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :524 337768270762723:337768270763194 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :525 337768270765088:337768270783793 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :526 -337768270786478:337768270786479 158131:158131 MARK(name(after HIP LaunchKernel)) 337768270788863:337768272953826 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :528 337768285726044:337768287887231 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :529 -337768287888854:337768287888855 158131:158131 MARK(name(before HIP LaunchKernel)) 337768287892821:337768287893372 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :531 337768287896709:337768287897280 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :532 337768287898051:337768287909623 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :533 -337768287911166:337768287911167 158131:158131 MARK(name(after HIP LaunchKernel)) 337768287913500:337768290155559 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :535 337768301488935:337768303702591 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :536 -337768303705937:337768303705938 158131:158131 MARK(name(before HIP LaunchKernel)) 337768303710095:337768303710626 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :538 337768303711508:337768303711928 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :539 337768303712700:337768303724151 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :540 -337768303726566:337768303726567 158131:158131 MARK(name(after HIP LaunchKernel)) 337768303728660:337768305927337 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :542 337768314071007:337768316174444 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :543 -337768316175637:337768316175638 158131:158131 MARK(name(before HIP LaunchKernel)) 337768316179454:337768316180315 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :545 337768316183652:337768316184063 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :546 337768316184874:337768316197488 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :547 -337768316198820:337768316198821 158131:158131 MARK(name(after HIP LaunchKernel)) 337768316200924:337768318880829 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :549 337768330621273:337768332854295 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :550 -337768332855597:337768332855598 158131:158131 MARK(name(before HIP LaunchKernel)) 337768332859845:337768332860316 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :552 337768332861198:337768332861759 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :553 337768332862540:337768332874884 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :554 -337768332878350:337768332878351 158131:158131 MARK(name(after HIP LaunchKernel)) 337768332880615:337768335154463 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :556 337768344608986:337768346866314 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :557 -337768346868297:337768346868298 158131:158131 MARK(name(before HIP LaunchKernel)) 337768346873848:337768346874479 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :559 337768346878667:337768346879689 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :560 337768346880981:337768346896671 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :561 -337768346898554:337768346898555 158131:158131 MARK(name(after HIP LaunchKernel)) 337768346901931:337768349187070 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :563 337768357366927:337768359620077 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :564 -337768359621420:337768359621421 158131:158131 MARK(name(before HIP LaunchKernel)) 337768359626189:337768359626810 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :566 337768359627762:337768359628192 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :567 337768359629154:337768359643301 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :568 -337768359645665:337768359645666 158131:158131 MARK(name(after HIP LaunchKernel)) 337768359648020:337768361807924 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :570 337768370013571:337768372141474 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :571 -337768372142707:337768372142708 158131:158131 MARK(name(before HIP LaunchKernel)) 337768372147686:337768372148157 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :573 337768372149049:337768372149469 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :574 337768372150241:337768372160180 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :575 -337768372161652:337768372161653 158131:158131 MARK(name(after HIP LaunchKernel)) 337768372163756:337768374308411 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :577 337768385673678:337768387892924 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :578 -337768387894387:337768387894388 158131:158131 MARK(name(before HIP LaunchKernel)) 337768387898584:337768387899166 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :580 337768387900057:337768387900478 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :581 337768387901350:337768387912661 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :582 -337768387916108:337768387916109 158131:158131 MARK(name(after HIP LaunchKernel)) 337768387918372:337768390163166 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :584 337768398340079:337768400614609 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :585 -337768400615961:337768400615962 158131:158131 MARK(name(before HIP LaunchKernel)) 337768400622193:337768400622644 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :587 337768400623596:337768400624016 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :588 337768400624818:337768400637362 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :589 -337768400638854:337768400638855 158131:158131 MARK(name(after HIP LaunchKernel)) 337768400641169:337768402797706 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :591 337768414385352:337768416618845 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :592 -337768416620398:337768416620399 158131:158131 MARK(name(before HIP LaunchKernel)) 337768416624315:337768416625017 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :594 337768416626008:337768416626429 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :595 337768416627221:337768416637450 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :596 -337768416640917:337768416640918 158131:158131 MARK(name(after HIP LaunchKernel)) 337768416643371:337768418792214 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :598 337768427961818:337768430177186 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :599 -337768430179080:337768430179081 158131:158131 MARK(name(before HIP LaunchKernel)) 337768430186484:337768430187155 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :601 337768430188517:337768430189089 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :602 337768430190351:337768430204648 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :603 -337768430206511:337768430206512 158131:158131 MARK(name(after HIP LaunchKernel)) 337768430209727:337768432405409 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :605 337768445362658:337768447619615 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :606 -337768447620907:337768447620908 158131:158131 MARK(name(before HIP LaunchKernel)) 337768447624705:337768447625246 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :608 337768447626007:337768447626418 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :609 337768447629554:337768447639172 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :610 -337768447640605:337768447640606 158131:158131 MARK(name(after HIP LaunchKernel)) 337768447642769:337768449799557 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :612 337768460754209:337768463014171 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :613 -337768463015454:337768463015455 158131:158131 MARK(name(before HIP LaunchKernel)) 337768463020914:337768463021425 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :615 337768463022307:337768463022697 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :616 337768463023549:337768463033768 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :617 -337768463035271:337768463035272 158131:158131 MARK(name(after HIP LaunchKernel)) 337768463037485:337768465249006 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :619 337768473400381:337768475617864 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :620 -337768475619156:337768475619157 158131:158131 MARK(name(before HIP LaunchKernel)) 337768475623053:337768475623524 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :622 337768475624506:337768475624927 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :623 337768475627251:337768475637441 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :624 -337768475638953:337768475638954 158131:158131 MARK(name(after HIP LaunchKernel)) 337768475641158:337768477801122 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :626 337768489348752:337768491615487 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :627 -337768491616780:337768491616781 158131:158131 MARK(name(before HIP LaunchKernel)) 337768491622821:337768491623262 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :629 337768491624254:337768491624685 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :630 337768491625486:337768491635575 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :631 -337768491637098:337768491637099 158131:158131 MARK(name(after HIP LaunchKernel)) 337768491641817:337768493801620 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :633 337768501990595:337768504118268 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :634 -337768504120121:337768504120122 158131:158131 MARK(name(before HIP LaunchKernel)) 337768504124329:337768504124770 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :636 337768504125662:337768504126072 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :637 337768504128397:337768504138977 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :638 -337768504140389:337768504140390 158131:158131 MARK(name(after HIP LaunchKernel)) 337768504142463:337768506366899 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :640 337768518232669:337768520625573 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :641 -337768520626815:337768520626816 158131:158131 MARK(name(before HIP LaunchKernel)) 337768520631905:337768520632456 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :643 337768520633878:337768520634299 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :644 337768520635061:337768520645651 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :645 -337768520647073:337768520647074 158131:158131 MARK(name(after HIP LaunchKernel)) 337768520650029:337768522810183 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :647 337768532969966:337768535149747 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :648 -337768535151751:337768535151752 158131:158131 MARK(name(before HIP LaunchKernel)) 337768535157873:337768535158514 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :650 337768535159816:337768535160448 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :651 337768535165006:337768535180515 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :652 -337768535182409:337768535182410 158131:158131 MARK(name(after HIP LaunchKernel)) 337768535185725:337768537380745 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :654 337768545542419:337768547693376 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :655 -337768547695821:337768547695822 158131:158131 MARK(name(before HIP LaunchKernel)) 337768547699348:337768547699789 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :657 337768547700690:337768547701111 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :658 337768547701913:337768547711901 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :659 -337768547713164:337768547713165 158131:158131 MARK(name(after HIP LaunchKernel)) 337768547716490:337768549856496 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :661 337768558079085:337768560202931 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :662 -337768560204103:337768560204104 158131:158131 MARK(name(before HIP LaunchKernel)) 337768560208211:337768560208672 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :664 337768560209604:337768560210025 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :665 337768560213241:337768560225203 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :666 -337768560227177:337768560227178 158131:158131 MARK(name(after HIP LaunchKernel)) 337768560229411:337768562358307 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :668 337768574142772:337768576292777 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :669 -337768576296725:337768576296726 158131:158131 MARK(name(before HIP LaunchKernel)) 337768576300492:337768576301013 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :671 337768576301914:337768576302335 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :672 337768576303127:337768576313827 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :673 -337768576315029:337768576315030 158131:158131 MARK(name(after HIP LaunchKernel)) 337768576318716:337768578450637 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :675 337768586668517:337768588863888 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :676 -337768588865100:337768588865101 158131:158131 MARK(name(before HIP LaunchKernel)) 337768588869188:337768588869729 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :678 337768588870801:337768588871352 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :679 337768588873446:337768588884256 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :680 -337768588885429:337768588885430 158131:158131 MARK(name(after HIP LaunchKernel)) 337768588887593:337768591162173 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :682 337768603357906:337768605622036 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :683 -337768605625142:337768605625143 158131:158131 MARK(name(before HIP LaunchKernel)) 337768605629520:337768605630041 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :685 337768605631043:337768605631464 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :686 337768605632225:337768605644258 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :687 -337768605645821:337768605645822 158131:158131 MARK(name(after HIP LaunchKernel)) 337768605648927:337768607800946 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :689 337768617929891:337768620088853 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :690 -337768620090907:337768620090908 158131:158131 MARK(name(before HIP LaunchKernel)) 337768620097259:337768620097810 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :692 337768620101827:337768620102438 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :693 337768620103691:337768620119190 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :694 -337768620121354:337768620121355 158131:158131 MARK(name(after HIP LaunchKernel)) 337768620124650:337768622380325 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :696 337768630606661:337768632738702 158131:158131 hipMemcpy(dst=0x7f3e43000000, src=0x7f3e7c0ff010, sizeBytes=4194304, kind=1) :697 -337768632742249:337768632742250 158131:158131 MARK(name(before HIP LaunchKernel)) 337768632747128:337768632747529 158131:158131 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :699 337768632748420:337768632748871 158131:158131 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :700 337768632749663:337768632761475 158131:158131 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7fff99cd0d68, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :701 -337768632763158:337768632763159 158131:158131 MARK(name(after HIP LaunchKernel)) 337768632766214:337768634923603 158131:158131 hipMemcpy(dst=0x7f3e43bf9010, src=0x7f3e42800000, sizeBytes=4194304, kind=2) :703 337768644579574:337768644620882 158131:158131 hipFree(ptr=0x7f3e43000000) :704 337768644622795:337768644639537 158131:158131 hipFree(ptr=0x7f3e42800000) :705 diff --git a/test/golden_traces/MatrixTranspose_sys_trace.txt b/test/golden_traces/MatrixTranspose_sys_trace.txt index bee7a24018..b9f5aa67f4 100644 --- a/test/golden_traces/MatrixTranspose_sys_trace.txt +++ b/test/golden_traces/MatrixTranspose_sys_trace.txt @@ -4041,704 +4041,504 @@ ROCTracer (pid=158125): 337764704442075:337764704580366 158125:158125 hipMalloc(ptr=0x7f95c0800000, size=4194304) :2 337764704581889:337764704737823 158125:158125 hipMalloc(ptr=0x7f9484c00000, size=4194304) :3 337764704752891:337764922533350 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :4 -337764922538480:337764922538481 158125:158125 MARK(name(before HIP LaunchKernel)) 337764922562495:337764922564128 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :6 337764922566293:337764922566894 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :7 337764922569459:337764923031149 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :8 -337764923044474:337764923044475 158125:158125 MARK(name(after HIP LaunchKernel)) 337764923047921:337764925574527 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :10 337764938684604:337764941181393 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :11 -337764941182806:337764941182807 158125:158125 MARK(name(before HIP LaunchKernel)) 337764941188697:337764941189108 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :13 337764941190230:337764941190701 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :14 337764941194668:337764941210328 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :15 -337764941212081:337764941212082 158125:158125 MARK(name(after HIP LaunchKernel)) 337764941214015:337764942339087 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :17 337764950623693:337764953056311 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :18 -337764953057774:337764953057775 158125:158125 MARK(name(before HIP LaunchKernel)) 337764953063685:337764953064206 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :20 337764953065609:337764953066049 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :21 337764953067041:337764953079134 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :22 -337764953081038:337764953081039 158125:158125 MARK(name(after HIP LaunchKernel)) 337764953083192:337764954180501 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :24 337764962423108:337764964979740 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :25 -337764964980832:337764964980833 158125:158125 MARK(name(before HIP LaunchKernel)) 337764964984519:337764964985050 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :27 337764964986002:337764964986443 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :28 337764964988627:337764964999588 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :29 -337764965000860:337764965000861 158125:158125 MARK(name(after HIP LaunchKernel)) 337764965002904:337764966123257 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :31 337764974365011:337764977266363 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :32 -337764977267505:337764977267506 158125:158125 MARK(name(before HIP LaunchKernel)) 337764977273266:337764977273797 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :34 337764977274759:337764977275220 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :35 337764977276171:337764977287002 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :36 -337764977288485:337764977288486 158125:158125 MARK(name(after HIP LaunchKernel)) 337764977291550:337764978407134 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :38 337764986653789:337764989132825 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :39 -337764989134297:337764989134298 158125:158125 MARK(name(before HIP LaunchKernel)) 337764989138095:337764989138666 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :41 337764989139617:337764989140068 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :42 337764989143615:337764989154375 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :43 -337764989155898:337764989155899 158125:158125 MARK(name(after HIP LaunchKernel)) 337764989158022:337764990265090 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :45 337764998786773:337765001226896 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :46 -337765001227958:337765001227959 158125:158125 MARK(name(before HIP LaunchKernel)) 337765001234560:337765001235011 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :48 337765001235843:337765001236294 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :49 337765001237235:337765001247825 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :50 -337765001249288:337765001249289 158125:158125 MARK(name(after HIP LaunchKernel)) 337765001252113:337765002370653 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :52 337765010705494:337765013159863 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :53 -337765013160895:337765013160896 158125:158125 MARK(name(before HIP LaunchKernel)) 337765013164893:337765013165353 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :55 337765013166506:337765013166976 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :56 337765013170443:337765013182155 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :57 -337765013183498:337765013183499 158125:158125 MARK(name(after HIP LaunchKernel)) 337765013185662:337765014295144 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :59 337765022617712:337765025088462 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :60 -337765025090746:337765025090747 158125:158125 MARK(name(before HIP LaunchKernel)) 337765025095195:337765025095586 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :62 337765025096567:337765025097018 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :63 337765025097990:337765025108670 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :64 -337765025109913:337765025109914 158125:158125 MARK(name(after HIP LaunchKernel)) 337765025112798:337765026232400 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :66 337765034457684:337765036908086 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :67 -337765036909138:337765036909139 158125:158125 MARK(name(before HIP LaunchKernel)) 337765036913035:337765036913426 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :69 337765036914247:337765036914708 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :70 337765036918836:337765036929165 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :71 -337765036930508:337765036930509 158125:158125 MARK(name(after HIP LaunchKernel)) 337765036932752:337765038039760 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :73 337765046315278:337765048767192 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :74 -337765048770388:337765048770389 158125:158125 MARK(name(before HIP LaunchKernel)) 337765048774425:337765048774806 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :76 337765048775738:337765048776078 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :77 337765048777030:337765048788001 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :78 -337765048789774:337765048789775 158125:158125 MARK(name(after HIP LaunchKernel)) 337765048793040:337765049915989 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :80 337765058187129:337765060574001 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :81 -337765060575344:337765060575345 158125:158125 MARK(name(before HIP LaunchKernel)) 337765060578850:337765060579231 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :83 337765060580163:337765060580503 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :84 337765060584280:337765060595902 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :85 -337765060597225:337765060597226 158125:158125 MARK(name(after HIP LaunchKernel)) 337765060599449:337765061740842 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :87 337765069951218:337765072362576 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :88 -337765072364740:337765072364741 158125:158125 MARK(name(before HIP LaunchKernel)) 337765072369058:337765072369489 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :90 337765072370421:337765072370821 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :91 337765072371773:337765072381732 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :92 -337765072383095:337765072383096 158125:158125 MARK(name(after HIP LaunchKernel)) 337765072386431:337765073501153 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :94 337765081732048:337765084159937 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :95 -337765084160999:337765084161000 158125:158125 MARK(name(before HIP LaunchKernel)) 337765084165328:337765084165688 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :97 337765084170227:337765084170567 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :98 337765084171619:337765084182320 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :99 -337765084183682:337765084183683 158125:158125 MARK(name(after HIP LaunchKernel)) 337765084185656:337765085297784 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :101 337765093537775:337765096025317 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :102 -337765096029174:337765096029175 158125:158125 MARK(name(before HIP LaunchKernel)) 337765096032892:337765096033272 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :104 337765096034655:337765096034985 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :105 337765096035937:337765096046277 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :106 -337765096047579:337765096047580 158125:158125 MARK(name(after HIP LaunchKernel)) 337765096050314:337765097356057 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :108 337765105649560:337765108080996 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :109 -337765108082258:337765108082259 158125:158125 MARK(name(before HIP LaunchKernel)) 337765108086076:337765108086627 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :111 337765108091215:337765108091636 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :112 337765108092828:337765108106043 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :113 -337765108107466:337765108107467 158125:158125 MARK(name(after HIP LaunchKernel)) 337765108109790:337765109224292 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :115 337765117727170:337765120171099 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :116 -337765120173344:337765120173345 158125:158125 MARK(name(before HIP LaunchKernel)) 337765120177231:337765120177742 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :118 337765120178804:337765120179125 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :119 337765120180006:337765120191999 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :120 -337765120194123:337765120194124 158125:158125 MARK(name(after HIP LaunchKernel)) 337765120196457:337765121307212 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :122 337765129537163:337765131980392 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :123 -337765131981414:337765131981415 158125:158125 MARK(name(before HIP LaunchKernel)) 337765131984740:337765131985341 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :125 337765131987676:337765131988016 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :126 337765131989018:337765131999758 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :127 -337765132009206:337765132009207 158125:158125 MARK(name(after HIP LaunchKernel)) 337765132011340:337765133127245 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :129 337765141404317:337765143867803 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :130 -337765143871109:337765143871110 158125:158125 MARK(name(before HIP LaunchKernel)) 337765143875017:337765143875528 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :132 337765143876369:337765143876690 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :133 337765143877562:337765143889744 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :134 -337765143891989:337765143891990 158125:158125 MARK(name(after HIP LaunchKernel)) 337765143894754:337765145003225 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :136 337765153330852:337765155802584 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :137 -337765155803606:337765155803607 158125:158125 MARK(name(before HIP LaunchKernel)) 337765155807283:337765155807814 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :139 337765155811080:337765155811430 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :140 337765155812422:337765155823523 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :141 -337765155824956:337765155824957 158125:158125 MARK(name(after HIP LaunchKernel)) 337765155826960:337765156943876 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :143 337765165226198:337765167700264 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :144 -337765167702008:337765167702009 158125:158125 MARK(name(before HIP LaunchKernel)) 337765167705424:337765167705855 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :146 337765167706757:337765167707087 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :147 337765167708179:337765167720783 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :148 -337765167723098:337765167723099 158125:158125 MARK(name(after HIP LaunchKernel)) 337765167725672:337765168845485 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :150 337765177111916:337765179504549 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :151 -337765179505631:337765179505632 158125:158125 MARK(name(before HIP LaunchKernel)) 337765179509078:337765179509548 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :153 337765179512033:337765179512364 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :154 337765179513296:337765179523705 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :155 -337765179525068:337765179525069 158125:158125 MARK(name(after HIP LaunchKernel)) 337765179527733:337765180639169 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :157 337765188914788:337765191325545 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :158 -337765191326677:337765191326678 158125:158125 MARK(name(before HIP LaunchKernel)) 337765191330795:337765191331176 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :160 337765191332067:337765191332398 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :161 337765191333390:337765191344000 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :162 -337765191347256:337765191347257 158125:158125 MARK(name(after HIP LaunchKernel)) 337765191349470:337765192463481 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :164 337765200792860:337765203211492 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :165 -337765203212494:337765203212495 158125:158125 MARK(name(before HIP LaunchKernel)) 337765203215940:337765203216341 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :167 337765203219537:337765203219968 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :168 337765203220870:337765203231429 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :169 -337765203232592:337765203232593 158125:158125 MARK(name(after HIP LaunchKernel)) 337765203234595:337765204352734 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :171 337765212603176:337765215045302 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :172 -337765215046304:337765215046305 158125:158125 MARK(name(before HIP LaunchKernel)) 337765215049851:337765215050272 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :174 337765215051123:337765215051534 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :175 337765215052546:337765215064719 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :176 -337765215067103:337765215067104 158125:158125 MARK(name(after HIP LaunchKernel)) 337765215069267:337765216191183 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :178 337765224482622:337765226963902 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :179 -337765226964894:337765226964895 158125:158125 MARK(name(before HIP LaunchKernel)) 337765226970044:337765226970405 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :181 337765226971416:337765226971747 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :182 337765226972659:337765226982998 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :183 -337765226984441:337765226984442 158125:158125 MARK(name(after HIP LaunchKernel)) 337765226988078:337765228101498 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :185 337765236379211:337765238861964 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :186 -337765238862966:337765238862967 158125:158125 MARK(name(before HIP LaunchKernel)) 337765238866653:337765238867003 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :188 337765238867865:337765238868195 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :189 337765238869147:337765238880008 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :190 -337765238883504:337765238883505 158125:158125 MARK(name(after HIP LaunchKernel)) 337765238885749:337765239998748 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :192 337765248323740:337765250795292 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :193 -337765250796604:337765250796605 158125:158125 MARK(name(before HIP LaunchKernel)) 337765250802485:337765250802916 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :195 337765250804259:337765250804589 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :196 337765250805441:337765250816071 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :197 -337765250817353:337765250817354 158125:158125 MARK(name(after HIP LaunchKernel)) 337765250819517:337765251927607 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :199 337765260173130:337765262594897 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :200 -337765262595959:337765262595960 158125:158125 MARK(name(before HIP LaunchKernel)) 337765262600167:337765262600618 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :202 337765262601500:337765262601851 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :203 337765262604976:337765262616528 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :204 -337765262617680:337765262617681 158125:158125 MARK(name(after HIP LaunchKernel)) 337765262619774:337765263725670 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :206 337765272031895:337765274457500 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :207 -337765274458662:337765274458663 158125:158125 MARK(name(before HIP LaunchKernel)) 337765274464183:337765274464634 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :209 337765274465525:337765274465986 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :210 337765274466978:337765274477879 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :211 -337765274479241:337765274479242 158125:158125 MARK(name(after HIP LaunchKernel)) 337765274481415:337765275593242 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :213 337765283871867:337765286274118 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :214 -337765286275260:337765286275261 158125:158125 MARK(name(before HIP LaunchKernel)) 337765286279107:337765286279578 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :216 337765286280470:337765286280811 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :217 337765286283075:337765286294416 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :218 -337765286295799:337765286295800 158125:158125 MARK(name(after HIP LaunchKernel)) 337765286297883:337765287415781 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :220 337765295729662:337765298174083 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :221 -337765298175245:337765298175246 158125:158125 MARK(name(before HIP LaunchKernel)) 337765298180806:337765298181657 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :223 337765298182549:337765298182890 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :224 337765298183851:337765298195233 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :225 -337765298196646:337765298196647 158125:158125 MARK(name(after HIP LaunchKernel)) 337765298198950:337765299310807 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :227 337765307576858:337765310015998 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :228 -337765310017191:337765310017192 158125:158125 MARK(name(before HIP LaunchKernel)) 337765310020557:337765310021088 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :230 337765310022240:337765310022601 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :231 337765310025797:337765310037178 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :232 -337765310038511:337765310038512 158125:158125 MARK(name(after HIP LaunchKernel)) 337765310041296:337765311153774 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :234 337765319462296:337765321917687 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :235 -337765321918829:337765321918830 158125:158125 MARK(name(before HIP LaunchKernel)) 337765321924690:337765321925111 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :237 337765321926043:337765321926383 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :238 337765321927325:337765321939187 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :239 -337765321940840:337765321940841 158125:158125 MARK(name(after HIP LaunchKernel)) 337765321943836:337765323047217 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :241 337765331334799:337765333800680 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :242 -337765333801632:337765333801633 158125:158125 MARK(name(before HIP LaunchKernel)) 337765333805689:337765333806020 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :244 337765333806881:337765333807292 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :245 337765333809647:337765333820417 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :246 -337765333821790:337765333821791 158125:158125 MARK(name(after HIP LaunchKernel)) 337765333823934:337765334937344 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :248 337765343248378:337765345732022 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :249 -337765345733114:337765345733115 158125:158125 MARK(name(before HIP LaunchKernel)) 337765345739366:337765345739777 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :251 337765345740558:337765345740879 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :252 337765345741750:337765345752751 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :253 -337765345754084:337765345754085 158125:158125 MARK(name(after HIP LaunchKernel)) 337765345758552:337765346872854 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :255 337765355158251:337765357542558 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :256 -337765357543580:337765357543581 158125:158125 MARK(name(before HIP LaunchKernel)) 337765357547237:337765357548089 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :258 337765357548880:337765357549201 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :259 337765357552347:337765357562656 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :260 -337765357564540:337765357564541 158125:158125 MARK(name(after HIP LaunchKernel)) 337765357566714:337765358703679 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :262 337765366968407:337765369387249 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :263 -337765369390796:337765369390797 158125:158125 MARK(name(before HIP LaunchKernel)) 337765369394683:337765369395074 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :265 337765369395886:337765369396226 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :266 337765369397238:337765369409070 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :267 -337765369410593:337765369410594 158125:158125 MARK(name(after HIP LaunchKernel)) 337765369413920:337765370514896 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :269 337765378813919:337765381249433 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :270 -337765381250495:337765381250496 158125:158125 MARK(name(before HIP LaunchKernel)) 337765381255795:337765381256146 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :272 337765381257067:337765381257398 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :273 337765381259262:337765381270573 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :274 -337765381271925:337765381271926 158125:158125 MARK(name(after HIP LaunchKernel)) 337765381273999:337765382389143 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :276 337765390675582:337765393103622 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :277 -337765393106477:337765393106478 158125:158125 MARK(name(before HIP LaunchKernel)) 337765393110024:337765393110414 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :279 337765393111286:337765393111627 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :280 337765393112599:337765393123419 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :281 -337765393124852:337765393124853 158125:158125 MARK(name(after HIP LaunchKernel)) 337765393127787:337765394243081 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :283 337765402542775:337765405018485 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :284 -337765405019727:337765405019728 158125:158125 MARK(name(before HIP LaunchKernel)) 337765405023564:337765405024035 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :286 337765405027412:337765405027862 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :287 337765405028914:337765405040186 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :288 -337765405041428:337765405041429 158125:158125 MARK(name(after HIP LaunchKernel)) 337765405043412:337765406153906 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :290 337765414439543:337765416968903 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :291 -337765416971859:337765416971860 158125:158125 MARK(name(before HIP LaunchKernel)) 337765416975906:337765416976508 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :293 337765416977560:337765416977880 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :294 337765416978852:337765416990364 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :295 -337765416991516:337765416991517 158125:158125 MARK(name(after HIP LaunchKernel)) 337765416994742:337765418107140 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :297 337765426444636:337765428930194 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :298 -337765428931216:337765428931217 158125:158125 MARK(name(before HIP LaunchKernel)) 337765428935253:337765428935804 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :300 337765428937708:337765428938029 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :301 337765428938940:337765428949350 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :302 -337765428951043:337765428951044 158125:158125 MARK(name(after HIP LaunchKernel)) 337765428953277:337765430060145 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :304 337765438339150:337765441268235 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :305 -337765441270489:337765441270490 158125:158125 MARK(name(before HIP LaunchKernel)) 337765441274216:337765441274747 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :307 337765441275729:337765441276060 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :308 337765441276962:337765441287842 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :309 -337765441289235:337765441289236 158125:158125 MARK(name(after HIP LaunchKernel)) 337765441292160:337765442412533 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :311 337765450709312:337765453167268 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :312 -337765453168290:337765453168291 158125:158125 MARK(name(before HIP LaunchKernel)) 337765453171837:337765453172288 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :314 337765453175113:337765453175684 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :315 337765453176656:337765453187697 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :316 -337765453189130:337765453189131 158125:158125 MARK(name(after HIP LaunchKernel)) 337765453191354:337765454301107 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :318 337765462848969:337765465268904 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :319 -337765465272340:337765465272341 158125:158125 MARK(name(before HIP LaunchKernel)) 337765465276338:337765465276859 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :321 337765465277761:337765465278171 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :322 337765465279123:337765465290104 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :323 -337765465292639:337765465292640 158125:158125 MARK(name(after HIP LaunchKernel)) 337765465294733:337765466406910 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :325 337765474686697:337765477122020 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :326 -337765477122992:337765477122993 158125:158125 MARK(name(before HIP LaunchKernel)) 337765477126609:337765477126970 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :328 337765477130416:337765477130767 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :329 337765477131749:337765477144473 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :330 -337765477145815:337765477145816 158125:158125 MARK(name(after HIP LaunchKernel)) 337765477147809:337765478265337 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :332 337765486542638:337765489033045 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :333 -337765489035209:337765489035210 158125:158125 MARK(name(before HIP LaunchKernel)) 337765489038946:337765489039336 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :335 337765489040108:337765489040549 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :336 337765489041490:337765489052010 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :337 -337765489054255:337765489054256 158125:158125 MARK(name(after HIP LaunchKernel)) 337765489056579:337765490169488 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :339 337765498462309:337765500912371 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :340 -337765500913433:337765500913434 158125:158125 MARK(name(before HIP LaunchKernel)) 337765500917410:337765500917801 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :342 337765500920967:337765500921307 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :343 337765500922309:337765500934001 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :344 -337765500935354:337765500935355 158125:158125 MARK(name(after HIP LaunchKernel)) 337765500937468:337765502051439 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :346 337765510338339:337765512803419 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :347 -337765512804631:337765512804632 158125:158125 MARK(name(before HIP LaunchKernel)) 337765512808448:337765512808879 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :349 337765512809771:337765512810091 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :350 337765512811123:337765512821753 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :351 -337765512826432:337765512826433 158125:158125 MARK(name(after HIP LaunchKernel)) 337765512828546:337765513936426 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :353 337765522202487:337765524571746 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :354 -337765524573359:337765524573360 158125:158125 MARK(name(before HIP LaunchKernel)) 337765524577146:337765524577546 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :356 337765524581193:337765524581524 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :357 337765524582496:337765524594358 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :358 -337765524595821:337765524595822 158125:158125 MARK(name(after HIP LaunchKernel)) 337765524598015:337765525748215 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :360 337765534071724:337765536497660 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :361 -337765536499463:337765536499464 158125:158125 MARK(name(before HIP LaunchKernel)) 337765536504743:337765536505134 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :363 337765536505985:337765536506326 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :364 337765536507728:337765536518278 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :365 -337765536521014:337765536521015 158125:158125 MARK(name(after HIP LaunchKernel)) 337765536523027:337765537637159 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :367 337765545903460:337765548307234 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :368 -337765548308867:337765548308868 158125:158125 MARK(name(before HIP LaunchKernel)) 337765548314498:337765548314909 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :370 337765548315930:337765548316411 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :371 337765548317443:337765548328604 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :372 -337765548329837:337765548329838 158125:158125 MARK(name(after HIP LaunchKernel)) 337765548332271:337765549443808 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :374 337765557720648:337765560151162 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :375 -337765560152143:337765560152144 158125:158125 MARK(name(before HIP LaunchKernel)) 337765560156001:337765560156351 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :377 337765560157363:337765560157684 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :378 337765560158596:337765560169526 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :379 -337765560173414:337765560173415 158125:158125 MARK(name(after HIP LaunchKernel)) 337765560175588:337765561286232 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :381 337765569553195:337765572027742 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :382 -337765572029295:337765572029296 158125:158125 MARK(name(before HIP LaunchKernel)) 337765572036198:337765572036739 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :384 337765572037741:337765572038072 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :385 337765572039034:337765572051167 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :386 -337765572052609:337765572052610 158125:158125 MARK(name(after HIP LaunchKernel)) 337765572055224:337765573176419 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :388 337765581527320:337765583981769 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :389 -337765583982862:337765583982863 158125:158125 MARK(name(before HIP LaunchKernel)) 337765583986849:337765583987270 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :391 337765583988041:337765583988372 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :392 337765583989234:337765584005755 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :393 -337765584008750:337765584008751 158125:158125 MARK(name(after HIP LaunchKernel)) 337765584010904:337765585124174 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :395 337765593393521:337765595851157 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :396 -337765595852249:337765595852250 158125:158125 MARK(name(before HIP LaunchKernel)) 337765595857308:337765595858080 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :398 337765595858982:337765595859312 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :399 337765595860174:337765595870794 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :400 -337765595872116:337765595872117 158125:158125 MARK(name(after HIP LaunchKernel)) 337765595874491:337765596989704 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :402 337765605549108:337765608027193 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :403 -337765608028255:337765608028256 158125:158125 MARK(name(before HIP LaunchKernel)) 337765608032172:337765608032733 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :405 337765608033524:337765608033965 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :406 337765608039165:337765608050527 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :407 -337765608051949:337765608051950 158125:158125 MARK(name(after HIP LaunchKernel)) 337765608054193:337765609169507 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :409 337765617468711:337765619920355 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :410 -337765619921347:337765619921348 158125:158125 MARK(name(before HIP LaunchKernel)) 337765619927148:337765619927679 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :412 337765619928660:337765619929001 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :413 337765619929913:337765619939821 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :414 -337765619941124:337765619941125 158125:158125 MARK(name(after HIP LaunchKernel)) 337765619943298:337765621073860 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :416 337765629366101:337765631863661 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :417 -337765631864673:337765631864674 158125:158125 MARK(name(before HIP LaunchKernel)) 337765631868260:337765631868631 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :419 337765631869402:337765631869823 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :420 337765631873550:337765631884220 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :421 -337765631885433:337765631885434 158125:158125 MARK(name(after HIP LaunchKernel)) 337765631887536:337765632994073 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :423 337765641290129:337765643763524 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :424 -337765643764546:337765643764547 158125:158125 MARK(name(before HIP LaunchKernel)) 337765643769886:337765643770227 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :426 337765643771119:337765643771439 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :427 337765643772311:337765643782781 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :428 -337765643784173:337765643784174 158125:158125 MARK(name(after HIP LaunchKernel)) 337765643787810:337765644905058 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :430 337765653182400:337765655559503 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :431 -337765655561036:337765655561037 158125:158125 MARK(name(before HIP LaunchKernel)) 337765655564733:337765655565074 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :433 337765655565925:337765655566336 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :434 337765655569733:337765655579972 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :435 -337765655581435:337765655581436 158125:158125 MARK(name(after HIP LaunchKernel)) 337765655583769:337765656701417 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :437 337765665019797:337765667416377 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :438 -337765667417629:337765667417630 158125:158125 MARK(name(before HIP LaunchKernel)) 337765667423450:337765667423791 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :440 337765667424873:337765667425294 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :441 337765667426136:337765667436074 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :442 -337765667437407:337765667437408 158125:158125 MARK(name(after HIP LaunchKernel)) 337765667440122:337765668548412 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :444 337765676812980:337765679222275 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :445 -337765679223267:337765679223268 158125:158125 MARK(name(before HIP LaunchKernel)) 337765679227645:337765679227995 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :447 337765679228957:337765679229378 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :448 337765679232354:337765679244447 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :449 -337765679245809:337765679245810 158125:158125 MARK(name(after HIP LaunchKernel)) 337765679247953:337765680356955 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :451 337765688606675:337765691044864 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :452 -337765691045926:337765691045927 158125:158125 MARK(name(before HIP LaunchKernel)) 337765691051106:337765691051466 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :454 337765691052448:337765691052869 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :455 337765691053670:337765691064300 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :456 -337765691065613:337765691065614 158125:158125 MARK(name(after HIP LaunchKernel)) 337765691068518:337765692184794 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :458 337765700496681:337765702965147 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :459 -337765702966329:337765702966330 158125:158125 MARK(name(before HIP LaunchKernel)) 337765702970397:337765702970738 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :461 337765702971629:337765702971960 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :462 337765702975026:337765702985896 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :463 -337765702987239:337765702987240 158125:158125 MARK(name(after HIP LaunchKernel)) 337765702989493:337765704101801 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :465 337765712370696:337765714849511 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :466 -337765714852497:337765714852498 158125:158125 MARK(name(before HIP LaunchKernel)) 337765714856404:337765714856865 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :468 337765714857817:337765714858157 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :469 337765714859129:337765714869088 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :470 -337765714870220:337765714870221 158125:158125 MARK(name(after HIP LaunchKernel)) 337765714873206:337765715984822 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :472 337765724257526:337765726752442 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :473 -337765726753554:337765726753555 158125:158125 MARK(name(before HIP LaunchKernel)) 337765726757381:337765726757902 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :475 337765726758763:337765726759094 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :476 337765726762511:337765726773591 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :477 -337765726774964:337765726774965 158125:158125 MARK(name(after HIP LaunchKernel)) 337765726777028:337765727891159 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :479 337765736175495:337765738571424 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :480 -337765738573508:337765738573509 158125:158125 MARK(name(before HIP LaunchKernel)) 337765738577195:337765738577716 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :482 337765738578677:337765738578998 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :483 337765738580090:337765738590129 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :484 -337765738591672:337765738591673 158125:158125 MARK(name(after HIP LaunchKernel)) 337765738594668:337765739707977 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :486 337765748070500:337765750493230 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :487 -337765750494372:337765750494373 158125:158125 MARK(name(before HIP LaunchKernel)) 337765750497859:337765750498270 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :489 337765750500444:337765750500804 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :490 337765750501846:337765750512667 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :491 -337765750514159:337765750514160 158125:158125 MARK(name(after HIP LaunchKernel)) 337765750516434:337765751633932 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :493 337765759933566:337765762341477 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :494 -337765762344814:337765762344815 158125:158125 MARK(name(before HIP LaunchKernel)) 337765762348350:337765762348841 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :496 337765762349723:337765762350174 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :497 337765762351566:337765762361946 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :498 -337765762363499:337765762363500 158125:158125 MARK(name(after HIP LaunchKernel)) 337765762366384:337765763484233 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :500 337765771735786:337765774156773 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :501 -337765774157805:337765774157806 158125:158125 MARK(name(before HIP LaunchKernel)) 337765774161492:337765774162063 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :503 337765774165299:337765774165640 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :504 337765774166712:337765774177812 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :505 -337765774179285:337765774179286 158125:158125 MARK(name(after HIP LaunchKernel)) 337765774181369:337765775302103 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :507 337765783578812:337765786029635 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :508 -337765786033162:337765786033163 158125:158125 MARK(name(before HIP LaunchKernel)) 337765786036808:337765786037349 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :510 337765786038131:337765786038582 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :511 337765786039473:337765786052037 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :512 -337765786054091:337765786054092 158125:158125 MARK(name(after HIP LaunchKernel)) 337765786056656:337765787172160 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :514 337765795490429:337765797965808 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :515 -337765797966980:337765797966981 158125:158125 MARK(name(before HIP LaunchKernel)) 337765797970798:337765797971409 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :517 337765797973573:337765797973923 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :518 337765797974775:337765797985515 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :519 -337765797986738:337765797986739 158125:158125 MARK(name(after HIP LaunchKernel)) 337765797988832:337765799105267 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :521 337765807418016:337765809874289 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :522 -337765809877956:337765809877957 158125:158125 MARK(name(before HIP LaunchKernel)) 337765809881653:337765809882114 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :524 337765809883016:337765809883427 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :525 337765809884378:337765809895339 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :526 -337765809897333:337765809897334 158125:158125 MARK(name(after HIP LaunchKernel)) 337765809899497:337765811016343 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :528 337765819288546:337765821755830 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :529 -337765821757352:337765821757353 158125:158125 MARK(name(before HIP LaunchKernel)) 337765821760979:337765821761450 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :531 337765821764346:337765821764816 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :532 337765821765718:337765821776088 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :533 -337765821777450:337765821777451 158125:158125 MARK(name(after HIP LaunchKernel)) 337765821779594:337765822898395 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :535 337765831205783:337765833694167 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :536 -337765833697303:337765833697304 158125:158125 MARK(name(before HIP LaunchKernel)) 337765833701471:337765833701831 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :538 337765833702623:337765833702953 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :539 337765833703825:337765833715307 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :540 -337765833717601:337765833717602 158125:158125 MARK(name(after HIP LaunchKernel)) 337765833719785:337765834853393 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :542 337765843156995:337765845538948 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :543 -337765845540120:337765845540121 158125:158125 MARK(name(before HIP LaunchKernel)) 337765845544178:337765845544508 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :545 337765845546542:337765845546883 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :546 337765845547704:337765845557583 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :547 -337765845558916:337765845558917 158125:158125 MARK(name(after HIP LaunchKernel)) 337765845561130:337765846664872 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :549 337765854951950:337765857350254 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :550 -337765857351296:337765857351297 158125:158125 MARK(name(before HIP LaunchKernel)) 337765857354933:337765857355293 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :552 337765857356055:337765857356546 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :553 337765857357508:337765857367727 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :554 -337765857371213:337765857371214 158125:158125 MARK(name(after HIP LaunchKernel)) 337765857373287:337765858496676 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :556 337765866775191:337765869163646 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :557 -337765869164748:337765869164749 158125:158125 MARK(name(before HIP LaunchKernel)) 337765869168926:337765869169316 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :559 337765869174366:337765869174827 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :560 337765869175788:337765869186388 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :561 -337765869187891:337765869187892 158125:158125 MARK(name(after HIP LaunchKernel)) 337765869190156:337765870296673 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :563 337765878585186:337765881030107 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :564 -337765881031149:337765881031150 158125:158125 MARK(name(before HIP LaunchKernel)) 337765881034957:337765881035347 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :566 337765881036219:337765881036550 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :567 337765881037982:337765881050857 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :568 -337765881053522:337765881053523 158125:158125 MARK(name(after HIP LaunchKernel)) 337765881055616:337765882175217 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :570 337765890460034:337765892915986 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :571 -337765892917308:337765892917309 158125:158125 MARK(name(before HIP LaunchKernel)) 337765892922147:337765892922558 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :573 337765892923320:337765892923650 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :574 337765892925103:337765892935142 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :575 -337765892936464:337765892936465 158125:158125 MARK(name(after HIP LaunchKernel)) 337765892938639:337765894040557 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :577 337765902321336:337765904774573 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :578 -337765904775605:337765904775606 158125:158125 MARK(name(before HIP LaunchKernel)) 337765904779151:337765904779552 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :580 337765904780414:337765904780754 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :581 337765904781706:337765904792316 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :582 -337765904794911:337765904794912 158125:158125 MARK(name(after HIP LaunchKernel)) 337765904797416:337765906407563 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :584 337765914710163:337765917154774 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :585 -337765917155946:337765917155947 158125:158125 MARK(name(before HIP LaunchKernel)) 337765917162037:337765917162428 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :587 337765917163400:337765917163841 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :588 337765917164873:337765917176795 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :589 -337765917178248:337765917178249 158125:158125 MARK(name(after HIP LaunchKernel)) 337765917181103:337765918298240 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :591 337765926830502:337765929245907 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :592 -337765929247080:337765929247081 158125:158125 MARK(name(before HIP LaunchKernel)) 337765929250937:337765929251328 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :594 337765929252269:337765929252720 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :595 337765929253702:337765929266025 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :596 -337765929269762:337765929269763 158125:158125 MARK(name(after HIP LaunchKernel)) 337765929272007:337765930388232 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :598 337765938673068:337765941095628 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :599 -337765941096650:337765941096651 158125:158125 MARK(name(before HIP LaunchKernel)) 337765941101008:337765941101419 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :601 337765941102370:337765941102821 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :602 337765941103783:337765941115335 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :603 -337765941116758:337765941116759 158125:158125 MARK(name(after HIP LaunchKernel)) 337765941118952:337765942236489 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :605 337765950583563:337765953028034 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :606 -337765953029146:337765953029147 158125:158125 MARK(name(before HIP LaunchKernel)) 337765953032813:337765953033184 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :608 337765953034396:337765953034847 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :609 337765953037271:337765953047330 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :610 -337765953048773:337765953048774 158125:158125 MARK(name(after HIP LaunchKernel)) 337765953050847:337765954167944 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :612 337765962480472:337765964922048 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :613 -337765964923280:337765964923281 158125:158125 MARK(name(before HIP LaunchKernel)) 337765964928680:337765964929111 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :615 337765964930153:337765964930594 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :616 337765964931365:337765964942516 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :617 -337765964943658:337765964943659 158125:158125 MARK(name(after HIP LaunchKernel)) 337765964945752:337765966055586 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :619 337765974287412:337765976754355 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :620 -337765976755427:337765976755428 158125:158125 MARK(name(before HIP LaunchKernel)) 337765976759224:337765976759605 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :622 337765976760457:337765976760897 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :623 337765976763903:337765976774673 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :624 -337765976776036:337765976776037 158125:158125 MARK(name(after HIP LaunchKernel)) 337765976778220:337765977896830 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :626 337765986168812:337765988577395 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :627 -337765988578958:337765988578959 158125:158125 MARK(name(before HIP LaunchKernel)) 337765988584569:337765988584999 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :629 337765988585891:337765988586482 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :630 337765988587334:337765988598775 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :631 -337765988600238:337765988600239 158125:158125 MARK(name(after HIP LaunchKernel)) 337765988604055:337765989709069 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :633 337765998093663:337766000492497 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :634 -337766000493649:337766000493650 158125:158125 MARK(name(before HIP LaunchKernel)) 337766000497646:337766000498087 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :636 337766000498999:337766000499330 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :637 337766000501814:337766000511843 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :638 -337766000513607:337766000513608 158125:158125 MARK(name(after HIP LaunchKernel)) 337766000515690:337766001640322 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :640 337766009956637:337766012392983 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :641 -337766012393985:337766012393986 158125:158125 MARK(name(before HIP LaunchKernel)) 337766012399555:337766012400226 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :643 337766012401198:337766012401659 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :644 337766012402521:337766012412960 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :645 -337766012414383:337766012414384 158125:158125 MARK(name(after HIP LaunchKernel)) 337766012417790:337766013529516 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :647 337766021796369:337766024223527 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :648 -337766024224779:337766024224780 158125:158125 MARK(name(before HIP LaunchKernel)) 337766024228837:337766024229218 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :650 337766024229979:337766024230440 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :651 337766024234097:337766024245328 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :652 -337766024246560:337766024246561 158125:158125 MARK(name(after HIP LaunchKernel)) 337766024248784:337766025360712 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :654 337766033651129:337766036557400 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :655 -337766036560857:337766036560858 158125:158125 MARK(name(before HIP LaunchKernel)) 337766036564965:337766036565345 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :657 337766036566287:337766036566758 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :658 337766036567640:337766036580564 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :659 -337766036582197:337766036582198 158125:158125 MARK(name(after HIP LaunchKernel)) 337766036585143:337766037708642 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :661 337766045986585:337766048388886 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :662 -337766048389958:337766048389959 158125:158125 MARK(name(before HIP LaunchKernel)) 337766048393825:337766048394376 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :664 337766048395278:337766048395819 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :665 337766048397773:337766048409445 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :666 -337766048410777:337766048410778 158125:158125 MARK(name(after HIP LaunchKernel)) 337766048413082:337766049518447 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :668 337766058038627:337766060454343 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :669 -337766060457078:337766060457079 158125:158125 MARK(name(before HIP LaunchKernel)) 337766060461226:337766060461647 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :671 337766060462509:337766060462950 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :672 337766060463811:337766060475754 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :673 -337766060476986:337766060476987 158125:158125 MARK(name(after HIP LaunchKernel)) 337766060479932:337766061599133 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :675 337766069885611:337766072274686 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :676 -337766072275738:337766072275739 158125:158125 MARK(name(before HIP LaunchKernel)) 337766072279706:337766072280117 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :678 337766072280978:337766072281419 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :679 337766072284986:337766072296648 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :680 -337766072298511:337766072298512 158125:158125 MARK(name(after HIP LaunchKernel)) 337766072300575:337766073410839 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :682 337766081680868:337766084149093 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :683 -337766084152289:337766084152290 158125:158125 MARK(name(before HIP LaunchKernel)) 337766084156237:337766084156647 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :685 337766084157629:337766084157970 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :686 337766084158992:337766084170043 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :687 -337766084171385:337766084171386 158125:158125 MARK(name(after HIP LaunchKernel)) 337766084174451:337766085284064 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :689 337766093580402:337766096024893 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :690 -337766096026455:337766096026456 158125:158125 MARK(name(before HIP LaunchKernel)) 337766096030032:337766096030433 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :692 337766096034350:337766096034831 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :693 337766096035793:337766096047385 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :694 -337766096048818:337766096048819 158125:158125 MARK(name(after HIP LaunchKernel)) 337766096051563:337766097168119 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :696 337766105477451:337766107930458 158125:158125 hipMemcpy(dst=0x7f95c0800000, src=0x7f95c88ff010, sizeBytes=4194304, kind=1) :697 -337766107932672:337766107932673 158125:158125 MARK(name(before HIP LaunchKernel)) 337766107936439:337766107936860 158125:158125 __hipPushCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :699 337766107937852:337766107938193 158125:158125 __hipPopCallConfiguration(gridDim={}, blockDim={}, sharedMem=0, stream=0) :700 337766107939084:337766107949224 158125:158125 hipLaunchKernel(function_address=0x200ee0, numBlocks={}, dimBlocks={}, args=0x7ffea16f38c8, sharedMemBytes=0, stream=0) kernel=matrixTranspose(float*, float*, int) :701 -337766107950656:337766107950657 158125:158125 MARK(name(after HIP LaunchKernel)) 337766107953562:337766109068685 158125:158125 hipMemcpy(dst=0x7f95c84fe010, src=0x7f9484c00000, sizeBytes=4194304, kind=2) :703 337766117332762:337766117364702 158125:158125 hipFree(ptr=0x7f95c0800000) :704 337766117365825:337766117379931 158125:158125 hipFree(ptr=0x7f9484c00000) :705 diff --git a/test/hip/MatrixTranspose.cpp b/test/hip/MatrixTranspose.cpp index 7f19fe991e..b96f2b80a0 100644 --- a/test/hip/MatrixTranspose.cpp +++ b/test/hip/MatrixTranspose.cpp @@ -44,9 +44,6 @@ #define THREADS_PER_BLOCK_Y 4 #define THREADS_PER_BLOCK_Z 1 -// Mark API -extern "C" void roctracer_mark(const char* str); - // Device (Kernel) function, it must be void __global__ void matrixTranspose(float* out, float* in, const int width) { int x = hipBlockDim_x * hipBlockIdx_x + hipThreadIdx_x; @@ -100,7 +97,6 @@ int main() { // Memory transfer from host to device HIP_CALL(hipMemcpy(gpuMatrix, Matrix, NUM * sizeof(float), hipMemcpyHostToDevice)); - roctracer_mark("before HIP LaunchKernel"); roctxMark("before hipLaunchKernel"); int rangeId = roctxRangeStart("hipLaunchKernel range"); roctxRangePush("hipLaunchKernel"); @@ -108,7 +104,6 @@ int main() { hipLaunchKernelGGL( matrixTranspose, dim3(WIDTH / THREADS_PER_BLOCK_X, WIDTH / THREADS_PER_BLOCK_Y), dim3(THREADS_PER_BLOCK_X, THREADS_PER_BLOCK_Y), 0, 0, gpuTransposeMatrix, gpuMatrix, WIDTH); - roctracer_mark("after HIP LaunchKernel"); roctxMark("after hipLaunchKernel"); // Memory transfer from device to host