diff --git a/test/ctrl_hsa_trace.txt b/test/ctrl_hsa_trace.txt new file mode 100644 index 0000000000..8289d19a17 --- /dev/null +++ b/test/ctrl_hsa_trace.txt @@ -0,0 +1,164 @@ +tool HSA test: "./test/hsa/ctrl" +ROCTracer (pid=116451): + HSA-trace() + HSA-activity-trace() +> GPU agents : +> agent[0] : +>> Name : gfx900 +>> APU : 0 +>> HSAIL profile : 0 +>> Max Wave Size : 64 +>> Max Queue Size : 131072 +>> CU number : 64 +>> Waves per CU : 40 +>> SIMDs per CU : 4 +>> SE number : 4 +>> Shader Arrays per SE : 1 +TestHsa::Initialize : +> Using agent[0] : gfx900 +TestHsa::setup : +Code object filename: gfx9_DummyKernel.hsaco +TestHsa::run : +> Executing kernel: "DummyKernel" +> Waiting on kernel dispatch signal, que_idx=0 +> DONE, que_idx=0 +Test : Passed +Time taken for Setup by DummyKernel : 0.000803955 +Time taken for Dispatch by DummyKernel : 2.68555e-05 +Time taken in Total by DummyKernel : 0.000830811 +TestHsa::Initialize : +> Using agent[0] : gfx900 +TestHsa::setup : +Code object filename: gfx9_SimpleConvolution.hsaco +SimpleConvolution::init : +> Input[0] : +> 15 201 51 89 92 34 96 66 11 225 161 96 81 211 108 124 202 244 182 90 215 92 98 20 44 225 55 247 202 0 45 218 202 97 51 39 131 147 105 143 116 11 239 198 222 92 67 169 81 250 3 40 86 101 60 131 70 116 123 17 117 168 236 64 +> Mask : +> 0 0.2 0 +> 0.2 0.2 0.2 +> 0 0.2 0 +TestHsa::run : +> Executing kernel: "SimpleConvolution" +> Waiting on kernel dispatch signal, que_idx=1 +> DONE, que_idx=1 +> Output[0] : +> 45 60 89 75 79 86 45 43 104 82 144 105 99 90 109 124 123 146 149 124 120 87 43 36 88 91 113 103 98 53 68 104 113 106 76 90 90 122 82 92 102 124 95 149 112 102 69 82 146 116 103 62 50 96 99 87 84 110 88 81 61 105 134 71 +Test : Passed +Time taken for Setup by SimpleConvolution : 0.00060498 +Time taken for Dispatch by SimpleConvolution : 4.29687e-05 +Time taken in Total by SimpleConvolution : 0.000647949 +1822787198892285:1822787198903100 async-copy0 +1822786593183215:1822786593187325 116451:116451 hsa_amd_profiling_async_copy_enable() = 0 +1822786593205695:1822786593206405 116451:116451 hsa_agent_get_info(, 17, 0x7ffd08170f5c) = 0 +1822786593211235:1822786593212485 116451:116451 hsa_amd_memory_pool_get_info(, 0, 0x7ffd08170df8) = 0 +1822786593213335:1822786593213925 116451:116451 hsa_amd_memory_pool_get_info(, 1, 0x7ffd08170dfc) = 0 +1822786593214745:1822786593215305 116451:116451 hsa_amd_memory_pool_get_info(, 0, 0x7ffd08170df8) = 0 +1822786593216065:1822786593216635 116451:116451 hsa_amd_memory_pool_get_info(, 1, 0x7ffd08170dfc) = 0 +1822786593216065:1822786593217435 116451:116451 hsa_amd_agent_iterate_memory_pools(, 1, 0x143cfc0) = 1 +1822786593219035:1822786593219605 116451:116451 hsa_amd_memory_pool_get_info(, 0, 0x7ffd08170df8) = 0 +1822786593220385:1822786593220945 116451:116451 hsa_amd_memory_pool_get_info(, 1, 0x7ffd08170dfc) = 0 +1822786593220385:1822786593221715 116451:116451 hsa_amd_agent_iterate_memory_pools(, 1, 0x143cfd0) = 1 +1822786593224085:1822786593224895 116451:116451 hsa_agent_get_info(, 17, 0x7ffd08170f5c) = 0 +1822786593225835:1822786593231426 116451:116451 hsa_agent_get_info(, 0, 0x143d094) = 0 +1822786593233936:1822786593234536 116451:116451 hsa_agent_get_info(, 6, 0x143d0d4) = 0 +1822786593235326:1822786593235926 116451:116451 hsa_agent_get_info(, 14, 0x143d0d8) = 0 +1822786593236696:1822786593237276 116451:116451 hsa_agent_get_info(, 4, 0x143d0dc) = 0 +1822786593238046:1822786593238646 116451:116451 hsa_agent_get_info(, 40962, 0x143d0f8) = 0 +1822786593239416:1822786593240136 116451:116451 hsa_agent_get_info(, 40970, 0x143d0fc) = 0 +1822786593240946:1822786593241526 116451:116451 hsa_agent_get_info(, 40971, 0x143d100) = 0 +1822786593242296:1822786593242886 116451:116451 hsa_agent_get_info(, 40972, 0x143d104) = 0 +1822786593243666:1822786593244246 116451:116451 hsa_agent_get_info(, 40973, 0x143d108) = 0 +1822786593245736:1822786593246326 116451:116451 hsa_amd_memory_pool_get_info(, 0, 0x7ffd08170de8) = 0 +1822786593247096:1822786593247676 116451:116451 hsa_amd_memory_pool_get_info(, 1, 0x7ffd08170dec) = 0 +1822786593247096:1822786593248456 116451:116451 hsa_amd_agent_iterate_memory_pools(, 1, 0x143d0e8) = 1 +1822786593247096:1822786593250036 116451:116451 hsa_iterate_agents(1, 0x13fd320) = 0 +1822786593251826:1822786593416117 116451:116451 hsa_system_get_extension_table(, , , 0x13fd3b8) = 0 +1822786593417707:1822786593420377 116451:116451 hsa_system_get_extension_table(, , , 0x13fd408) = 0 +1822786593422447:1822786593423047 116451:116451 hsa_system_get_info(3, 0x7ffd08171128) = 0 +1822786593658778:1822786608352362 116451:116459 hsa_queue_create(, , , 0, 0, , , ) = 0 +1822786902531377:1822786902535757 116451:116459 hsa_signal_create(1, , 0, 0x7fa610001f20) = 0 +1822786902571037:1822786902584537 116451:116459 hsa_code_object_reader_create_from_file(5, 0x7fa665ffcbe0) = 0 +1822786902586167:1822786902597097 116451:116459 hsa_executable_create_alt(1, 0, +1822786902598597:1822786902965610 116451:116459 hsa_executable_load_agent_code_object(, , , +1822786902967780:1822786903353172 116451:116459 hsa_executable_freeze(, ) = 0 +1822786903355162:1822786903356442 116451:116459 hsa_executable_get_symbol(, +1822786903362512:1822786903363052 116451:116459 hsa_executable_symbol_get_info(, 13, 0x7fa665ffcc44) = 0 +1822786903363492:1822786903363782 116451:116459 hsa_executable_symbol_get_info(, 14, 0x7fa665ffcc48) = 0 +1822786903364172:1822786903364492 116451:116459 hsa_executable_symbol_get_info(, 22, 0x7fa665ffcc58) = 0 +1822786903365702:1822786903366022 116451:116459 hsa_signal_store_relaxed(, 1) = void +1822786903370912:1822786903371252 116451:116459 hsa_queue_load_write_index_relaxed(0x7fa7a2ce1000) = 0 +1822786903372632:1822786903372942 116451:116459 hsa_queue_store_write_index_relaxed(0x7fa7a2ce1000, ) = void +1822786903374072:1822786903374512 116451:116459 hsa_queue_load_read_index_relaxed(0x7fa7a2ce1000) = 0 +1822786903375092:1822786903375562 116451:116459 hsa_signal_store_relaxed(, 0) = void +1822786903379112:1822786903393132 116451:116459 hsa_signal_wait_scacquire(, 2, 1, , 0) = 0 +1822786903425033:1822786903474693 116451:116459 hsa_executable_destroy() = 0 +1822786903475683:1822786903476973 116451:116459 hsa_signal_destroy() = 0 +1822787197612807:1822787197613567 116451:116459 hsa_signal_create(1, , 0, 0x7fa610007340) = 0 +1822787197622077:1822787197628137 116451:116459 hsa_code_object_reader_create_from_file(7, 0x7fa665ffcbe0) = 0 +1822787197628677:1822787197629627 116451:116459 hsa_executable_create_alt(1, 0, +1822787197630087:1822787197791048 116451:116459 hsa_executable_load_agent_code_object(, , , +1822787197792018:1822787197833668 116451:116459 hsa_executable_freeze(, ) = 0 +1822787197834218:1822787197839559 116451:116459 hsa_executable_get_symbol(, +1822787197841769:1822787197856699 116451:116459 hsa_amd_memory_pool_allocate(, , , 0x7fa665ffcc68) = 0 +1822787197858079:1822787197924589 116451:116459 hsa_amd_agents_allow_access(, 0x7fa665ffcc70, 0, 0x7fa7a2cc4000) = 0 +1822787197926269:1822787197927179 116451:116459 hsa_amd_memory_pool_allocate(, , , 0x7fa665ffcc70) = 0 +1822787197927659:1822787197939219 116451:116459 hsa_amd_memory_pool_allocate(, , , 0x7fa665ffcc68) = 0 +1822787197939719:1822787197992339 116451:116459 hsa_amd_agents_allow_access(, 0x7fa665ffcc70, 0, 0x7fa7a2cd6000) = 0 +1822787197993039:1822787197993399 116451:116459 hsa_executable_symbol_get_info(, 11, 0x7fa665ffcca0) = 0 +1822787197995009:1822787198005070 116451:116459 hsa_amd_memory_pool_allocate(, , , 0x7fa665ffcc68) = 0 +1822787198005560:1822787198054310 116451:116459 hsa_amd_agents_allow_access(, 0x7fa665ffcc70, 0, 0x7fa7a2cd4000) = 0 +1822787198222651:1822787198223061 116451:116459 hsa_executable_symbol_get_info(, 13, 0x7fa665ffcc44) = 0 +1822787198223531:1822787198223831 116451:116459 hsa_executable_symbol_get_info(, 14, 0x7fa665ffcc48) = 0 +1822787198224221:1822787198224531 116451:116459 hsa_executable_symbol_get_info(, 22, 0x7fa665ffcc58) = 0 +1822787198224991:1822787198225351 116451:116459 hsa_signal_store_relaxed(, 1) = void +1822787198228821:1822787198229191 116451:116459 hsa_queue_load_write_index_relaxed(0x7fa7a2ce1000) = 1 +1822787198229651:1822787198229961 116451:116459 hsa_queue_store_write_index_relaxed(0x7fa7a2ce1000, ) = void +1822787198230421:1822787198230851 116451:116459 hsa_queue_load_read_index_relaxed(0x7fa7a2ce1000) = 1 +1822787198231381:1822787198231871 116451:116459 hsa_signal_store_relaxed(, 1) = void +1822787198234591:1822787198268311 116451:116459 hsa_signal_wait_scacquire(, 2, 1, , 0) = 0 +1822787198271101:1822787198289651 116451:116459 hsa_amd_memory_pool_allocate(, , , 0x7fa665ffcc68) = 0 +1822787198290261:1822787198347092 116451:116459 hsa_amd_agents_allow_access(, 0x7fa665ffcc70, 0, 0x7fa7a2c78000) = 0 +1822787198347792:1822787198349312 116451:116459 hsa_signal_create(1, , 0, 0x7fa665ffcc40) = 0 +1822787198356932:1822787198357642 116451:116459 hsa_agent_get_info(, 17, 0x7fa665ffc7bc) = 0 +1822787198359432:1822787198360132 116451:116459 hsa_amd_memory_pool_get_info(, 0, 0x7fa665ffc658) = 0 +1822787198360542:1822787198360842 116451:116459 hsa_amd_memory_pool_get_info(, 1, 0x7fa665ffc65c) = 0 +1822787198361262:1822787198361552 116451:116459 hsa_amd_memory_pool_get_info(, 0, 0x7fa665ffc658) = 0 +1822787198361942:1822787198362232 116451:116459 hsa_amd_memory_pool_get_info(, 1, 0x7fa665ffc65c) = 0 +1822787198361942:1822787198362632 116451:116459 hsa_amd_agent_iterate_memory_pools(, 1, 0x7fa610006d60) = 1 +1822787198363522:1822787198363812 116451:116459 hsa_amd_memory_pool_get_info(, 0, 0x7fa665ffc658) = 0 +1822787198364212:1822787198364502 116451:116459 hsa_amd_memory_pool_get_info(, 1, 0x7fa665ffc65c) = 0 +1822787198364212:1822787198364892 116451:116459 hsa_amd_agent_iterate_memory_pools(, 1, 0x7fa610006d70) = 1 +1822787198365732:1822787198366072 116451:116459 hsa_agent_get_info(, 17, 0x7fa665ffc7bc) = 0 +1822787198366522:1822787198369532 116451:116459 hsa_agent_get_info(, 0, 0x7fa610006e34) = 0 +1822787198372162:1822787198372472 116451:116459 hsa_agent_get_info(, 6, 0x7fa610006e74) = 0 +1822787198372872:1822787198373172 116451:116459 hsa_agent_get_info(, 14, 0x7fa610006e78) = 0 +1822787198373572:1822787198373862 116451:116459 hsa_agent_get_info(, 4, 0x7fa610006e7c) = 0 +1822787198374262:1822787198374572 116451:116459 hsa_agent_get_info(, 40962, 0x7fa610006e98) = 0 +1822787198375892:1822787198376202 116451:116459 hsa_agent_get_info(, 40970, 0x7fa610006e9c) = 0 +1822787198376692:1822787198376992 116451:116459 hsa_agent_get_info(, 40971, 0x7fa610006ea0) = 0 +1822787198377392:1822787198377692 116451:116459 hsa_agent_get_info(, 40972, 0x7fa610006ea4) = 0 +1822787198378092:1822787198378392 116451:116459 hsa_agent_get_info(, 40973, 0x7fa610006ea8) = 0 +1822787198379162:1822787198379462 116451:116459 hsa_amd_memory_pool_get_info(, 0, 0x7fa665ffc648) = 0 +1822787198379852:1822787198380152 116451:116459 hsa_amd_memory_pool_get_info(, 1, 0x7fa665ffc64c) = 0 +1822787198379852:1822787198380542 116451:116459 hsa_amd_agent_iterate_memory_pools(, 1, 0x7fa610006e88) = 1 +1822787198379852:1822787198381142 116451:116459 hsa_iterate_agents(1, 0x7fa610006980) = 0 +1822787198381692:1822787198397632 116451:116459 hsa_system_get_major_extension_table(, , , 0x7fa610006a18) = 0 +1822787198398112:1822787198398412 116451:116459 hsa_system_get_major_extension_table(, , , 0x7fa610006a68) = 0 +1822787198399032:1822787198399332 116451:116459 hsa_system_get_info(3, 0x7fa665ffc988) = 0 +1822787198399782:1822787198400322 116451:116459 hsa_system_get_info(2, 0x7fa665ffc9d0) = 0 +1822787198400762:1822787198401922 116451:116459 hsa_signal_create(1, , 0, 0x7fa68f797050) = 0 +1822787198402472:1822787198405132 116451:116459 hsa_amd_signal_async_handler(, 2, 1, 1, 0x7fa68f797010) = 0 +1822787198405752:1822787198837475 116451:116459 hsa_amd_memory_async_copy(0x7fa7a2c78000, , 0x7fa688203000, , , , 0, ) = 0 +1822787198931945:1822787198941165 116451:116454 hsa_amd_profiling_get_async_copy_time(, 0x7fa7a092bc40) = 0 +1822787198944925:1822787198946035 116451:116454 hsa_system_get_info(2, 0x7fa7a092bc38) = 0 +1822787198947005:1822787198948155 116451:116454 hsa_signal_load_relaxed() = 1 +1822787198838365:1822787198950945 116451:116459 hsa_signal_wait_scacquire(, 2, 1, , 0) = 0 +1822787198949035:1822787198951965 116451:116454 hsa_signal_store_screlease(, 0) = void +1822787198952535:1822787198953995 116451:116459 hsa_signal_destroy() = 0 +1822787198953835:1822787198955305 116451:116454 hsa_signal_destroy() = 0 +1822787199054396:1822787199072966 116451:116459 hsa_memory_free(0x7fa7a2c78000) = 0 +1822787199096536:1822787199113536 116451:116459 hsa_executable_destroy() = 0 +1822787199114426:1822787199116066 116451:116459 hsa_signal_destroy() = 0 +1822787199118006:1822787200339674 116451:116459 hsa_queue_destroy() = 0 +tool HSA test: PASSED +8 tests total / 1 tests run / 0 tests failed