48 KiB
48 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | GRBM_COUNT | GRBM_GUI_ACTIVE | CPC_ME1_BUSY_FOR_PACKET_DECODE | SQ_CYCLES | SQ_WAVES | SQ_WAVE_CYCLES | SQ_BUSY_CYCLES | SQ_LEVEL_WAVES | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 229609 | 229609 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7fbe34404280 | 381263 | 381263 | 8890 | 3050112 | 524288 | 238895534 | 2962457 | 0 | 971826084 | 17704936968427 | 17704230750143 | 17705081453045 | 17705081565284 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 229609 | 229609 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7fbe34423f80 | 33603 | 33603 | 30038 | 268832 | 512 | 1728667 | 161482 | 0 | 6928212 | 17705086704565 | 17705081453045 | 17705086842338 | 17705086846922 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7fbe37412380 | 0x7fbe34423fc0 | 165838 | 165838 | 13145 | 1326712 | 65536 | 71213297 | 1218469 | 0 | 286591028 | 17705086889921 | 17705086842338 | 17705087234019 | 17705087236572 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7fbe37412200 | 0x7fbe34424000 | 310165 | 310165 | 24235 | 2481328 | 65536 | 221979920 | 2376367 | 0 | 889649004 | 17705087280861 | 17705087234019 | 17705087659940 | 17705087662531 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7fbe37412080 | 0x7fbe34424040 | 310242 | 310242 | 24406 | 2481944 | 65536 | 226991974 | 2375657 | 0 | 909693676 | 17705087702290 | 17705087659940 | 17705088078341 | 17705088080621 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7fbe34c6df00 | 0x7fbe34424080 | 166125 | 166125 | 15134 | 1329008 | 65536 | 84131616 | 1220911 | 0 | 338253916 | 17705088120850 | 17705088078341 | 17705088401221 | 17705088403393 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7fbe34c6dd80 | 0x7fbe344240c0 | 164834 | 164834 | 13742 | 1318680 | 65536 | 73136413 | 1209232 | 0 | 294282380 | 17705088442192 | 17705088401221 | 17705088720902 | 17705088723075 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7fbe34c6dc00 | 0x7fbe34424100 | 164358 | 164358 | 14715 | 1314872 | 65536 | 95265591 | 1206243 | 0 | 382790668 | 17705088776333 | 17705088720902 | 17705089042823 | 17705089045137 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7fbe34c6da80 | 0x7fbe34424140 | 309562 | 309562 | 24423 | 2476504 | 65536 | 228046732 | 2367471 | 0 | 913915752 | 17705089085186 | 17705089042823 | 17705089470504 | 17705089472616 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7fbe34c6d900 | 0x7fbe34424180 | 307173 | 307173 | 21988 | 2457392 | 65536 | 215027111 | 2351352 | 0 | 861837712 | 17705089511805 | 17705089470504 | 17705089885865 | 17705089887976 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7fbe34c6d780 | 0x7fbe344241c0 | 164556 | 164556 | 14994 | 1316456 | 65536 | 92600180 | 1208307 | 0 | 372132588 | 17705089927125 | 17705089885865 | 17705090220906 | 17705090223297 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7fbe34c6d600 | 0x7fbe34424200 | 164966 | 164966 | 15399 | 1319736 | 65536 | 95863865 | 1214595 | 0 | 385182356 | 17705090263036 | 17705090220906 | 17705090554187 | 17705090556419 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7fbe37412480 | 0x7fbe34424240 | 165628 | 165628 | 15377 | 1325032 | 65536 | 83907206 | 1210207 | 0 | 337362764 | 17705090605538 | 17705090554187 | 17705090879308 | 17705090881611 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7fbe37412300 | 0x7fbe34424280 | 309987 | 309987 | 24071 | 2479904 | 65536 | 226883645 | 2374159 | 0 | 909263920 | 17705090921880 | 17705090879308 | 17705091293389 | 17705091295050 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7fbe37412180 | 0x7fbe344242c0 | 309063 | 309063 | 21814 | 2472512 | 65536 | 221965244 | 2363589 | 0 | 889590152 | 17705091335869 | 17705091293389 | 17705091677709 | 17705091679250 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7fbe37412000 | 0x7fbe34424300 | 164631 | 164631 | 14216 | 1317056 | 65536 | 83681877 | 1214062 | 0 | 336460536 | 17705091718619 | 17705091677709 | 17705091975310 | 17705091976993 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7fbe34c6de80 | 0x7fbe34424340 | 165019 | 165019 | 15145 | 1320160 | 65536 | 91446317 | 1215671 | 0 | 367521048 | 17705092016992 | 17705091975310 | 17705092267311 | 17705092268976 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7fbe34c6dd00 | 0x7fbe34424380 | 163639 | 163639 | 14467 | 1309120 | 65536 | 87883547 | 1203538 | 0 | 353257384 | 17705092316344 | 17705092267311 | 17705092560112 | 17705092561788 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7fbe34c6db80 | 0x7fbe344243c0 | 309723 | 309723 | 24301 | 2477792 | 65536 | 228283365 | 2371609 | 0 | 914862896 | 17705092602147 | 17705092560112 | 17705092941873 | 17705092943559 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7fbe34c6da00 | 0x7fbe34424400 | 307033 | 307033 | 22759 | 2456272 | 65536 | 219601637 | 2352822 | 0 | 880138900 | 17705092985248 | 17705092941873 | 17705093324114 | 17705093325719 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7fbe34c6d880 | 0x7fbe34424440 | 165041 | 165041 | 14422 | 1320336 | 65536 | 88222019 | 1213142 | 0 | 354624520 | 17705093365658 | 17705093324114 | 17705093617714 | 17705093619412 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7fbe34c6d700 | 0x7fbe34424480 | 163329 | 163329 | 15001 | 1306640 | 65536 | 106677405 | 1204086 | 0 | 428431280 | 17705093658911 | 17705093617714 | 17705093910995 | 17705093912604 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7fbe37412580 | 0x7fbe344244c0 | 163267 | 163267 | 15758 | 1306144 | 65536 | 98906850 | 1202758 | 0 | 397359688 | 17705093959653 | 17705093910995 | 17705094219476 | 17705094221506 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7fbe37412400 | 0x7fbe34424500 | 309007 | 309007 | 23045 | 2472064 | 65536 | 226694224 | 2367706 | 0 | 908506572 | 17705094262355 | 17705094219476 | 17705094604277 | 17705094605857 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7fbe37412280 | 0x7fbe34424540 | 306389 | 306389 | 21695 | 2451120 | 65536 | 213818025 | 2347253 | 0 | 857001908 | 17705094646686 | 17705094604277 | 17705094987638 | 17705094989297 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7fbe37412100 | 0x7fbe34424580 | 161903 | 161903 | 14760 | 1295232 | 65536 | 97386646 | 1191628 | 0 | 391278680 | 17705095029976 | 17705094987638 | 17705095283638 | 17705095285290 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7fbe34c6df80 | 0x7fbe344245c0 | 163197 | 163197 | 14617 | 1305584 | 65536 | 90919910 | 1203451 | 0 | 365412128 | 17705095325729 | 17705095283638 | 17705095575319 | 17705095577032 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7fbe34c6de00 | 0x7fbe34424600 | 162819 | 162819 | 15650 | 1302560 | 65536 | 102346093 | 1199176 | 0 | 411104504 | 17705095624611 | 17705095575319 | 17705095868120 | 17705095869755 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7fbe34c6dc80 | 0x7fbe34424640 | 306939 | 306939 | 24174 | 2455520 | 65536 | 221277350 | 2340420 | 0 | 886839708 | 17705095909424 | 17705095868120 | 17705096254681 | 17705096256345 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7fbe34c6db00 | 0x7fbe34424680 | 306145 | 306145 | 22292 | 2449168 | 65536 | 216094156 | 2340460 | 0 | 866106260 | 17705096297934 | 17705096254681 | 17705096637882 | 17705096639496 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7fbe34c6d980 | 0x7fbe344246c0 | 162810 | 162810 | 14509 | 1302488 | 65536 | 94344285 | 1198509 | 0 | 379104220 | 17705096679645 | 17705096637882 | 17705096932602 | 17705096934328 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7fbe34c6d800 | 0x7fbe34424700 | 162701 | 162701 | 14523 | 1301616 | 65536 | 90597937 | 1199637 | 0 | 364121044 | 17705096974877 | 17705096932602 | 17705097224923 | 17705097226521 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7fbe34c6d680 | 0x7fbe34424740 | 164134 | 164134 | 15690 | 1313080 | 65536 | 93949974 | 1202861 | 0 | 377531076 | 17705097274700 | 17705097224923 | 17705097525244 | 17705097526863 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7fbe37412500 | 0x7fbe34424780 | 306815 | 306815 | 24517 | 2454528 | 65536 | 226566685 | 2352541 | 0 | 907998044 | 17705097567122 | 17705097525244 | 17705097905885 | 17705097907454 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7fbe37412380 | 0x7fbe344247c0 | 306268 | 306268 | 23038 | 2450152 | 65536 | 214660343 | 2346170 | 0 | 860369424 | 17705097947933 | 17705097905885 | 17705098303806 | 17705098305474 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7fbe37412200 | 0x7fbe34424800 | 162649 | 162649 | 14408 | 1301200 | 65536 | 85360088 | 1196434 | 0 | 343170176 | 17705098346213 | 17705098303806 | 17705098603967 | 17705098605726 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7fbe37412080 | 0x7fbe34424840 | 163216 | 163216 | 15179 | 1305736 | 65536 | 87713806 | 1201618 | 0 | 352581620 | 17705098646735 | 17705098603967 | 17705098907327 | 17705098909039 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7fbe34c6df00 | 0x7fbe34424880 | 162349 | 162349 | 14872 | 1298800 | 65536 | 96268286 | 1196763 | 0 | 386798792 | 17705098957687 | 17705098907327 | 17705099202048 | 17705099203651 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7fbe34c6dd80 | 0x7fbe344248c0 | 304648 | 304648 | 23443 | 2437192 | 65536 | 213568663 | 2324376 | 0 | 856003796 | 17705099243980 | 17705099202048 | 17705099584449 | 17705099586092 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7fbe34c6dc00 | 0x7fbe34424900 | 302400 | 302400 | 20924 | 2419208 | 65536 | 211961669 | 2312297 | 0 | 849578620 | 17705099625151 | 17705099584449 | 17705099966050 | 17705099967772 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7fbe34c6da80 | 0x7fbe34424940 | 163390 | 163390 | 15302 | 1307128 | 65536 | 85524809 | 1201537 | 0 | 343827676 | 17705100008471 | 17705099966050 | 17705100263491 | 17705100265055 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7fbe34c6d900 | 0x7fbe34424980 | 163264 | 163264 | 15437 | 1306120 | 65536 | 92225451 | 1195519 | 0 | 370630844 | 17705100305144 | 17705100263491 | 17705100559011 | 17705100560597 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7fbe34c6d780 | 0x7fbe344249c0 | 161946 | 161946 | 14516 | 1295576 | 65536 | 95209824 | 1190713 | 0 | 382569372 | 17705100608096 | 17705100559011 | 17705100858052 | 17705100859750 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7fbe34c6d600 | 0x7fbe34424a00 | 305858 | 305858 | 24378 | 2446872 | 65536 | 225426422 | 2340679 | 0 | 903435480 | 17705100900759 | 17705100858052 | 17705101241733 | 17705101243460 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7fbe37412480 | 0x7fbe34424a40 | 301950 | 301950 | 22135 | 2415608 | 65536 | 214786769 | 2312050 | 0 | 860874552 | 17705101284249 | 17705101241733 | 17705101623174 | 17705101624721 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7fbe37412300 | 0x7fbe34424a80 | 162289 | 162289 | 14670 | 1298320 | 65536 | 82402047 | 1193739 | 0 | 331348104 | 17705101665280 | 17705101623174 | 17705101919175 | 17705101920883 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7fbe37412180 | 0x7fbe34424ac0 | 163638 | 163638 | 16770 | 1309112 | 65536 | 96052913 | 1198527 | 0 | 385947872 | 17705101961272 | 17705101919175 | 17705102223976 | 17705102225846 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7fbe37412000 | 0x7fbe34424b00 | 162304 | 162304 | 15238 | 1298440 | 65536 | 90659565 | 1195226 | 0 | 364367700 | 17705102274054 | 17705102223976 | 17705102522536 | 17705102524078 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7fbe34c6de80 | 0x7fbe34424b40 | 303252 | 303252 | 22970 | 2426024 | 65536 | 215841142 | 2314125 | 0 | 865093576 | 17705102564847 | 17705102522536 | 17705102904617 | 17705102906228 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7fbe34c6dd00 | 0x7fbe34424b80 | 303952 | 303952 | 20809 | 2431624 | 65536 | 216431221 | 2318408 | 0 | 867456572 | 17705102946227 | 17705102904617 | 17705103290058 | 17705103291649 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7fbe34c6db80 | 0x7fbe34424bc0 | 162802 | 162802 | 15015 | 1302424 | 65536 | 89479025 | 1198028 | 0 | 359649528 | 17705103331678 | 17705103290058 | 17705103585099 | 17705103586751 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7fbe34c6da00 | 0x7fbe34424c00 | 164999 | 164999 | 16433 | 1320000 | 65536 | 100821277 | 1211993 | 0 | 405029076 | 17705103627070 | 17705103585099 | 17705103886540 | 17705103888294 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7fbe34c6d880 | 0x7fbe34424c40 | 163100 | 163100 | 14932 | 1304808 | 65536 | 94066627 | 1197106 | 0 | 377992692 | 17705103935413 | 17705103886540 | 17705104188620 | 17705104190336 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7fbe34c6d700 | 0x7fbe34424c80 | 301112 | 301112 | 23161 | 2408904 | 65536 | 215671737 | 2299808 | 0 | 864417964 | 17705104230695 | 17705104188620 | 17705104566541 | 17705104568197 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7fbe37412580 | 0x7fbe34424cc0 | 301782 | 301782 | 21601 | 2414264 | 65536 | 214445803 | 2308591 | 0 | 859514404 | 17705104608596 | 17705104566541 | 17705104950542 | 17705104952257 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7fbe37412400 | 0x7fbe34424d00 | 162606 | 162606 | 14746 | 1300856 | 65536 | 87328009 | 1196451 | 0 | 351042964 | 17705104992666 | 17705104950542 | 17705105251343 | 17705105252929 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7fbe37412280 | 0x7fbe34424d40 | 170036 | 170036 | 15988 | 1360296 | 65536 | 100276662 | 1256004 | 0 | 402853812 | 17705105293348 | 17705105251343 | 17705105559344 | 17705105561062 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7fbe37412100 | 0x7fbe34424d80 | 162706 | 162706 | 15641 | 1301656 | 65536 | 94855038 | 1193196 | 0 | 381146724 | 17705105609860 | 17705105559344 | 17705105857105 | 17705105858704 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7fbe34c6df80 | 0x7fbe34424dc0 | 300682 | 300682 | 22096 | 2405464 | 65536 | 210952379 | 2299080 | 0 | 845542368 | 17705105899953 | 17705105857105 | 17705106237265 | 17705106239145 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7fbe34c6de00 | 0x7fbe34424e00 | 300150 | 300150 | 20963 | 2401208 | 65536 | 207324436 | 2293832 | 0 | 831030548 | 17705106279684 | 17705106237265 | 17705106624466 | 17705106626145 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7fbe34c6dc80 | 0x7fbe34424e40 | 163188 | 163188 | 15270 | 1305512 | 65536 | 88660520 | 1200099 | 0 | 356383684 | 17705106666304 | 17705106624466 | 17705106925107 | 17705106926737 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7fbe34c6db00 | 0x7fbe34424e80 | 176984 | 176984 | 17234 | 1415880 | 65536 | 110540438 | 1307857 | 0 | 443898016 | 17705106967236 | 17705106925107 | 17705107231828 | 17705107233520 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7fbe34c6d980 | 0x7fbe34424ec0 | 162702 | 162702 | 15277 | 1301624 | 65536 | 88359929 | 1192596 | 0 | 355179716 | 17705107280889 | 17705107231828 | 17705107528949 | 17705107530702 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7fbe34c6d800 | 0x7fbe34424f00 | 303138 | 303138 | 23854 | 2425112 | 65536 | 219345754 | 2319706 | 0 | 879113968 | 17705107570181 | 17705107528949 | 17705107914710 | 17705107916343 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7fbe34c6d680 | 0x7fbe34424f40 | 301178 | 301178 | 22581 | 2409432 | 65536 | 210856510 | 2300482 | 0 | 845156940 | 17705107956902 | 17705107914710 | 17705108296151 | 17705108297833 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7fbe37412500 | 0x7fbe34424f80 | 161016 | 161016 | 15381 | 1288136 | 65536 | 90996652 | 1185572 | 0 | 365727792 | 17705108337672 | 17705108296151 | 17705108591191 | 17705108592986 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7fbe37412380 | 0x7fbe34424fc0 | 182776 | 182776 | 17324 | 1462216 | 65536 | 106307416 | 1351053 | 0 | 426971324 | 17705108632915 | 17705108591191 | 17705108899992 | 17705108901698 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7fbe37412200 | 0x7fbe34425000 | 161966 | 161966 | 15750 | 1295736 | 65536 | 87475365 | 1182769 | 0 | 351630396 | 17705108961827 | 17705108899992 | 17705109195833 | 17705109197421 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7fbe37412080 | 0x7fbe34425040 | 300684 | 300684 | 21144 | 2405480 | 65536 | 208762624 | 2299625 | 0 | 836784340 | 17705109238380 | 17705109195833 | 17705109576954 | 17705109578621 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7fbe34c6df00 | 0x7fbe34425080 | 304284 | 304284 | 23686 | 2434280 | 65536 | 213979500 | 2316743 | 0 | 857651068 | 17705109618800 | 17705109576954 | 17705109966715 | 17705109968351 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7fbe34c6dd80 | 0x7fbe344250c0 | 163566 | 163566 | 15500 | 1308536 | 65536 | 88900516 | 1199255 | 0 | 357338716 | 17705110008030 | 17705109966715 | 17705110275675 | 17705110277544 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7fbe34c6dc00 | 0x7fbe34425100 | 193521 | 193521 | 18417 | 1548176 | 65536 | 109276187 | 1435404 | 0 | 438848224 | 17705110317593 | 17705110275675 | 17705110591996 | 17705110593646 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7fbe34c6da80 | 0x7fbe34425140 | 161511 | 161511 | 14317 | 1292096 | 65536 | 83793437 | 1183047 | 0 | 336901876 | 17705110641284 | 17705110591996 | 17705110893597 | 17705110895268 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7fbe34c6d900 | 0x7fbe34425180 | 303427 | 303427 | 24121 | 2427424 | 65536 | 220333979 | 2315446 | 0 | 883072064 | 17705110936297 | 17705110893597 | 17705111275518 | 17705111277278 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7fbe34c6d780 | 0x7fbe344251c0 | 301669 | 301669 | 22336 | 2413360 | 65536 | 193757797 | 2295441 | 0 | 776764820 | 17705111317477 | 17705111275518 | 17705111656799 | 17705111658369 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7fbe34c6d600 | 0x7fbe34425200 | 163132 | 163132 | 15814 | 1305064 | 65536 | 95038699 | 1197595 | 0 | 381887776 | 17705111698048 | 17705111656799 | 17705111951520 | 17705111953211 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7fbe37412480 | 0x7fbe34425240 | 201967 | 201967 | 17960 | 1615744 | 65536 | 129660228 | 1505036 | 0 | 520385696 | 17705111992780 | 17705111951520 | 17705112276320 | 17705112277973 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7fbe37412300 | 0x7fbe34425280 | 162336 | 162336 | 15959 | 1298696 | 65536 | 93453616 | 1190100 | 0 | 375552924 | 17705112325832 | 17705112276320 | 17705112570401 | 17705112572056 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7fbe37412180 | 0x7fbe344252c0 | 301634 | 301634 | 23478 | 2413080 | 65536 | 220970665 | 2309762 | 0 | 885618456 | 17705112613065 | 17705112570401 | 17705112959842 | 17705112961576 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7fbe37412000 | 0x7fbe34425300 | 299082 | 299082 | 20973 | 2392664 | 65536 | 209825274 | 2287308 | 0 | 841029488 | 17705113002365 | 17705112959842 | 17705113341603 | 17705113343326 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7fbe34c6de80 | 0x7fbe34425340 | 163338 | 163338 | 17143 | 1306712 | 65536 | 97560765 | 1194097 | 0 | 391972256 | 17705113383045 | 17705113341603 | 17705113637284 | 17705113638969 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7fbe34c6dd00 | 0x7fbe34425380 | 212062 | 212062 | 19332 | 1696504 | 65536 | 128162203 | 1580576 | 0 | 514394476 | 17705113679218 | 17705113637284 | 17705113963685 | 17705113965221 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7fbe34c6db80 | 0x7fbe344253c0 | 161500 | 161500 | 14666 | 1292008 | 65536 | 87294050 | 1184373 | 0 | 350904944 | 17705114012580 | 17705113963685 | 17705114266245 | 17705114267993 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7fbe34c6da00 | 0x7fbe34425400 | 299650 | 299650 | 23380 | 2397208 | 65536 | 210704906 | 2287346 | 0 | 844557572 | 17705114308002 | 17705114266245 | 17705114653286 | 17705114655013 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7fbe34c6d880 | 0x7fbe34425440 | 301088 | 301088 | 22972 | 2408712 | 65536 | 218429991 | 2302461 | 0 | 875447976 | 17705114695202 | 17705114653286 | 17705115033607 | 17705115035184 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7fbe34c6d700 | 0x7fbe34425480 | 162716 | 162716 | 16173 | 1301736 | 65536 | 99043577 | 1197113 | 0 | 397912140 | 17705115074653 | 17705115033607 | 17705115328168 | 17705115329836 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7fbe37412580 | 0x7fbe344254c0 | 220639 | 220639 | 19794 | 1765120 | 65536 | 128558622 | 1648289 | 0 | 515983636 | 17705115370005 | 17705115328168 | 17705115659049 | 17705115660728 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7fbe37412400 | 0x7fbe34425500 | 160864 | 160864 | 15304 | 1286920 | 65536 | 89554412 | 1184374 | 0 | 359961692 | 17705115709227 | 17705115659049 | 17705115952809 | 17705115954441 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7fbe37412280 | 0x7fbe34425540 | 299107 | 299107 | 22546 | 2392864 | 65536 | 214898977 | 2289918 | 0 | 861326188 | 17705115994910 | 17705115952809 | 17705116334090 | 17705116335801 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7fbe37412100 | 0x7fbe34425580 | 300940 | 300940 | 22831 | 2407528 | 65536 | 211417761 | 2295026 | 0 | 847400144 | 17705116376800 | 17705116334090 | 17705116717611 | 17705116719261 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7fbe34c6df80 | 0x7fbe344255c0 | 163791 | 163791 | 15740 | 1310336 | 65536 | 102700357 | 1208993 | 0 | 412548940 | 17705116759270 | 17705116717611 | 17705117021292 | 17705117022834 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7fbe34c6de00 | 0x7fbe34425600 | 229790 | 229790 | 19948 | 1838328 | 65536 | 146389147 | 1727826 | 0 | 587299548 | 17705117062773 | 17705117021292 | 17705117368173 | 17705117369785 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7fbe34c6dc80 | 0x7fbe34425640 | 161901 | 161901 | 15612 | 1295216 | 65536 | 93950455 | 1189186 | 0 | 377539172 | 17705117417744 | 17705117368173 | 17705117672014 | 17705117673607 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7fbe34c6db00 | 0x7fbe34425680 | 297090 | 297090 | 21085 | 2376728 | 65536 | 201047775 | 2267844 | 0 | 805930696 | 17705117714146 | 17705117672014 | 17705118051055 | 17705118052718 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7fbe34c6d980 | 0x7fbe344256c0 | 299427 | 299427 | 22491 | 2395424 | 65536 | 214013246 | 2287950 | 0 | 857786436 | 17705118093117 | 17705118051055 | 17705118442096 | 17705118443908 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7fbe34c6d800 | 0x7fbe34425700 | 164882 | 164882 | 16738 | 1319064 | 65536 | 94506540 | 1211189 | 0 | 379763596 | 17705118484447 | 17705118442096 | 17705118737296 | 17705118738801 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7fbe34c6d680 | 0x7fbe34425740 | 240737 | 240737 | 21103 | 1925904 | 65536 | 151104287 | 1811582 | 0 | 606167648 | 17705118777400 | 17705118737296 | 17705119085937 | 17705119087632 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7fbe37412500 | 0x7fbe34425780 | 161400 | 161400 | 15196 | 1291208 | 65536 | 96249785 | 1188433 | 0 | 386732316 | 17705119135421 | 17705119085937 | 17705119386098 | 17705119387754 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7fbe37412380 | 0x7fbe344257c0 | 297753 | 297753 | 20439 | 2382032 | 65536 | 194437365 | 2269987 | 0 | 779482188 | 17705119429013 | 17705119386098 | 17705119774259 | 17705119775875 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7fbe37412200 | 0x7fbe34425800 | 298452 | 298452 | 20795 | 2387624 | 65536 | 207176029 | 2280628 | 0 | 830439332 | 17705119816624 | 17705119774259 | 17705120154900 | 17705120156525 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7fbe37412080 | 0x7fbe34425840 | 171310 | 171310 | 16484 | 1370488 | 65536 | 97247228 | 1262260 | 0 | 390735836 | 17705120197584 | 17705120154900 | 17705120456341 | 17705120458048 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7fbe34c6df00 | 0x7fbe34425880 | 260352 | 260352 | 21931 | 2082824 | 65536 | 166613700 | 1965916 | 0 | 668212216 | 17705120498797 | 17705120456341 | 17705120811541 | 17705120813229 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7fbe34c6dd80 | 0x7fbe344258c0 | 162073 | 162073 | 15594 | 1296592 | 65536 | 99691185 | 1194157 | 0 | 400493056 | 17705120861668 | 17705120811541 | 17705121113622 | 17705121115311 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7fbe34c6dc00 | 0x7fbe34425900 | 296535 | 296535 | 19281 | 2372288 | 65536 | 193318573 | 2261793 | 0 | 775015300 | 17705121156680 | 17705121113622 | 17705121500183 | 17705121501742 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7fbe34c6da80 | 0x7fbe34425940 | 296783 | 296783 | 20945 | 2374272 | 65536 | 201122669 | 2263037 | 0 | 806227324 | 17705121542681 | 17705121500183 | 17705121881944 | 17705121883502 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7fbe34c6d900 | 0x7fbe34425980 | 180624 | 180624 | 17059 | 1445000 | 65536 | 103961220 | 1334548 | 0 | 417597948 | 17705121923861 | 17705121881944 | 17705122189785 | 17705122192044 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7fbe34c6d780 | 0x7fbe344259c0 | 282033 | 282033 | 23631 | 2256272 | 65536 | 181055427 | 2130146 | 0 | 725969660 | 17705122231383 | 17705122189785 | 17705122565786 | 17705122567395 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7fbe34c6d600 | 0x7fbe34425a00 | 163417 | 163417 | 17227 | 1307344 | 65536 | 100188989 | 1189989 | 0 | 402493468 | 17705122616454 | 17705122565786 | 17705122867387 | 17705122869147 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7fbe37412480 | 0x7fbe34425a40 | 295608 | 295608 | 21130 | 2364872 | 65536 | 206751819 | 2259308 | 0 | 828747444 | 17705122910206 | 17705122867387 | 17705123251388 | 17705123253258 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7fbe37412300 | 0x7fbe34425a80 | 295492 | 295492 | 21036 | 2363944 | 65536 | 195904580 | 2259274 | 0 | 785357496 | 17705123293607 | 17705123251388 | 17705123632988 | 17705123634638 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7fbe37412180 | 0x7fbe34425ac0 | 187650 | 187650 | 18078 | 1501208 | 65536 | 109297364 | 1386923 | 0 | 438939504 | 17705123674617 | 17705123632988 | 17705123950269 | 17705123952190 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7fbe37412000 | 0x7fbe34425b00 | 300632 | 300632 | 23537 | 2405064 | 65536 | 192630205 | 2290360 | 0 | 772277888 | 17705123993359 | 17705123950269 | 17705124333150 | 17705124334800 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7fbe34c6de80 | 0x7fbe34425b40 | 172730 | 172730 | 16239 | 1381848 | 65536 | 99077438 | 1274736 | 0 | 398055336 | 17705124382819 | 17705124333150 | 17705124642111 | 17705124643743 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7fbe34c6dd00 | 0x7fbe34425b80 | 300954 | 300954 | 19218 | 2407640 | 65536 | 138123305 | 2277040 | 0 | 554241304 | 17705124683662 | 17705124642111 | 17705125024992 | 17705125026583 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7fbe34c6db80 | 0x7fbe34425bc0 | 296890 | 296890 | 19487 | 2375128 | 65536 | 191421998 | 2260455 | 0 | 767429080 | 17705125066652 | 17705125024992 | 17705125406273 | 17705125408023 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7fbe34c6da00 | 0x7fbe34425c00 | 206274 | 206274 | 18392 | 1650200 | 65536 | 121668079 | 1537738 | 0 | 488418460 | 17705125448222 | 17705125406273 | 17705125729634 | 17705125731375 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7fbe34c6d880 | 0x7fbe34425c40 | 342009 | 342009 | 25878 | 2736080 | 65536 | 226571056 | 2617009 | 0 | 908049652 | 17705125770974 | 17705125729634 | 17705126138755 | 17705126164064 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7fbe34c6d700 | 0x7fbe34425c80 | 184465 | 184465 | 17499 | 1475728 | 65536 | 110383331 | 1363612 | 0 | 443278440 | 17705126191024 | 17705126138755 | 17705126470755 | 17705126472336 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7fbe37412580 | 0x7fbe34425cc0 | 296110 | 296110 | 19864 | 2368888 | 65536 | 151089341 | 2236464 | 0 | 606108080 | 17705126512945 | 17705126470755 | 17705126856516 | 17705126858247 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7fbe37412400 | 0x7fbe34425d00 | 298293 | 298293 | 20202 | 2386352 | 65536 | 159633758 | 2257555 | 0 | 640291696 | 17705126899276 | 17705126856516 | 17705127243557 | 17705127245317 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7fbe37412280 | 0x7fbe34425d40 | 225369 | 225369 | 19574 | 1802960 | 65536 | 144256915 | 1693260 | 0 | 578780064 | 17705127285016 | 17705127243557 | 17705127587238 | 17705127588888 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7fbe37412100 | 0x7fbe34425d80 | 382283 | 382283 | 28152 | 3058272 | 65536 | 258512765 | 2938287 | 0 | 1035804584 | 17705127630277 | 17705127587238 | 17705128024039 | 17705128045157 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7fbe34c6df80 | 0x7fbe34425dc0 | 212577 | 212577 | 18974 | 1700624 | 65536 | 123126580 | 1587500 | 0 | 494261720 | 17705128074826 | 17705128024039 | 17705128356360 | 17705128358029 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7fbe34c6de00 | 0x7fbe34425e00 | 305893 | 305893 | 22731 | 2447152 | 65536 | 193367890 | 2328700 | 0 | 775228268 | 17705128398848 | 17705128356360 | 17705128750921 | 17705128771599 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7fbe34c6dc80 | 0x7fbe34425e40 | 309188 | 309188 | 23345 | 2473512 | 65536 | 167706419 | 2335877 | 0 | 672592520 | 17705128791988 | 17705128750921 | 17705129151722 | 17705129169409 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7fbe34c6db00 | 0x7fbe34425e80 | 266125 | 266125 | 21615 | 2129008 | 65536 | 185080522 | 2018299 | 0 | 742090528 | 17705129192418 | 17705129151722 | 17705129513803 | 17705129515370 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7fbe34c6d980 | 0x7fbe34425ec0 | 463365 | 463365 | 32817 | 3706928 | 65536 | 333628997 | 3579897 | 0 | 1336279868 | 17705129554619 | 17705129513803 | 17705130001804 | 17705130018847 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7fbe34c6d800 | 0x7fbe34425f00 | 243765 | 243765 | 20746 | 1950128 | 65536 | 157317587 | 1841101 | 0 | 631023104 | 17705130052196 | 17705130001804 | 17705130359725 | 17705130361499 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7fbe34c6d680 | 0x7fbe34425f40 | 334611 | 334611 | 23646 | 2676896 | 65536 | 206470927 | 2559624 | 0 | 827644704 | 17705130401418 | 17705130359725 | 17705130773006 | 17705130819257 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7fbe37412500 | 0x7fbe34425f80 | 330532 | 330532 | 23907 | 2644264 | 65536 | 201129855 | 2514099 | 0 | 806281180 | 17705130829467 | 17705130773006 | 17705131206127 | 17705131248566 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7fbe37412380 | 0x7fbe34425fc0 | 307350 | 307350 | 23610 | 2458808 | 65536 | 200414154 | 2349004 | 0 | 803421972 | 17705131258526 | 17705131206127 | 17705131620848 | 17705131622387 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7fbe37412200 | 0x7fbe34426000 | 542832 | 542832 | 35572 | 4342664 | 65536 | 400074502 | 4228183 | 0 | 1602063624 | 17705131662976 | 17705131620848 | 17705132160690 | 17705132178243 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7fbe37412080 | 0x7fbe34426040 | 272520 | 272520 | 21936 | 2180168 | 65536 | 180081253 | 2067857 | 0 | 722076112 | 17705132211162 | 17705132160690 | 17705132530770 | 17705132532384 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7fbe34c6df00 | 0x7fbe34426080 | 367822 | 367822 | 28379 | 2942584 | 65536 | 237725434 | 2825705 | 0 | 952687136 | 17705132577933 | 17705132530770 | 17705132967092 | 17705132985653 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7fbe34c6dd80 | 0x7fbe344260c0 | 367479 | 367479 | 29244 | 2939840 | 65536 | 257952377 | 2827206 | 0 | 1033580388 | 17705133008672 | 17705132967092 | 17705133401653 | 17705133418842 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7fbe34c6dc00 | 0x7fbe34426100 | 348153 | 348153 | 25752 | 2785232 | 65536 | 234501716 | 2674331 | 0 | 939785488 | 17705133442882 | 17705133401653 | 17705133816214 | 17705133834462 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7fbe34c6da80 | 0x7fbe34426140 | 624609 | 624609 | 40246 | 4996880 | 65536 | 470954194 | 4878170 | 0 | 1885582068 | 17705133858311 | 17705133816214 | 17705134407415 | 17705134427867 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7fbe34c6d900 | 0x7fbe34426180 | 304469 | 304469 | 23554 | 2435760 | 65536 | 191294333 | 2320826 | 0 | 766940268 | 17705134458586 | 17705134407415 | 17705134807736 | 17705134809387 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7fbe34c6d780 | 0x7fbe344261c0 | 400571 | 400571 | 27503 | 3204576 | 65536 | 273235204 | 3090836 | 0 | 1094730484 | 17705134850126 | 17705134807736 | 17705135261657 | 17705135306605 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7fbe34c6d600 | 0x7fbe34426200 | 394317 | 394317 | 27737 | 3154544 | 65536 | 289375998 | 3043016 | 0 | 1159284056 | 17705135317064 | 17705135261657 | 17705135737178 | 17705135780083 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7fbe37412480 | 0x7fbe34426240 | 389039 | 389039 | 27751 | 3112320 | 65536 | 270868481 | 2994921 | 0 | 1085243420 | 17705135790393 | 17705135737178 | 17705136205980 | 17705136247691 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7fbe37412300 | 0x7fbe34426280 | 719713 | 719713 | 44893 | 5757712 | 65536 | 533483141 | 5630414 | 0 | 2135673152 | 17705136258251 | 17705136205980 | 17705136881181 | 17705136898805 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7fbe37412180 | 0x7fbe344262c0 | 364804 | 364804 | 26729 | 2918440 | 65536 | 253731856 | 2801940 | 0 | 1016690632 | 17705136931714 | 17705136881181 | 17705137311902 | 17705137330014 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7fbe37412000 | 0x7fbe34426300 | 470662 | 470662 | 31731 | 3765304 | 65536 | 348474782 | 3656307 | 0 | 1395684328 | 17705137354433 | 17705137311902 | 17705137813343 | 17705137830031 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7fbe34c6de80 | 0x7fbe34426340 | 471735 | 471735 | 31738 | 3773888 | 65536 | 348744261 | 3667747 | 0 | 1396758156 | 17705137855951 | 17705137813343 | 17705138325825 | 17705138372778 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7fbe34c6dd00 | 0x7fbe34426380 | 483384 | 483384 | 32673 | 3867080 | 65536 | 350520518 | 3753458 | 0 | 1403822472 | 17705138383487 | 17705138325825 | 17705138854306 | 17705138896224 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7fbe34c6db80 | 0x7fbe344263c0 | 880602 | 880602 | 53482 | 7044824 | 65536 | 673582641 | 6928580 | 0 | 2696072056 | 17705138906824 | 17705138854306 | 17705139634468 | 17705139676415 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7fbe34c6da00 | 0x7fbe34426400 | 427363 | 427363 | 29816 | 3418912 | 65536 | 315194033 | 3301516 | 0 | 1262547700 | 17705139694814 | 17705139634468 | 17705140121669 | 17705140163292 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7fbe34c6d880 | 0x7fbe34426440 | 551204 | 551204 | 35631 | 4409640 | 65536 | 402181813 | 4297049 | 0 | 1610516100 | 17705140173812 | 17705140121669 | 17705140695911 | 17705140737608 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7fbe34c6d700 | 0x7fbe34426480 | 552450 | 552450 | 36187 | 4419608 | 65536 | 416522896 | 4309135 | 0 | 1667877068 | 17705140748028 | 17705140695911 | 17705141268072 | 17705141286044 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7fbe37412580 | 0x7fbe344264c0 | 563449 | 563449 | 36252 | 4507600 | 65536 | 413502489 | 4390877 | 0 | 1655753852 | 17705141309564 | 17705141268072 | 17705141819593 | 17705141836590 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7fbe37412400 | 0x7fbe34426500 | 1042522 | 1042522 | 61930 | 8340184 | 65536 | 802571182 | 8220836 | 0 | 3212027460 | 17705141861850 | 17705141819593 | 17705142690796 | 17705142714718 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7fbe37412280 | 0x7fbe34426540 | 721252 | 721252 | 45160 | 5770024 | 65536 | 551598171 | 5656630 | 0 | 2208133300 | 17705142742378 | 17705142690796 | 17705143346797 | 17705143390841 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7fbe37412100 | 0x7fbe34426580 | 722795 | 722795 | 44561 | 5782368 | 65536 | 541632591 | 5671856 | 0 | 2168270816 | 17705143401761 | 17705143346797 | 17705144049679 | 17705144092564 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7fbe34c6df80 | 0x7fbe344265c0 | 722584 | 722584 | 44868 | 5780680 | 65536 | 548449635 | 5666470 | 0 | 2195539584 | 17705144102904 | 17705144049621 | 17705144747862 | 17705144791776 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7fbe34c6de00 | 0x7fbe34426600 | 727081 | 727081 | 45711 | 5816656 | 65536 | 552278183 | 5696365 | 0 | 2210854028 | 17705144802426 | 17705144747862 | 17705145436823 | 17705145455650 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7fbe34c6dc80 | 0x7fbe34426640 | 1370959 | 1370959 | 78429 | 10967680 | 65536 | 1057064554 | 10818261 | 0 | 4230000200 | 17705145478759 | 17705145436823 | 17705146524666 | 17705146570132 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7fbe34c6db00 | 0x7fbe34426680 | 1371134 | 1371134 | 77956 | 10969080 | 65536 | 1082146997 | 10850450 | 0 | 4330330120 | 17705146589941 | 17705146524666 | 17705147622429 | 17705147686994 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7fbe34c6d980 | 0x7fbe344266c0 | 1375712 | 1375712 | 77743 | 11005704 | 65536 | 1064506926 | 10864442 | 0 | 4259769792 | 17705147698673 | 17705147622429 | 17705148776511 | 17705148841195 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7fbe34c6d800 | 0x7fbe34426700 | 1370633 | 1370633 | 76996 | 10965072 | 65536 | 1070389452 | 10848595 | 0 | 4283298360 | 17705148852074 | 17705148776511 | 17705149917314 | 17705149982126 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7fbe34c6d680 | 0x7fbe34426740 | 1377206 | 1377206 | 77139 | 11017656 | 65536 | 1084930546 | 10890544 | 0 | 4341465248 | 17705149992916 | 17705149917314 | 17705151048677 | 17705151120567 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7fbe37412500 | 0x7fbe34426780 | 2662992 | 2662992 | 142609 | 21303944 | 65536 | 2128585524 | 21187086 | 0 | 8516083436 | 17705151131717 | 17705151048677 | 17705153025481 | 17705153090388 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7fbe37412380 | 0x7fbe344267c0 | 2670670 | 2670670 | 142588 | 21365368 | 65536 | 2126440678 | 21228281 | 0 | 8507503948 | 17705153108947 | 17705153025481 | 17705154959726 | 17705155029189 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7fbe37412200 | 0x7fbe34426800 | 2670846 | 2670846 | 143401 | 21366776 | 65536 | 2132817250 | 21244816 | 0 | 8533009492 | 17705155040309 | 17705154959726 | 17705156957651 | 17705157022759 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7fbe37412080 | 0x7fbe34426840 | 2672408 | 2672408 | 143329 | 21379272 | 65536 | 2121679110 | 21237892 | 0 | 8488457088 | 17705157033139 | 17705156957651 | 17705158946935 | 17705158987970 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7fbe34c6df00 | 0x7fbe34426880 | 2673456 | 2673456 | 143914 | 21387656 | 65536 | 2120709336 | 21258084 | 0 | 8484580216 | 17705158998950 | 17705158946935 | 17705160862940 | 17705160929781 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 229609 | 229609 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7fbe34c6dd80 | 0x7fbe344268c0 | 5256902 | 5256902 | 274219 | 42055224 | 65536 | 4232108035 | 41931571 | 0 | 16930173956 | 17705160940141 | 17705160862940 | 17705164488388 | 17705164559200 |