44 KiB
44 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | GRBM_COUNT | GRBM_GUI_ACTIVE | SQ_WAVES | SQ_IFETCH | SQ_IFETCH_LEVEL | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 223297 | 223297 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7fc57a604280 | 379284 | 379284 | 524288 | 4718592 | 681163 | 76310828 | 17598097140845 | 17597387743185 | 17598246526395 | 17598246639545 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 223297 | 223297 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7fc57a623f80 | 33251 | 33251 | 512 | 8192 | 6010 | 679448 | 17598251787224 | 17598246526395 | 17598251919198 | 17598251924230 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7fc57d663380 | 0x7fc57a623fc0 | 163594 | 163594 | 65536 | 917504 | 141997 | 15950860 | 17598251961259 | 17598251919198 | 17598252301279 | 17598252303751 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7fc57d663200 | 0x7fc57a624000 | 310676 | 310676 | 65536 | 1114112 | 172028 | 19257004 | 17598252343430 | 17598252301279 | 17598252724159 | 17598252726940 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7fc57d663080 | 0x7fc57a624040 | 309020 | 309020 | 65536 | 917504 | 138926 | 15550360 | 17598252763489 | 17598252724159 | 17598253136799 | 17598253139200 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7fc57b003f00 | 0x7fc57a624080 | 164976 | 164976 | 65536 | 1048576 | 157741 | 17738236 | 17598253175849 | 17598253136799 | 17598253450240 | 17598253452452 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7fc57b003d80 | 0x7fc57a6240c0 | 163529 | 163529 | 65536 | 983040 | 148002 | 16556188 | 17598253487311 | 17598253450240 | 17598253764800 | 17598253767114 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7fc57b003c00 | 0x7fc57a624100 | 162196 | 162196 | 65536 | 1114112 | 162834 | 18259480 | 17598253814412 | 17598253764800 | 17598254076000 | 17598254086866 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7fc57b003a80 | 0x7fc57a624140 | 309800 | 309800 | 65536 | 1310720 | 206086 | 23129588 | 17598254114915 | 17598254076000 | 17598254485600 | 17598254487735 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7fc57b003900 | 0x7fc57a624180 | 306944 | 306944 | 65536 | 1179648 | 177127 | 19842568 | 17598254522574 | 17598254485600 | 17598254905121 | 17598254906905 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7fc57b003780 | 0x7fc57a6241c0 | 164084 | 164084 | 65536 | 1245184 | 189398 | 21184652 | 17598254940604 | 17598254905121 | 17598255192801 | 17598255194607 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7fc57b003600 | 0x7fc57a624200 | 162975 | 162975 | 65536 | 1245184 | 186637 | 20929980 | 17598255228957 | 17598255192801 | 17598255477761 | 17598255479620 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7fc57d663480 | 0x7fc57a624240 | 163260 | 163260 | 65536 | 1245184 | 188086 | 21072920 | 17598255522339 | 17598255477761 | 17598255766241 | 17598255768043 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7fc57d663300 | 0x7fc57a624280 | 308005 | 308005 | 65536 | 1441792 | 215714 | 24176728 | 17598255805652 | 17598255766241 | 17598256148642 | 17598256150373 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7fc57d663180 | 0x7fc57a6242c0 | 308010 | 308010 | 65536 | 1310720 | 199745 | 22367996 | 17598256185452 | 17598256148642 | 17598256525122 | 17598256526884 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7fc57d663000 | 0x7fc57a624300 | 163878 | 163878 | 65536 | 1376256 | 206041 | 23082112 | 17598256561523 | 17598256525122 | 17598256815042 | 17598256816776 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7fc57b003e80 | 0x7fc57a624340 | 163340 | 163340 | 65536 | 1441792 | 217864 | 24335144 | 17598256851235 | 17598256815042 | 17598257106722 | 17598257108309 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7fc57b003d00 | 0x7fc57a624380 | 162064 | 162064 | 65536 | 1310720 | 196821 | 22019008 | 17598257150368 | 17598257106722 | 17598257405123 | 17598257406731 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7fc57b003b80 | 0x7fc57a6243c0 | 308441 | 308441 | 65536 | 1572864 | 233127 | 26082088 | 17598257442950 | 17598257405123 | 17598257779363 | 17598257781082 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7fc57b003a00 | 0x7fc57a624400 | 304557 | 304557 | 65536 | 1441792 | 208665 | 23365924 | 17598257815321 | 17598257779363 | 17598258155363 | 17598258157062 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7fc57b003880 | 0x7fc57a624440 | 162559 | 162559 | 65536 | 1507328 | 226838 | 25406660 | 17598258192311 | 17598258155363 | 17598258447363 | 17598258449185 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7fc57b003700 | 0x7fc57a624480 | 163057 | 163057 | 65536 | 1638400 | 243091 | 27262240 | 17598258484414 | 17598258447363 | 17598258737924 | 17598258739588 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7fc57d663580 | 0x7fc57a6244c0 | 161757 | 161757 | 65536 | 1441792 | 214563 | 24030252 | 17598258783146 | 17598258737924 | 17598259034244 | 17598259035990 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7fc57d663400 | 0x7fc57a624500 | 305217 | 305217 | 65536 | 1703936 | 252073 | 28235268 | 17598259072069 | 17598259034244 | 17598259410084 | 17598259411920 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7fc57d663280 | 0x7fc57a624540 | 303171 | 303171 | 65536 | 1572864 | 232908 | 26123324 | 17598259447019 | 17598259410084 | 17598259783844 | 17598259785641 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7fc57d663100 | 0x7fc57a624580 | 161758 | 161758 | 65536 | 1638400 | 243285 | 27310660 | 17598259820640 | 17598259783844 | 17598260071845 | 17598260073763 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7fc57b003f80 | 0x7fc57a6245c0 | 160538 | 160538 | 65536 | 1835008 | 270103 | 30322488 | 17598260108543 | 17598260071845 | 17598260358725 | 17598260360476 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7fc57b003e00 | 0x7fc57a624600 | 163862 | 163862 | 65536 | 1507328 | 224594 | 25081836 | 17598260402215 | 17598260358725 | 17598260656645 | 17598260658339 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7fc57b003c80 | 0x7fc57a624640 | 306084 | 306084 | 65536 | 1835008 | 271175 | 30248500 | 17598260694318 | 17598260656645 | 17598261046085 | 17598261047719 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7fc57b003b00 | 0x7fc57a624680 | 307380 | 307380 | 65536 | 1703936 | 249875 | 27955212 | 17598261082628 | 17598261046085 | 17598261424326 | 17598261425939 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7fc57b003980 | 0x7fc57a6246c0 | 163238 | 163238 | 65536 | 1769472 | 265219 | 29706488 | 17598261460008 | 17598261424326 | 17598261712486 | 17598261714362 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7fc57b003800 | 0x7fc57a624700 | 162860 | 162860 | 65536 | 2031616 | 303442 | 33955492 | 17598261748951 | 17598261712486 | 17598262001606 | 17598262003354 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7fc57b003680 | 0x7fc57a624740 | 161890 | 161890 | 65536 | 1638400 | 263222 | 29471680 | 17598262044743 | 17598262001606 | 17598262297446 | 17598262299177 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7fc57d663500 | 0x7fc57a624780 | 304550 | 304550 | 65536 | 1966080 | 288953 | 32377204 | 17598262334206 | 17598262297446 | 17598262682727 | 17598262684327 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7fc57d663380 | 0x7fc57a6247c0 | 304419 | 304419 | 65536 | 1835008 | 279877 | 31253588 | 17598262719856 | 17598262682727 | 17598263061447 | 17598263063217 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7fc57d663200 | 0x7fc57a624800 | 162792 | 162792 | 65536 | 1900544 | 285508 | 31920360 | 17598263098776 | 17598263061447 | 17598263352487 | 17598263354190 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7fc57d663080 | 0x7fc57a624840 | 163607 | 163607 | 65536 | 2228224 | 346629 | 38837308 | 17598263390639 | 17598263352487 | 17598263644167 | 17598263645983 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7fc57b003f00 | 0x7fc57a624880 | 161512 | 161512 | 65536 | 1703936 | 258557 | 28939128 | 17598263688412 | 17598263644167 | 17598263940008 | 17598263941695 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7fc57b003d80 | 0x7fc57a6248c0 | 304171 | 304171 | 65536 | 2097152 | 311294 | 34802656 | 17598263978294 | 17598263940008 | 17598264318088 | 17598264320046 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7fc57b003c00 | 0x7fc57a624900 | 303740 | 303740 | 65536 | 1966080 | 285331 | 31960944 | 17598264354835 | 17598264318088 | 17598264698408 | 17598264699996 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7fc57b003a80 | 0x7fc57a624940 | 161837 | 161837 | 65536 | 2031616 | 305326 | 34228756 | 17598264734605 | 17598264698408 | 17598264988488 | 17598264990239 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7fc57b003900 | 0x7fc57a624980 | 163205 | 163205 | 65536 | 2424832 | 361416 | 40511376 | 17598265024908 | 17598264988488 | 17598265282729 | 17598265284531 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7fc57b003780 | 0x7fc57a6249c0 | 161312 | 161312 | 65536 | 1835008 | 274162 | 30739912 | 17598265326330 | 17598265282729 | 17598265578409 | 17598265580184 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7fc57b003600 | 0x7fc57a624a00 | 306564 | 306564 | 65536 | 2228224 | 328050 | 36721992 | 17598265616243 | 17598265578409 | 17598265955529 | 17598265957354 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7fc57d663480 | 0x7fc57a624a40 | 302434 | 302434 | 65536 | 2097152 | 309303 | 34586432 | 17598265992943 | 17598265955529 | 17598266337609 | 17598266339694 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7fc57d663300 | 0x7fc57a624a80 | 161867 | 161867 | 65536 | 2162688 | 318107 | 35667196 | 17598266374213 | 17598266337609 | 17598266627530 | 17598266629077 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7fc57d663180 | 0x7fc57a624ac0 | 161314 | 161314 | 65536 | 2621440 | 397899 | 44557408 | 17598266664246 | 17598266627530 | 17598266916650 | 17598266918410 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7fc57d663000 | 0x7fc57a624b00 | 160569 | 160569 | 65536 | 1966080 | 292828 | 32729708 | 17598266960678 | 17598266916650 | 17598267207370 | 17598267209012 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7fc57b003e80 | 0x7fc57a624b40 | 303754 | 303754 | 65536 | 2359296 | 347958 | 38955816 | 17598267243241 | 17598267207370 | 17598267584010 | 17598267585722 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7fc57b003d00 | 0x7fc57a624b80 | 301553 | 301553 | 65536 | 2228224 | 330564 | 37009284 | 17598267620532 | 17598267584010 | 17598267968971 | 17598267970733 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7fc57b003b80 | 0x7fc57a624bc0 | 161840 | 161840 | 65536 | 2293760 | 341860 | 38219528 | 17598268006032 | 17598267968971 | 17598268259851 | 17598268261575 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7fc57b003a00 | 0x7fc57a624c00 | 163433 | 163433 | 65536 | 2752512 | 418160 | 46830460 | 17598268297364 | 17598268259851 | 17598268553131 | 17598268555078 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7fc57b003880 | 0x7fc57a624c40 | 162472 | 162472 | 65536 | 2031616 | 327412 | 36578768 | 17598268597427 | 17598268553131 | 17598268849131 | 17598268850910 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7fc57b003700 | 0x7fc57a624c80 | 300606 | 300606 | 65536 | 2490368 | 374186 | 41850496 | 17598268885249 | 17598268849131 | 17598269224652 | 17598269226301 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7fc57d663580 | 0x7fc57a624cc0 | 301210 | 301210 | 65536 | 2359296 | 349917 | 39249832 | 17598269262130 | 17598269224652 | 17598269605612 | 17598269607311 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7fc57d663400 | 0x7fc57a624d00 | 164759 | 164759 | 65536 | 2424832 | 402021 | 45040004 | 17598269642290 | 17598269605612 | 17598269900012 | 17598269901653 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7fc57d663280 | 0x7fc57a624d40 | 168038 | 168038 | 65536 | 2949120 | 441481 | 49485848 | 17598269937442 | 17598269900012 | 17598270200332 | 17598270202336 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7fc57d663100 | 0x7fc57a624d80 | 162222 | 162222 | 65536 | 2162688 | 326133 | 36467264 | 17598270244505 | 17598270200332 | 17598270503213 | 17598270505038 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7fc57b003f80 | 0x7fc57a624dc0 | 300132 | 300132 | 65536 | 2621440 | 403067 | 45203720 | 17598270542417 | 17598270503213 | 17598270879373 | 17598270881049 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7fc57b003e00 | 0x7fc57a624e00 | 297342 | 297342 | 65536 | 2490368 | 363422 | 40682956 | 17598270916698 | 17598270879373 | 17598271251693 | 17598271253479 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7fc57b003c80 | 0x7fc57a624e40 | 161790 | 161790 | 65536 | 2555904 | 385035 | 43147484 | 17598271288108 | 17598271251693 | 17598271555373 | 17598271557111 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7fc57b003b00 | 0x7fc57a624e80 | 175315 | 175315 | 65536 | 3145728 | 465475 | 52218840 | 17598271592291 | 17598271555373 | 17598271857134 | 17598271858854 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7fc57b003980 | 0x7fc57a624ec0 | 160832 | 160832 | 65536 | 2228224 | 327517 | 36700732 | 17598271901353 | 17598271857134 | 17598272152334 | 17598272154216 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7fc57b003800 | 0x7fc57a624f00 | 301078 | 301078 | 65536 | 2752512 | 406340 | 45513568 | 17598272188625 | 17598272152334 | 17598272528174 | 17598272529867 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7fc57b003680 | 0x7fc57a624f40 | 300842 | 300842 | 65536 | 2621440 | 390699 | 43686036 | 17598272564506 | 17598272528174 | 17598272903854 | 17598272905627 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7fc57d663500 | 0x7fc57a624f80 | 160830 | 160830 | 65536 | 2686976 | 395360 | 44292492 | 17598272939826 | 17598272903854 | 17598273198735 | 17598273200550 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7fc57d663380 | 0x7fc57a624fc0 | 182347 | 182347 | 65536 | 3342336 | 500899 | 56027040 | 17598273235849 | 17598273198735 | 17598273504975 | 17598273506752 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7fc57d663200 | 0x7fc57a625000 | 160788 | 160788 | 65536 | 2359296 | 351290 | 39283156 | 17598273561021 | 17598273504975 | 17598273796495 | 17598273798285 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7fc57d663080 | 0x7fc57a625040 | 300956 | 300956 | 65536 | 2883584 | 429814 | 48155448 | 17598273834214 | 17598273796495 | 17598274177935 | 17598274180075 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7fc57b003f00 | 0x7fc57a625080 | 301294 | 301294 | 65536 | 2686976 | 397384 | 44563000 | 17598274216954 | 17598274177935 | 17598274566416 | 17598274568035 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7fc57b003d80 | 0x7fc57a6250c0 | 161951 | 161951 | 65536 | 2818048 | 427963 | 47980996 | 17598274602984 | 17598274566416 | 17598274860656 | 17598274862508 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7fc57b003c00 | 0x7fc57a625100 | 192746 | 192746 | 65536 | 3538944 | 532322 | 59602316 | 17598274897647 | 17598274860656 | 17598275170736 | 17598275172540 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7fc57b003a80 | 0x7fc57a625140 | 161368 | 161368 | 65536 | 2424832 | 362958 | 40605932 | 17598275214489 | 17598275170736 | 17598275462896 | 17598275464632 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7fc57b003900 | 0x7fc57a625180 | 298410 | 298410 | 65536 | 3014656 | 455330 | 51053144 | 17598275499312 | 17598275462896 | 17598275843537 | 17598275845343 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7fc57b003780 | 0x7fc57a6251c0 | 299703 | 299703 | 65536 | 2818048 | 414678 | 46518540 | 17598275882412 | 17598275843537 | 17598276219537 | 17598276221333 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7fc57b003600 | 0x7fc57a625200 | 163032 | 163032 | 65536 | 2949120 | 440286 | 49312880 | 17598276255762 | 17598276219537 | 17598276511057 | 17598276512946 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7fc57d663480 | 0x7fc57a625240 | 201001 | 201001 | 65536 | 3735552 | 563175 | 63022556 | 17598276548175 | 17598276511057 | 17598276828337 | 17598276830078 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7fc57d663300 | 0x7fc57a625280 | 160772 | 160772 | 65536 | 2555904 | 384541 | 43027336 | 17598276872717 | 17598276828337 | 17598277120498 | 17598277122240 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7fc57d663180 | 0x7fc57a6252c0 | 301399 | 301399 | 65536 | 3145728 | 468135 | 52410600 | 17598277157359 | 17598277120498 | 17598277502898 | 17598277504591 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7fc57d663000 | 0x7fc57a625300 | 298032 | 298032 | 65536 | 2949120 | 438122 | 49043508 | 17598277540630 | 17598277502898 | 17598277878898 | 17598277880551 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7fc57b003e80 | 0x7fc57a625340 | 161173 | 161173 | 65536 | 3080192 | 458154 | 51258132 | 17598277914490 | 17598277878898 | 17598278168978 | 17598278170684 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7fc57b003d00 | 0x7fc57a625380 | 210176 | 210176 | 65536 | 3932160 | 584119 | 65374800 | 17598278206013 | 17598278168978 | 17598278501139 | 17598278502945 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7fc57b003b80 | 0x7fc57a6253c0 | 160977 | 160977 | 65536 | 2621440 | 400352 | 44855392 | 17598278545574 | 17598278501139 | 17598278792499 | 17598278794318 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7fc57b003a00 | 0x7fc57a625400 | 298340 | 298340 | 65536 | 3276800 | 486004 | 54426996 | 17598278828297 | 17598278792499 | 17598279167379 | 17598279169138 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7fc57b003880 | 0x7fc57a625440 | 298053 | 298053 | 65536 | 3080192 | 458075 | 51352276 | 17598279204357 | 17598279167379 | 17598279543539 | 17598279545219 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7fc57b003700 | 0x7fc57a625480 | 160841 | 160841 | 65536 | 3211264 | 484596 | 54284288 | 17598279580298 | 17598279543539 | 17598279838260 | 17598279840021 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7fc57d663580 | 0x7fc57a6254c0 | 218152 | 218152 | 65536 | 4128768 | 616431 | 68878940 | 17598279875190 | 17598279838260 | 17598280167220 | 17598280168983 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7fc57d663400 | 0x7fc57a625500 | 160567 | 160567 | 65536 | 2752512 | 417745 | 46799652 | 17598280212322 | 17598280167220 | 17598280459380 | 17598280461125 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7fc57d663280 | 0x7fc57a625540 | 296492 | 296492 | 65536 | 3407872 | 505502 | 56585432 | 17598280496844 | 17598280459380 | 17598280836660 | 17598280838476 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7fc57d663100 | 0x7fc57a625580 | 298105 | 298105 | 65536 | 3211264 | 482413 | 54009352 | 17598280872815 | 17598280836660 | 17598281216181 | 17598281217926 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7fc57b003f80 | 0x7fc57a6255c0 | 161904 | 161904 | 65536 | 3276800 | 506894 | 56757116 | 17598281253465 | 17598281216181 | 17598281509781 | 17598281511629 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7fc57b003e00 | 0x7fc57a625600 | 229113 | 229113 | 65536 | 4325376 | 650894 | 72975492 | 17598281547028 | 17598281509781 | 17598281844821 | 17598281846640 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7fc57b003c80 | 0x7fc57a625640 | 160282 | 160282 | 65536 | 2818048 | 426339 | 47792836 | 17598281888169 | 17598281844821 | 17598282136981 | 17598282139263 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7fc57b003b00 | 0x7fc57a625680 | 295972 | 295972 | 65536 | 3538944 | 527007 | 59108996 | 17598282174272 | 17598282136981 | 17598282516502 | 17598282518193 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7fc57b003980 | 0x7fc57a6256c0 | 297070 | 297070 | 65536 | 3407872 | 503507 | 56377296 | 17598282553482 | 17598282516502 | 17598282895062 | 17598282896803 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7fc57b003800 | 0x7fc57a625700 | 164238 | 164238 | 65536 | 3407872 | 517939 | 58036956 | 17598282932012 | 17598282895062 | 17598283192022 | 17598283193786 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7fc57b003680 | 0x7fc57a625740 | 239990 | 239990 | 65536 | 4521984 | 674318 | 75539916 | 17598283228455 | 17598283192022 | 17598283534422 | 17598283536147 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7fc57d663500 | 0x7fc57a625780 | 160084 | 160084 | 65536 | 3014656 | 455348 | 50937812 | 17598283578066 | 17598283534422 | 17598283832983 | 17598283834680 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7fc57d663380 | 0x7fc57a6257c0 | 296176 | 296176 | 65536 | 3801088 | 570136 | 63874748 | 17598283869599 | 17598283832983 | 17598284213623 | 17598284215390 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7fc57d663200 | 0x7fc57a625800 | 295022 | 295022 | 65536 | 3670016 | 555402 | 62225088 | 17598284251499 | 17598284213623 | 17598284589463 | 17598284591170 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7fc57d663080 | 0x7fc57a625840 | 169128 | 169128 | 65536 | 3670016 | 550903 | 61687964 | 17598284626840 | 17598284589463 | 17598284884983 | 17598284886903 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7fc57b003f00 | 0x7fc57a625880 | 257246 | 257246 | 65536 | 4915200 | 736660 | 82515752 | 17598284922352 | 17598284884983 | 17598285236344 | 17598285238084 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7fc57b003d80 | 0x7fc57a6258c0 | 160272 | 160272 | 65536 | 3145728 | 466172 | 52297568 | 17598285281643 | 17598285236344 | 17598285527704 | 17598285529467 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7fc57b003c00 | 0x7fc57a625900 | 295110 | 295110 | 65536 | 4063232 | 616673 | 68984692 | 17598285563896 | 17598285527704 | 17598285904664 | 17598285906377 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7fc57b003a80 | 0x7fc57a625940 | 294604 | 294604 | 65536 | 3932160 | 591796 | 66248272 | 17598285941266 | 17598285904664 | 17598286288345 | 17598286290217 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7fc57b003900 | 0x7fc57a625980 | 177260 | 177260 | 65536 | 3932160 | 602053 | 67358980 | 17598286325246 | 17598286288345 | 17598286599225 | 17598286600979 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7fc57b003780 | 0x7fc57a6259c0 | 278792 | 278792 | 65536 | 5308416 | 794875 | 88965396 | 17598286636188 | 17598286599225 | 17598286968025 | 17598286969640 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7fc57b003600 | 0x7fc57a625a00 | 161506 | 161506 | 65536 | 3342336 | 505771 | 56643040 | 17598287011649 | 17598286968025 | 17598287265945 | 17598287267622 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7fc57d663480 | 0x7fc57a625a40 | 295276 | 295276 | 65536 | 4325376 | 651002 | 72908412 | 17598287304191 | 17598287265945 | 17598287645946 | 17598287647843 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7fc57d663300 | 0x7fc57a625a80 | 293808 | 293808 | 65536 | 4194304 | 625995 | 70176864 | 17598287682742 | 17598287645946 | 17598288020506 | 17598288022153 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7fc57d663180 | 0x7fc57a625ac0 | 186443 | 186443 | 65536 | 4194304 | 630271 | 70642760 | 17598288057092 | 17598288020506 | 17598288326586 | 17598288328415 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7fc57d663000 | 0x7fc57a625b00 | 299015 | 299015 | 65536 | 5701632 | 850965 | 95261900 | 17598288363704 | 17598288326586 | 17598288709466 | 17598288711106 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7fc57b003e80 | 0x7fc57a625b40 | 171741 | 171741 | 65536 | 3735552 | 574939 | 64440664 | 17598288753564 | 17598288709466 | 17598289014267 | 17598289015908 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7fc57b003d00 | 0x7fc57a625b80 | 296283 | 296283 | 65536 | 4849664 | 751758 | 84280972 | 17598289050267 | 17598289014267 | 17598289390587 | 17598289392308 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7fc57b003b80 | 0x7fc57a625bc0 | 296308 | 296308 | 65536 | 4718592 | 742455 | 83196816 | 17598289426447 | 17598289390587 | 17598289776027 | 17598289777868 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7fc57b003a00 | 0x7fc57a625c00 | 206779 | 206779 | 65536 | 4718592 | 727697 | 81548732 | 17598289812267 | 17598289776027 | 17598290095227 | 17598290099930 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7fc57b003880 | 0x7fc57a625c40 | 340221 | 340221 | 65536 | 6488064 | 972878 | 108993016 | 17598290132559 | 17598290095227 | 17598290500988 | 17598290523689 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7fc57b003700 | 0x7fc57a625c80 | 184260 | 184260 | 65536 | 4128768 | 613745 | 68748960 | 17598290545309 | 17598290500988 | 17598290814588 | 17598290816392 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7fc57d663580 | 0x7fc57a625cc0 | 295663 | 295663 | 65536 | 5373952 | 850650 | 95258960 | 17598290850901 | 17598290814588 | 17598291194108 | 17598291195942 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7fc57d663400 | 0x7fc57a625d00 | 295680 | 295680 | 65536 | 5242880 | 820925 | 92106848 | 17598291230841 | 17598291194108 | 17598291573949 | 17598291575513 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7fc57d663280 | 0x7fc57a625d40 | 225121 | 225121 | 65536 | 5242880 | 789646 | 88496888 | 17598291610022 | 17598291573949 | 17598291908829 | 17598291910534 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7fc57d663100 | 0x7fc57a625d80 | 379382 | 379382 | 65536 | 7274496 | 1094455 | 122617096 | 17598291945693 | 17598291908829 | 17598292340509 | 17598292361623 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7fc57b003f80 | 0x7fc57a625dc0 | 210285 | 210285 | 65536 | 4915200 | 738800 | 82677044 | 17598292384942 | 17598292340509 | 17598292671869 | 17598292673465 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7fc57b003e00 | 0x7fc57a625e00 | 304476 | 304476 | 65536 | 6422528 | 996530 | 111553876 | 17598292708054 | 17598292671869 | 17598293063870 | 17598293065545 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7fc57b003c80 | 0x7fc57a625e40 | 309795 | 309795 | 65536 | 6291456 | 1008725 | 113005204 | 17598293100184 | 17598293063870 | 17598293454270 | 17598293456575 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7fc57b003b00 | 0x7fc57a625e80 | 265016 | 265016 | 65536 | 6291456 | 960955 | 107642448 | 17598293490034 | 17598293454270 | 17598293808670 | 17598293810446 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7fc57b003980 | 0x7fc57a625ec0 | 460468 | 460468 | 65536 | 8847360 | 1340578 | 150097020 | 17598293845135 | 17598293808670 | 17598294285151 | 17598294307633 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7fc57b003800 | 0x7fc57a625f00 | 244266 | 244266 | 65536 | 5701632 | 861018 | 96425368 | 17598294328973 | 17598294285151 | 17598294653791 | 17598294655415 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7fc57b003680 | 0x7fc57a625f40 | 333187 | 333187 | 65536 | 7471104 | 1193904 | 133725160 | 17598294690874 | 17598294653791 | 17598295059551 | 17598295104823 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7fc57d663500 | 0x7fc57a625f80 | 330871 | 330871 | 65536 | 7340032 | 1159135 | 129836260 | 17598295116103 | 17598295059551 | 17598295497311 | 17598295540822 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7fc57d663380 | 0x7fc57a625fc0 | 305910 | 305910 | 65536 | 7340032 | 1121399 | 125509564 | 17598295551712 | 17598295497311 | 17598295908672 | 17598295910503 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7fc57d663200 | 0x7fc57a626000 | 542283 | 542283 | 65536 | 10420224 | 1568783 | 175813004 | 17598295945792 | 17598295908672 | 17598296439872 | 17598296482158 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7fc57d663080 | 0x7fc57a626040 | 272435 | 272435 | 65536 | 6488064 | 992618 | 111236844 | 17598296502797 | 17598296439872 | 17598296830912 | 17598296832689 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7fc57b003f00 | 0x7fc57a626080 | 364525 | 364525 | 65536 | 8519680 | 1361388 | 152365296 | 17598296869268 | 17598296830912 | 17598297256833 | 17598297299227 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7fc57b003d80 | 0x7fc57a6260c0 | 367851 | 367851 | 65536 | 8388608 | 1359359 | 152227300 | 17598297310527 | 17598297256833 | 17598297709633 | 17598297727836 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7fc57b003c00 | 0x7fc57a626100 | 346157 | 346157 | 65536 | 8388608 | 1297532 | 145388716 | 17598297745406 | 17598297709633 | 17598298117473 | 17598298163095 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7fc57b003a80 | 0x7fc57a626140 | 623057 | 623057 | 65536 | 11993088 | 1828127 | 204732500 | 17598298174855 | 17598298117473 | 17598298733954 | 17598298777430 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7fc57b003900 | 0x7fc57a626180 | 302787 | 302787 | 65536 | 7274496 | 1156188 | 129567956 | 17598298796769 | 17598298733954 | 17598299146914 | 17598299148690 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7fc57b003780 | 0x7fc57a6261c0 | 398823 | 398823 | 65536 | 9568256 | 1491465 | 167017620 | 17598299186029 | 17598299146914 | 17598299592835 | 17598299637038 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7fc57b003600 | 0x7fc57a626200 | 389443 | 389443 | 65536 | 9437184 | 1456663 | 163291036 | 17598299649217 | 17598299592835 | 17598300061315 | 17598300105206 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7fc57d663480 | 0x7fc57a626240 | 386633 | 386633 | 65536 | 9437184 | 1464421 | 163958644 | 17598300116546 | 17598300061315 | 17598300533795 | 17598300577924 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7fc57d663300 | 0x7fc57a626280 | 718746 | 718746 | 65536 | 16056320 | 2308323 | 258892844 | 17598300589654 | 17598300533795 | 17598301209156 | 17598301253387 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7fc57d663180 | 0x7fc57a6262c0 | 363190 | 363190 | 65536 | 8847360 | 1367371 | 153164760 | 17598301273886 | 17598301209156 | 17598301657636 | 17598301702005 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7fc57d663000 | 0x7fc57a626300 | 468855 | 468855 | 65536 | 11665408 | 1840693 | 206045152 | 17598301713865 | 17598301657636 | 17598302184677 | 17598302229022 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7fc57b003e80 | 0x7fc57a626340 | 471122 | 471122 | 65536 | 11468800 | 1835596 | 205579460 | 17598302240842 | 17598302184677 | 17598302714277 | 17598302758459 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7fc57b003d00 | 0x7fc57a626380 | 482691 | 482691 | 65536 | 14090240 | 2021655 | 226289536 | 17598302769468 | 17598302714277 | 17598303239557 | 17598303283735 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7fc57b003b80 | 0x7fc57a6263c0 | 879198 | 879198 | 65536 | 19202048 | 2757838 | 308615396 | 17598303295945 | 17598303239557 | 17598304018598 | 17598304060306 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7fc57b003a00 | 0x7fc57a626400 | 425606 | 425606 | 65536 | 10420224 | 1600707 | 179444132 | 17598304080715 | 17598304018598 | 17598304502758 | 17598304545083 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7fc57b003880 | 0x7fc57a626440 | 547968 | 547968 | 65536 | 13762560 | 2143950 | 240064628 | 17598304556993 | 17598304502758 | 17598305074599 | 17598305116809 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7fc57b003700 | 0x7fc57a626480 | 549766 | 549766 | 65536 | 13565952 | 2169986 | 243035864 | 17598305129159 | 17598305074599 | 17598305644199 | 17598305686654 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7fc57d663580 | 0x7fc57a6264c0 | 563418 | 563418 | 65536 | 15466496 | 2228340 | 249472868 | 17598305698124 | 17598305644199 | 17598306218120 | 17598306262830 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7fc57d663400 | 0x7fc57a626500 | 1043564 | 1043564 | 65536 | 22347776 | 3211811 | 359803404 | 17598306275119 | 17598306218120 | 17598307109960 | 17598307153547 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7fc57d663280 | 0x7fc57a626540 | 722110 | 722110 | 65536 | 20250624 | 2910147 | 325967960 | 17598307174287 | 17598307109960 | 17598307781481 | 17598307825580 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7fc57d663100 | 0x7fc57a626580 | 723565 | 723565 | 65536 | 20447232 | 2935970 | 328866128 | 17598307836850 | 17598307781481 | 17598308479401 | 17598308521872 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7fc57b003f80 | 0x7fc57a6265c0 | 721500 | 721500 | 65536 | 19595264 | 2814676 | 315453276 | 17598308533312 | 17598308479225 | 17598309162745 | 17598309208785 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7fc57b003e00 | 0x7fc57a626600 | 726076 | 726076 | 65536 | 20381696 | 2936476 | 328942212 | 17598309219944 | 17598309162745 | 17598309838265 | 17598309881097 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7fc57b003c80 | 0x7fc57a626640 | 1366825 | 1366825 | 65536 | 31522816 | 4514898 | 505583912 | 17598309891967 | 17598309838265 | 17598310928665 | 17598310975270 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7fc57b003b00 | 0x7fc57a626680 | 1371641 | 1371641 | 65536 | 38993920 | 5589029 | 626214956 | 17598310996489 | 17598310928665 | 17598312012346 | 17598312056892 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7fc57b003980 | 0x7fc57a6266c0 | 1372673 | 1372673 | 65536 | 39124992 | 5608013 | 627989248 | 17598312068272 | 17598312012346 | 17598313119226 | 17598313184094 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7fc57b003800 | 0x7fc57a626700 | 1370411 | 1370411 | 65536 | 38469632 | 5519358 | 617861312 | 17598313195153 | 17598313119226 | 17598314243227 | 17598314312425 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7fc57b003680 | 0x7fc57a626740 | 1375071 | 1375071 | 65536 | 39059456 | 5597910 | 626915124 | 17598314324455 | 17598314243227 | 17598315372347 | 17598315439636 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7fc57d663500 | 0x7fc57a626780 | 2664520 | 2664520 | 65536 | 60489728 | 8660095 | 969801984 | 17598315451946 | 17598315372347 | 17598317343388 | 17598317410306 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7fc57d663380 | 0x7fc57a6267c0 | 2666822 | 2666822 | 65536 | 77266944 | 11060008 | 1238260984 | 17598317430076 | 17598317343388 | 17598319273789 | 17598319343217 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7fc57d663200 | 0x7fc57a626800 | 2671085 | 2671085 | 65536 | 77398016 | 11073139 | 1240205108 | 17598319355797 | 17598319273789 | 17598321268189 | 17598321335786 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7fc57d663080 | 0x7fc57a626840 | 2668714 | 2668714 | 65536 | 76218368 | 10914634 | 1222575476 | 17598321348676 | 17598321268189 | 17598323245470 | 17598323317666 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7fc57b003f00 | 0x7fc57a626880 | 2674890 | 2674890 | 65536 | 77332480 | 11062184 | 1239088008 | 17598323330526 | 17598323245470 | 17598325194911 | 17598325263067 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 223297 | 223297 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7fc57b003d80 | 0x7fc57a6268c0 | 5255732 | 5255732 | 65536 | 120258560 | 17190583 | 1925804324 | 17598325275167 | 17598325194911 | 17598328815713 | 17598328885995 |