48 KiB
48 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | GRBM_COUNT | GRBM_GUI_ACTIVE | CPC_ME1_BUSY_FOR_PACKET_DECODE | SQ_CYCLES | SQ_WAVES | SQ_WAVE_CYCLES | SQ_BUSY_CYCLES | SQ_LEVEL_WAVES | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 188242 | 188242 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7fd4a6804280 | 388284 | 388284 | 8778 | 3106280 | 524288 | 244967804 | 3019488 | 0 | 996171404 | 17019739890511 | 17019036428116 | 17019885027682 | 17019885140781 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 188242 | 188242 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7fd4a6823f80 | 33728 | 33728 | 30230 | 269832 | 512 | 1693019 | 164026 | 0 | 6785384 | 17019890314053 | 17019885027682 | 17019890453268 | 17019890458139 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7fd4a9882380 | 0x7fd4a6823fc0 | 164607 | 164607 | 14285 | 1316864 | 65536 | 82622429 | 1217167 | 0 | 332218900 | 17019890502057 | 17019890453268 | 17019890848147 | 17019890850967 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7fd4a9882200 | 0x7fd4a6824000 | 309658 | 309658 | 24076 | 2477272 | 65536 | 219012158 | 2366437 | 0 | 877775120 | 17019890896976 | 17019890848147 | 17019891277266 | 17019891279845 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7fd4a9882080 | 0x7fd4a6824040 | 310040 | 310040 | 24363 | 2480328 | 65536 | 225077705 | 2376809 | 0 | 902038996 | 17019891321304 | 17019891277266 | 17019891699345 | 17019891701683 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7fd4a7223f00 | 0x7fd4a6824080 | 165622 | 165622 | 13528 | 1324984 | 65536 | 86026125 | 1218875 | 0 | 345830844 | 17019891743592 | 17019891699345 | 17019892029104 | 17019892031313 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7fd4a7223d80 | 0x7fd4a68240c0 | 165750 | 165750 | 13270 | 1326008 | 65536 | 80475542 | 1220716 | 0 | 323633496 | 17019892072222 | 17019892029104 | 17019892357103 | 17019892359374 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7fd4a7223c00 | 0x7fd4a6824100 | 163432 | 163432 | 14791 | 1307464 | 65536 | 93585040 | 1205188 | 0 | 376071904 | 17019892412603 | 17019892357103 | 17019892681902 | 17019892684125 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7fd4a7223a80 | 0x7fd4a6824140 | 309075 | 309075 | 24205 | 2472608 | 65536 | 225997374 | 2372366 | 0 | 905718780 | 17019892724894 | 17019892681902 | 17019893114221 | 17019893116502 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7fd4a7223900 | 0x7fd4a6824180 | 308706 | 308706 | 22158 | 2469656 | 65536 | 220629382 | 2366323 | 0 | 884246820 | 17019893156931 | 17019893114221 | 17019893531180 | 17019893533490 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7fd4a7223780 | 0x7fd4a68241c0 | 164153 | 164153 | 13740 | 1313232 | 65536 | 85861322 | 1212366 | 0 | 345182672 | 17019893573259 | 17019893531180 | 17019893856780 | 17019893858951 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7fd4a7223600 | 0x7fd4a6824200 | 164678 | 164678 | 14770 | 1317432 | 65536 | 103433271 | 1217099 | 0 | 415458036 | 17019893899070 | 17019893856780 | 17019894189899 | 17019894192201 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7fd4a9882480 | 0x7fd4a6824240 | 164178 | 164178 | 15592 | 1313432 | 65536 | 101440947 | 1208305 | 0 | 407487052 | 17019894244890 | 17019894189899 | 17019894528778 | 17019894530732 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7fd4a9882300 | 0x7fd4a6824280 | 308446 | 308446 | 24181 | 2467576 | 65536 | 232378960 | 2368086 | 0 | 931244284 | 17019894573300 | 17019894528778 | 17019894915177 | 17019894916821 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7fd4a9882180 | 0x7fd4a68242c0 | 311585 | 311585 | 22500 | 2492688 | 65536 | 214489817 | 2384988 | 0 | 859688956 | 17019894960409 | 17019894915177 | 17019895303976 | 17019895305769 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7fd4a9882000 | 0x7fd4a6824300 | 163900 | 163900 | 14490 | 1311208 | 65536 | 99622775 | 1212799 | 0 | 400219084 | 17019895349028 | 17019895303976 | 17019895606535 | 17019895608381 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7fd4a7223e80 | 0x7fd4a6824340 | 164189 | 164189 | 14508 | 1313520 | 65536 | 92243976 | 1212687 | 0 | 370707872 | 17019895650189 | 17019895606535 | 17019895903335 | 17019895905092 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7fd4a7223d00 | 0x7fd4a6824380 | 162516 | 162516 | 14902 | 1300136 | 65536 | 105724239 | 1201244 | 0 | 424614336 | 17019895954481 | 17019895903335 | 17019896201574 | 17019896203283 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7fd4a7223b80 | 0x7fd4a68243c0 | 311124 | 311124 | 24294 | 2489000 | 65536 | 225784686 | 2377134 | 0 | 904870576 | 17019896248312 | 17019896201574 | 17019896603013 | 17019896604732 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7fd4a7223a00 | 0x7fd4a6824400 | 304448 | 304448 | 20623 | 2435592 | 65536 | 214120756 | 2334150 | 0 | 858213992 | 17019896647051 | 17019896603013 | 17019896987332 | 17019896989151 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7fd4a7223880 | 0x7fd4a6824440 | 164215 | 164215 | 15996 | 1313728 | 65536 | 91156932 | 1206010 | 0 | 366361024 | 17019897030770 | 17019896987332 | 17019897286211 | 17019897287952 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7fd4a7223700 | 0x7fd4a6824480 | 162962 | 162962 | 14589 | 1303704 | 65536 | 100328217 | 1202971 | 0 | 403035840 | 17019897331531 | 17019897286211 | 17019897586371 | 17019897587983 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7fd4a9882580 | 0x7fd4a68244c0 | 162961 | 162961 | 14487 | 1303696 | 65536 | 90055159 | 1201273 | 0 | 361963328 | 17019897637642 | 17019897586371 | 17019897899170 | 17019897900994 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7fd4a9882400 | 0x7fd4a6824500 | 308294 | 308294 | 24020 | 2466360 | 65536 | 229014296 | 2370344 | 0 | 917788228 | 17019897947633 | 17019897899170 | 17019898309569 | 17019898311363 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7fd4a9882280 | 0x7fd4a6824540 | 306400 | 306400 | 20640 | 2451208 | 65536 | 220045737 | 2352752 | 0 | 881911332 | 17019898354911 | 17019898309569 | 17019898699008 | 17019898700691 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7fd4a9882100 | 0x7fd4a6824580 | 162081 | 162081 | 15031 | 1296656 | 65536 | 97679953 | 1198562 | 0 | 392454068 | 17019898743080 | 17019898699008 | 17019898996287 | 17019898997983 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7fd4a7223f80 | 0x7fd4a68245c0 | 162850 | 162850 | 15183 | 1302808 | 65536 | 86385221 | 1197567 | 0 | 347274720 | 17019899040172 | 17019898996287 | 17019899294687 | 17019899296444 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7fd4a7223e00 | 0x7fd4a6824600 | 162497 | 162497 | 15028 | 1299984 | 65536 | 104394021 | 1200433 | 0 | 419296472 | 17019899344993 | 17019899294687 | 17019899590206 | 17019899592086 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7fd4a7223c80 | 0x7fd4a6824640 | 307540 | 307540 | 23742 | 2460328 | 65536 | 225376191 | 2355673 | 0 | 903239688 | 17019899634165 | 17019899590206 | 17019899979645 | 17019899981385 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7fd4a7223b00 | 0x7fd4a6824680 | 307633 | 307633 | 23147 | 2461072 | 65536 | 216517802 | 2350793 | 0 | 867799744 | 17019900023674 | 17019899979645 | 17019900365244 | 17019900366854 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7fd4a7223980 | 0x7fd4a68246c0 | 163094 | 163094 | 14194 | 1304760 | 65536 | 93813826 | 1204080 | 0 | 376987852 | 17019900410352 | 17019900365244 | 17019900665083 | 17019900667035 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7fd4a7223800 | 0x7fd4a6824700 | 162627 | 162627 | 13806 | 1301024 | 65536 | 88290809 | 1202985 | 0 | 354889552 | 17019900709134 | 17019900665083 | 17019900961083 | 17019900962717 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7fd4a7223680 | 0x7fd4a6824740 | 161989 | 161989 | 14427 | 1295920 | 65536 | 97056218 | 1198379 | 0 | 389954544 | 17019901011405 | 17019900961083 | 17019901257402 | 17019901259068 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7fd4a9882500 | 0x7fd4a6824780 | 308085 | 308085 | 25114 | 2464688 | 65536 | 229681431 | 2358272 | 0 | 920455980 | 17019901305687 | 17019901257402 | 17019901652761 | 17019901654387 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7fd4a9882380 | 0x7fd4a68247c0 | 307826 | 307826 | 23005 | 2462616 | 65536 | 223872907 | 2363147 | 0 | 897220124 | 17019901696946 | 17019901652761 | 17019902040280 | 17019902042006 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7fd4a9882200 | 0x7fd4a6824800 | 162465 | 162465 | 14822 | 1299728 | 65536 | 94669907 | 1199458 | 0 | 380403800 | 17019902095604 | 17019902040280 | 17019902351319 | 17019902353147 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7fd4a9882080 | 0x7fd4a6824840 | 162384 | 162384 | 14944 | 1299080 | 65536 | 91745975 | 1197851 | 0 | 368707724 | 17019902395426 | 17019902351319 | 17019902653559 | 17019902655258 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7fd4a7223f00 | 0x7fd4a6824880 | 162393 | 162393 | 14204 | 1299152 | 65536 | 85230595 | 1196219 | 0 | 342653732 | 17019902704137 | 17019902653559 | 17019902950678 | 17019902952390 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7fd4a7223d80 | 0x7fd4a68248c0 | 305058 | 305058 | 23550 | 2440472 | 65536 | 216727852 | 2336323 | 0 | 868640936 | 17019902999248 | 17019902950678 | 17019903344917 | 17019903346598 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7fd4a7223c00 | 0x7fd4a6824900 | 306000 | 306000 | 22154 | 2448008 | 65536 | 220302769 | 2339223 | 0 | 882942584 | 17019903389427 | 17019903344917 | 17019903737556 | 17019903739237 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7fd4a7223a80 | 0x7fd4a6824940 | 162884 | 162884 | 14925 | 1303080 | 65536 | 92419461 | 1197223 | 0 | 371410720 | 17019903780286 | 17019903737556 | 17019904034355 | 17019904036028 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7fd4a7223900 | 0x7fd4a6824980 | 162925 | 162925 | 14138 | 1303408 | 65536 | 89579375 | 1201507 | 0 | 360046444 | 17019904077757 | 17019904034355 | 17019904332754 | 17019904334480 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7fd4a7223780 | 0x7fd4a68249c0 | 161424 | 161424 | 13639 | 1291400 | 65536 | 95625232 | 1193766 | 0 | 384223076 | 17019904383438 | 17019904332754 | 17019904636914 | 17019904638581 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7fd4a7223600 | 0x7fd4a6824a00 | 306826 | 306826 | 24307 | 2454616 | 65536 | 227545425 | 2349969 | 0 | 911910784 | 17019904679340 | 17019904636914 | 17019905022673 | 17019905024380 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7fd4a9882480 | 0x7fd4a6824a40 | 303566 | 303566 | 21192 | 2428536 | 65536 | 208896318 | 2325717 | 0 | 837314772 | 17019905067229 | 17019905022673 | 17019905407632 | 17019905409509 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7fd4a9882300 | 0x7fd4a6824a80 | 161841 | 161841 | 14773 | 1294736 | 65536 | 89673533 | 1194627 | 0 | 360432088 | 17019905451138 | 17019905407632 | 17019905709391 | 17019905710990 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7fd4a9882180 | 0x7fd4a6824ac0 | 161504 | 161504 | 15314 | 1292040 | 65536 | 96147774 | 1192435 | 0 | 386328292 | 17019905753439 | 17019905709391 | 17019906009230 | 17019906010992 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7fd4a9882000 | 0x7fd4a6824b00 | 160927 | 160927 | 14319 | 1287424 | 65536 | 88443027 | 1184781 | 0 | 355504476 | 17019906060020 | 17019906009230 | 17019906316430 | 17019906318233 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7fd4a7223e80 | 0x7fd4a6824b40 | 303278 | 303278 | 21505 | 2426232 | 65536 | 216485546 | 2325192 | 0 | 867674576 | 17019906359782 | 17019906316430 | 17019906700429 | 17019906702022 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7fd4a7223d00 | 0x7fd4a6824b80 | 302207 | 302207 | 21903 | 2417664 | 65536 | 215251597 | 2313509 | 0 | 862734640 | 17019906745211 | 17019906700429 | 17019907096428 | 17019907098201 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7fd4a7223b80 | 0x7fd4a6824bc0 | 162374 | 162374 | 14591 | 1299000 | 65536 | 87150686 | 1196659 | 0 | 350336144 | 17019907139759 | 17019907096428 | 17019907393387 | 17019907395222 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7fd4a7223a00 | 0x7fd4a6824c00 | 162502 | 162502 | 15914 | 1300024 | 65536 | 99921286 | 1199466 | 0 | 401418900 | 17019907436201 | 17019907393387 | 17019907696906 | 17019907698663 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7fd4a7223880 | 0x7fd4a6824c40 | 162706 | 162706 | 13818 | 1301656 | 65536 | 82762351 | 1196598 | 0 | 332775980 | 17019907747712 | 17019907696906 | 17019907998026 | 17019907999705 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7fd4a7223700 | 0x7fd4a6824c80 | 304267 | 304267 | 23145 | 2434144 | 65536 | 222478996 | 2327122 | 0 | 891651456 | 17019908046543 | 17019907998026 | 17019908388905 | 17019908390764 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7fd4a9882580 | 0x7fd4a6824cc0 | 303952 | 303952 | 21478 | 2431624 | 65536 | 205506097 | 2321658 | 0 | 823754880 | 17019908432852 | 17019908388905 | 17019908780104 | 17019908782002 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7fd4a9882400 | 0x7fd4a6824d00 | 163539 | 163539 | 14605 | 1308320 | 65536 | 91273930 | 1208643 | 0 | 366826044 | 17019908824281 | 17019908780104 | 17019909078503 | 17019909080104 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7fd4a9882280 | 0x7fd4a6824d40 | 168437 | 168437 | 15920 | 1347504 | 65536 | 104031738 | 1247420 | 0 | 417876240 | 17019909122133 | 17019909078503 | 17019909384742 | 17019909386605 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7fd4a9882100 | 0x7fd4a6824d80 | 162267 | 162267 | 14211 | 1298144 | 65536 | 86702542 | 1196100 | 0 | 348543284 | 17019909435804 | 17019909384742 | 17019909695782 | 17019909697586 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7fd4a7223f80 | 0x7fd4a6824dc0 | 301846 | 301846 | 23584 | 2414776 | 65536 | 220577811 | 2309798 | 0 | 884045032 | 17019909744465 | 17019909695782 | 17019910086341 | 17019910088055 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7fd4a7223e00 | 0x7fd4a6824e00 | 300915 | 300915 | 20299 | 2407328 | 65536 | 207299666 | 2300930 | 0 | 830933840 | 17019910131624 | 17019910086341 | 17019910477220 | 17019910479174 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7fd4a7223c80 | 0x7fd4a6824e40 | 163140 | 163140 | 14627 | 1305128 | 65536 | 85402584 | 1203745 | 0 | 343350424 | 17019910520492 | 17019910477220 | 17019910777059 | 17019910779015 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7fd4a7223b00 | 0x7fd4a6824e80 | 176787 | 176787 | 16716 | 1414304 | 65536 | 112737567 | 1311115 | 0 | 452688444 | 17019910821164 | 17019910777059 | 17019911086338 | 17019911088016 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7fd4a7223980 | 0x7fd4a6824ec0 | 161020 | 161020 | 14372 | 1288168 | 65536 | 92487796 | 1189123 | 0 | 371685284 | 17019911136975 | 17019911086338 | 17019911394178 | 17019911395877 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7fd4a7223800 | 0x7fd4a6824f00 | 301434 | 301434 | 22449 | 2411480 | 65536 | 218029663 | 2304365 | 0 | 873853416 | 17019911436996 | 17019911394178 | 17019911787777 | 17019911789416 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7fd4a7223680 | 0x7fd4a6824f40 | 302838 | 302838 | 22796 | 2422712 | 65536 | 217653524 | 2319895 | 0 | 872345508 | 17019911830465 | 17019911787777 | 17019912175136 | 17019912176875 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7fd4a9882500 | 0x7fd4a6824f80 | 161946 | 161946 | 14277 | 1295576 | 65536 | 81898690 | 1189989 | 0 | 329331848 | 17019912218774 | 17019912175136 | 17019912473375 | 17019912475106 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7fd4a9882380 | 0x7fd4a6824fc0 | 183802 | 183802 | 17838 | 1470424 | 65536 | 108675391 | 1356103 | 0 | 436441112 | 17019912517555 | 17019912473375 | 17019912788574 | 17019912790317 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7fd4a9882200 | 0x7fd4a6825000 | 163048 | 163048 | 14920 | 1304392 | 65536 | 88705420 | 1199342 | 0 | 356549296 | 17019912853326 | 17019912788574 | 17019913087934 | 17019913089659 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7fd4a9882080 | 0x7fd4a6825040 | 303024 | 303024 | 23587 | 2424200 | 65536 | 220057061 | 2315133 | 0 | 881959948 | 17019913131548 | 17019913087934 | 17019913479133 | 17019913480818 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7fd4a7223f00 | 0x7fd4a6825080 | 299786 | 299786 | 21443 | 2398296 | 65536 | 202728627 | 2290698 | 0 | 812647892 | 17019913522156 | 17019913479133 | 17019913872412 | 17019913874136 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7fd4a7223d80 | 0x7fd4a68250c0 | 162637 | 162637 | 14888 | 1301104 | 65536 | 93603878 | 1200522 | 0 | 376153116 | 17019913915665 | 17019913872412 | 17019914171771 | 17019914173788 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7fd4a7223c00 | 0x7fd4a6825100 | 191869 | 191869 | 17386 | 1534960 | 65536 | 116139410 | 1429153 | 0 | 466302880 | 17019914215096 | 17019914171771 | 17019914492730 | 17019914494408 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7fd4a7223a80 | 0x7fd4a6825140 | 161842 | 161842 | 14539 | 1294744 | 65536 | 96989194 | 1192942 | 0 | 389685368 | 17019914543777 | 17019914492730 | 17019914793369 | 17019914795070 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7fd4a7223900 | 0x7fd4a6825180 | 299986 | 299986 | 21390 | 2399896 | 65536 | 214601266 | 2296357 | 0 | 860144212 | 17019914836609 | 17019914793369 | 17019915178648 | 17019915180419 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7fd4a7223780 | 0x7fd4a68251c0 | 298612 | 298612 | 21830 | 2388904 | 65536 | 216239686 | 2288185 | 0 | 866688832 | 17019915222447 | 17019915178648 | 17019915560728 | 17019915562458 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7fd4a7223600 | 0x7fd4a6825200 | 162085 | 162085 | 15188 | 1296688 | 65536 | 92027840 | 1195005 | 0 | 369843584 | 17019915603646 | 17019915560728 | 17019915859607 | 17019915861369 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7fd4a9882480 | 0x7fd4a6825240 | 201297 | 201297 | 17661 | 1610384 | 65536 | 120329790 | 1502863 | 0 | 483074492 | 17019915903528 | 17019915859607 | 17019916188566 | 17019916190339 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7fd4a9882300 | 0x7fd4a6825280 | 161178 | 161178 | 15171 | 1289432 | 65536 | 90401143 | 1189957 | 0 | 363334664 | 17019916239898 | 17019916188566 | 17019916488085 | 17019916489881 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7fd4a9882180 | 0x7fd4a68252c0 | 300550 | 300550 | 22709 | 2404408 | 65536 | 220693741 | 2305668 | 0 | 884509940 | 17019916532090 | 17019916488085 | 17019916875124 | 17019916876810 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7fd4a9882000 | 0x7fd4a6825300 | 300454 | 300454 | 21781 | 2403640 | 65536 | 210303545 | 2301283 | 0 | 842948192 | 17019916919968 | 17019916875124 | 17019917261843 | 17019917263559 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7fd4a7223e80 | 0x7fd4a6825340 | 162212 | 162212 | 15338 | 1297704 | 65536 | 99053766 | 1196518 | 0 | 397946816 | 17019917305037 | 17019917261843 | 17019917562163 | 17019917563950 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7fd4a7223d00 | 0x7fd4a6825380 | 209361 | 209361 | 18083 | 1674896 | 65536 | 140555691 | 1574100 | 0 | 563964608 | 17019917604909 | 17019917562163 | 17019917893042 | 17019917894760 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7fd4a7223b80 | 0x7fd4a68253c0 | 160416 | 160416 | 14229 | 1283336 | 65536 | 86177494 | 1183982 | 0 | 346440704 | 17019917943099 | 17019917893042 | 17019918197681 | 17019918199452 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7fd4a7223a00 | 0x7fd4a6825400 | 303291 | 303291 | 24575 | 2426336 | 65536 | 220231046 | 2316246 | 0 | 882658956 | 17019918240940 | 17019918197681 | 17019918592080 | 17019918593790 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7fd4a7223880 | 0x7fd4a6825440 | 298452 | 298452 | 20933 | 2387624 | 65536 | 212328676 | 2287737 | 0 | 851046284 | 17019918636129 | 17019918592080 | 17019918977359 | 17019918978939 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7fd4a7223700 | 0x7fd4a6825480 | 162640 | 162640 | 16033 | 1301128 | 65536 | 98429647 | 1197944 | 0 | 395456820 | 17019919020628 | 17019918977359 | 17019919275919 | 17019919277581 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7fd4a9882580 | 0x7fd4a68254c0 | 218895 | 218895 | 19088 | 1751168 | 65536 | 134916509 | 1640669 | 0 | 541412780 | 17019919319649 | 17019919275919 | 17019919609038 | 17019919610721 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7fd4a9882400 | 0x7fd4a6825500 | 160860 | 160860 | 14714 | 1286888 | 65536 | 88793768 | 1182386 | 0 | 356912272 | 17019919659370 | 17019919609038 | 17019919908717 | 17019919910502 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7fd4a9882280 | 0x7fd4a6825540 | 297703 | 297703 | 22507 | 2381632 | 65536 | 216068787 | 2280285 | 0 | 866004788 | 17019919957431 | 17019919908717 | 17019920302636 | 17019920304321 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7fd4a9882100 | 0x7fd4a6825580 | 299560 | 299560 | 21941 | 2396488 | 65536 | 216480426 | 2292872 | 0 | 867654480 | 17019920347060 | 17019920302636 | 17019920688075 | 17019920689830 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7fd4a7223f80 | 0x7fd4a68255c0 | 162441 | 162441 | 16205 | 1299536 | 65536 | 100361258 | 1192677 | 0 | 403186300 | 17019920731679 | 17019920688075 | 17019920991915 | 17019920993631 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7fd4a7223e00 | 0x7fd4a6825600 | 228520 | 228520 | 19496 | 1828168 | 65536 | 155942898 | 1721727 | 0 | 625514120 | 17019921034580 | 17019920991915 | 17019921331754 | 17019921333412 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7fd4a7223c80 | 0x7fd4a6825640 | 161723 | 161723 | 15118 | 1293792 | 65536 | 96500804 | 1192708 | 0 | 387745060 | 17019921382040 | 17019921331754 | 17019921630793 | 17019921632563 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7fd4a7223b00 | 0x7fd4a6825680 | 298307 | 298307 | 21565 | 2386464 | 65536 | 209764458 | 2280926 | 0 | 840797696 | 17019921674392 | 17019921630793 | 17019922015592 | 17019922017392 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7fd4a7223980 | 0x7fd4a68256c0 | 298191 | 298191 | 21439 | 2385536 | 65536 | 215904989 | 2285082 | 0 | 865356384 | 17019922059011 | 17019922015592 | 17019922411751 | 17019922413661 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7fd4a7223800 | 0x7fd4a6825700 | 164533 | 164533 | 16524 | 1316272 | 65536 | 100042591 | 1217850 | 0 | 401910124 | 17019922454709 | 17019922411751 | 17019922713190 | 17019922715032 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7fd4a7223680 | 0x7fd4a6825740 | 237923 | 237923 | 19939 | 1903392 | 65536 | 167035144 | 1801814 | 0 | 669888720 | 17019922755431 | 17019922713190 | 17019923064550 | 17019923066602 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7fd4a9882500 | 0x7fd4a6825780 | 161449 | 161449 | 15348 | 1291600 | 65536 | 93591873 | 1189343 | 0 | 376103256 | 17019923115861 | 17019923064550 | 17019923367429 | 17019923369183 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7fd4a9882380 | 0x7fd4a68257c0 | 298067 | 298067 | 20487 | 2384544 | 65536 | 205317305 | 2280812 | 0 | 823003440 | 17019923410852 | 17019923367429 | 17019923750788 | 17019923752522 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7fd4a9882200 | 0x7fd4a6825800 | 300351 | 300351 | 20739 | 2402816 | 65536 | 202860591 | 2289812 | 0 | 813175988 | 17019923796111 | 17019923750788 | 17019924136547 | 17019924138231 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7fd4a9882080 | 0x7fd4a6825840 | 169039 | 169039 | 15512 | 1352320 | 65536 | 103270277 | 1254107 | 0 | 414829888 | 17019924180680 | 17019924136547 | 17019924441026 | 17019924442752 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7fd4a7223f00 | 0x7fd4a6825880 | 258821 | 258821 | 21059 | 2070576 | 65536 | 180542266 | 1963442 | 0 | 723936176 | 17019924484891 | 17019924441026 | 17019924801025 | 17019924802772 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7fd4a7223d80 | 0x7fd4a68258c0 | 161377 | 161377 | 15076 | 1291024 | 65536 | 98133457 | 1192008 | 0 | 394267164 | 17019924851861 | 17019924801025 | 17019925105025 | 17019925106673 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7fd4a7223c00 | 0x7fd4a6825900 | 296691 | 296691 | 20516 | 2373536 | 65536 | 198936311 | 2264724 | 0 | 797485032 | 17019925147732 | 17019925105025 | 17019925493664 | 17019925495622 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7fd4a7223a80 | 0x7fd4a6825940 | 297183 | 297183 | 21323 | 2377472 | 65536 | 213698839 | 2272864 | 0 | 856539284 | 17019925537061 | 17019925493664 | 17019925878783 | 17019925880601 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7fd4a7223900 | 0x7fd4a6825980 | 178355 | 178355 | 16471 | 1426848 | 65536 | 105439006 | 1323191 | 0 | 423505148 | 17019925922350 | 17019925878783 | 17019926200702 | 17019926202732 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7fd4a7223780 | 0x7fd4a68259c0 | 280283 | 280283 | 22487 | 2242272 | 65536 | 194211448 | 2130790 | 0 | 778597920 | 17019926244501 | 17019926200702 | 17019926586781 | 17019926588551 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7fd4a7223600 | 0x7fd4a6825a00 | 161161 | 161161 | 15111 | 1289296 | 65536 | 103828108 | 1191034 | 0 | 417045624 | 17019926636930 | 17019926586781 | 17019926892540 | 17019926894152 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7fd4a9882480 | 0x7fd4a6825a40 | 296477 | 296477 | 20738 | 2371824 | 65536 | 200644064 | 2263878 | 0 | 804345152 | 17019926940221 | 17019926892540 | 17019927285179 | 17019927286931 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7fd4a9882300 | 0x7fd4a6825a80 | 295792 | 295792 | 20843 | 2366344 | 65536 | 205543210 | 2263088 | 0 | 823913448 | 17019927329410 | 17019927285179 | 17019927670619 | 17019927672430 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7fd4a9882180 | 0x7fd4a6825ac0 | 187161 | 187161 | 17759 | 1497296 | 65536 | 113535657 | 1387980 | 0 | 455895632 | 17019927713099 | 17019927670619 | 17019927991578 | 17019927993341 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7fd4a9882000 | 0x7fd4a6825b00 | 301126 | 301126 | 23560 | 2409016 | 65536 | 195683995 | 2297517 | 0 | 784487464 | 17019928035589 | 17019927991578 | 17019928379897 | 17019928381529 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7fd4a7223e80 | 0x7fd4a6825b40 | 172838 | 172838 | 16831 | 1382712 | 65536 | 99877559 | 1272699 | 0 | 401255600 | 17019928430808 | 17019928379897 | 17019928692696 | 17019928694451 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7fd4a7223d00 | 0x7fd4a6825b80 | 301854 | 301854 | 19691 | 2414840 | 65536 | 142169715 | 2276076 | 0 | 570431448 | 17019928735269 | 17019928692696 | 17019929083255 | 17019929085049 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7fd4a7223b80 | 0x7fd4a6825bc0 | 298791 | 298791 | 20675 | 2390336 | 65536 | 189378255 | 2269517 | 0 | 759256000 | 17019929126528 | 17019929083255 | 17019929473494 | 17019929475318 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7fd4a7223a00 | 0x7fd4a6825c00 | 204332 | 204332 | 18213 | 1634664 | 65536 | 131375671 | 1527534 | 0 | 527258728 | 17019929516117 | 17019929473494 | 17019929798773 | 17019929800689 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7fd4a7223880 | 0x7fd4a6825c40 | 340143 | 340143 | 25746 | 2721152 | 65536 | 241232295 | 2610996 | 0 | 966686884 | 17019929841158 | 17019929798773 | 17019930212052 | 17019930260406 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7fd4a7223700 | 0x7fd4a6825c80 | 184388 | 184388 | 17456 | 1475112 | 65536 | 112387719 | 1363915 | 0 | 451295804 | 17019930279635 | 17019930212052 | 17019930564692 | 17019930566547 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7fd4a9882580 | 0x7fd4a6825cc0 | 294137 | 294137 | 20138 | 2353104 | 65536 | 193105829 | 2247784 | 0 | 774178636 | 17019930608576 | 17019930564692 | 17019930948851 | 17019930950496 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7fd4a9882400 | 0x7fd4a6825d00 | 296040 | 296040 | 19946 | 2368328 | 65536 | 176452178 | 2260936 | 0 | 707561580 | 17019930993075 | 17019930948851 | 17019931335250 | 17019931337025 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7fd4a9882280 | 0x7fd4a6825d40 | 225869 | 225869 | 19777 | 1806960 | 65536 | 142663616 | 1693625 | 0 | 572413440 | 17019931379484 | 17019931335250 | 17019931677329 | 17019931679115 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7fd4a9882100 | 0x7fd4a6825d80 | 381688 | 381688 | 27505 | 3053512 | 65536 | 271221019 | 2939507 | 0 | 1086640092 | 17019931721464 | 17019931677329 | 17019932120848 | 17019932166401 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7fd4a7223f80 | 0x7fd4a6825dc0 | 210977 | 210977 | 18418 | 1687824 | 65536 | 129803780 | 1581665 | 0 | 520962156 | 17019932186530 | 17019932120848 | 17019932476687 | 17019932478582 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7fd4a7223e00 | 0x7fd4a6825e00 | 309112 | 309112 | 23640 | 2472904 | 65536 | 184640761 | 2346017 | 0 | 740330276 | 17019932520181 | 17019932476687 | 17019932872366 | 17019932914309 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7fd4a7223c80 | 0x7fd4a6825e40 | 310819 | 310819 | 21589 | 2486560 | 65536 | 186183429 | 2361326 | 0 | 746506536 | 17019932925889 | 17019932872366 | 17019933296365 | 17019933298288 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7fd4a7223b00 | 0x7fd4a6825e80 | 266224 | 266224 | 21258 | 2129800 | 65536 | 169670490 | 2021152 | 0 | 680440276 | 17019933339257 | 17019933296365 | 17019933663404 | 17019933665208 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7fd4a7223980 | 0x7fd4a6825ec0 | 462509 | 462509 | 31297 | 3700080 | 65536 | 331978181 | 3583026 | 0 | 1329674540 | 17019933707527 | 17019933663404 | 17019934152843 | 17019934174633 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7fd4a7223800 | 0x7fd4a6825f00 | 243308 | 243308 | 20340 | 1946472 | 65536 | 168963774 | 1843389 | 0 | 677609504 | 17019934205242 | 17019934152843 | 17019934519242 | 17019934520873 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7fd4a7223680 | 0x7fd4a6825f40 | 335477 | 335477 | 23548 | 2683824 | 65536 | 216303014 | 2569221 | 0 | 866987324 | 17019934564502 | 17019934519242 | 17019934938281 | 17019934980730 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7fd4a9882500 | 0x7fd4a6825f80 | 328686 | 328686 | 22970 | 2629496 | 65536 | 207113270 | 2513175 | 0 | 830218444 | 17019934992470 | 17019934938281 | 17019935369640 | 17019935411328 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7fd4a9882380 | 0x7fd4a6825fc0 | 307135 | 307135 | 23981 | 2457088 | 65536 | 214318920 | 2344555 | 0 | 859034864 | 17019935422998 | 17019935369640 | 17019935784839 | 17019935786587 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7fd4a9882200 | 0x7fd4a6826000 | 542384 | 542384 | 35431 | 4339080 | 65536 | 406972513 | 4225789 | 0 | 1629654268 | 17019935828886 | 17019935784839 | 17019936331718 | 17019936373700 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7fd4a9882080 | 0x7fd4a6826040 | 271653 | 271653 | 21618 | 2173232 | 65536 | 189926627 | 2066340 | 0 | 761462052 | 17019936394060 | 17019936331718 | 17019936723557 | 17019936725430 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7fd4a7223f00 | 0x7fd4a6826080 | 365656 | 365656 | 26400 | 2925256 | 65536 | 239544602 | 2802159 | 0 | 959963024 | 17019936767519 | 17019936723557 | 17019937158116 | 17019937200167 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7fd4a7223d80 | 0x7fd4a68260c0 | 367182 | 367182 | 29185 | 2937464 | 65536 | 253698655 | 2819589 | 0 | 1016566828 | 17019937211696 | 17019937158116 | 17019937614915 | 17019937633424 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7fd4a7223c00 | 0x7fd4a6826100 | 347284 | 347284 | 25374 | 2778280 | 65536 | 243127918 | 2665619 | 0 | 974277912 | 17019937658233 | 17019937614915 | 17019938036994 | 17019938055602 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7fd4a7223a80 | 0x7fd4a6826140 | 623848 | 623848 | 39545 | 4990792 | 65536 | 476972784 | 4876202 | 0 | 1909661196 | 17019938087101 | 17019938036994 | 17019938643712 | 17019938663674 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7fd4a7223900 | 0x7fd4a6826180 | 303270 | 303270 | 22844 | 2426168 | 65536 | 206351438 | 2319175 | 0 | 827172668 | 17019938695814 | 17019938643712 | 17019939049151 | 17019939050853 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7fd4a7223780 | 0x7fd4a68261c0 | 397024 | 397024 | 27275 | 3176200 | 65536 | 276897054 | 3067980 | 0 | 1109374504 | 17019939092252 | 17019939049151 | 17019939504670 | 17019939522360 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7fd4a7223600 | 0x7fd4a6826200 | 391322 | 391322 | 27324 | 3130584 | 65536 | 293408837 | 3027057 | 0 | 1175417380 | 17019939550119 | 17019939504670 | 17019939964029 | 17019939980666 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7fd4a9882480 | 0x7fd4a6826240 | 387216 | 387216 | 27149 | 3097736 | 65536 | 276453939 | 2989703 | 0 | 1107586408 | 17019940007466 | 17019939964029 | 17019940408508 | 17019940427314 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7fd4a9882300 | 0x7fd4a6826280 | 718893 | 718893 | 44892 | 5751152 | 65536 | 540909144 | 5631157 | 0 | 2165377160 | 17019940451463 | 17019940408508 | 17019941069466 | 17019941087035 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7fd4a9882180 | 0x7fd4a68262c0 | 362692 | 362692 | 26410 | 2901544 | 65536 | 269988979 | 2797078 | 0 | 1081718476 | 17019941121724 | 17019941069466 | 17019941508185 | 17019941524652 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7fd4a9882000 | 0x7fd4a6826300 | 468925 | 468925 | 31339 | 3751408 | 65536 | 353206683 | 3646392 | 0 | 1414610572 | 17019941558011 | 17019941508185 | 17019942019224 | 17019942036587 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7fd4a7223e80 | 0x7fd4a6826340 | 471945 | 471945 | 31667 | 3775568 | 65536 | 353064816 | 3674954 | 0 | 1414038500 | 17019942061736 | 17019942019224 | 17019942556663 | 17019942583791 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7fd4a7223d00 | 0x7fd4a6826380 | 482646 | 482646 | 32494 | 3861176 | 65536 | 350916002 | 3748279 | 0 | 1405404980 | 17019942599371 | 17019942556663 | 17019943064822 | 17019943106176 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7fd4a7223b80 | 0x7fd4a68263c0 | 879860 | 879860 | 52531 | 7038888 | 65536 | 673266878 | 6925663 | 0 | 2694808708 | 17019943117766 | 17019943064822 | 17019943842900 | 17019943884464 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7fd4a7223a00 | 0x7fd4a6826400 | 426810 | 426810 | 29389 | 3414488 | 65536 | 318360271 | 3302521 | 0 | 1275208344 | 17019943905024 | 17019943842900 | 17019944337299 | 17019944379180 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7fd4a7223880 | 0x7fd4a6826440 | 548651 | 548651 | 35190 | 4389216 | 65536 | 411611099 | 4291196 | 0 | 1648231508 | 17019944390770 | 17019944337299 | 17019944915377 | 17019944957113 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7fd4a7223700 | 0x7fd4a6826480 | 550796 | 550796 | 35888 | 4406376 | 65536 | 418298817 | 4302485 | 0 | 1674977700 | 17019944969823 | 17019944915377 | 17019945488336 | 17019945530227 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7fd4a9882580 | 0x7fd4a68264c0 | 564263 | 564263 | 36432 | 4514112 | 65536 | 413688773 | 4395485 | 0 | 1656498992 | 17019945541717 | 17019945488336 | 17019946061294 | 17019946082871 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7fd4a9882400 | 0x7fd4a6826500 | 1041668 | 1041668 | 61157 | 8333352 | 65536 | 808631621 | 8221391 | 0 | 3236268028 | 17019946105760 | 17019946061294 | 17019946933132 | 17019946977205 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7fd4a9882280 | 0x7fd4a6826540 | 721977 | 721977 | 44212 | 5775824 | 65536 | 542724440 | 5658955 | 0 | 2172638428 | 17019946996855 | 17019946933132 | 17019947605771 | 17019947654306 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7fd4a9882100 | 0x7fd4a6826580 | 723172 | 723172 | 44340 | 5785384 | 65536 | 552253073 | 5671886 | 0 | 2210754476 | 17019947666266 | 17019947605785 | 17019948300342 | 17019948342346 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7fd4a7223f80 | 0x7fd4a68265c0 | 722513 | 722513 | 44340 | 5780112 | 65536 | 544174125 | 5659357 | 0 | 2178437688 | 17019948353756 | 17019948300342 | 17019948985781 | 17019949028687 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7fd4a7223e00 | 0x7fd4a6826600 | 724900 | 724900 | 44665 | 5799208 | 65536 | 556871694 | 5691208 | 0 | 2229227556 | 17019949040096 | 17019948985781 | 17019949675219 | 17019949719167 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7fd4a7223c80 | 0x7fd4a6826640 | 1366652 | 1366652 | 76866 | 10933224 | 65536 | 1073587196 | 10814138 | 0 | 4296090528 | 17019949730776 | 17019949675219 | 17019950786576 | 17019950832925 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7fd4a7223b00 | 0x7fd4a6826680 | 1370605 | 1370605 | 77400 | 10964848 | 65536 | 1079096524 | 10849885 | 0 | 4318127900 | 17019950853444 | 17019950786576 | 17019951888174 | 17019951954703 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7fd4a7223980 | 0x7fd4a68266c0 | 1373983 | 1373983 | 78215 | 10991872 | 65536 | 1081142446 | 10858613 | 0 | 4326311496 | 17019951966762 | 17019951888174 | 17019953044491 | 17019953111700 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7fd4a7223800 | 0x7fd4a6826700 | 1370219 | 1370219 | 76932 | 10961760 | 65536 | 1079430818 | 10852790 | 0 | 4319464284 | 17019953124029 | 17019953044491 | 17019954190408 | 17019954260837 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7fd4a7223680 | 0x7fd4a6826740 | 1375940 | 1375940 | 77352 | 11007528 | 65536 | 1087603614 | 10892151 | 0 | 4352157020 | 17019954273096 | 17019954190408 | 17019955322246 | 17019955389134 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7fd4a9882500 | 0x7fd4a6826780 | 2661862 | 2661862 | 142555 | 21294904 | 65536 | 2128760507 | 21183129 | 0 | 8516783620 | 17019955400884 | 17019955322246 | 17019957285441 | 17019957357258 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7fd4a9882380 | 0x7fd4a68267c0 | 2669925 | 2669925 | 142004 | 21359408 | 65536 | 2133316233 | 21234463 | 0 | 8535005948 | 17019957376547 | 17019957285441 | 17019959224956 | 17019959294972 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7fd4a9882200 | 0x7fd4a6826800 | 2668610 | 2668610 | 142740 | 21348888 | 65536 | 2133378969 | 21236291 | 0 | 8535256284 | 17019959308242 | 17019959224956 | 17019961226232 | 17019961292545 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7fd4a9882080 | 0x7fd4a6826840 | 2668083 | 2668083 | 143159 | 21344672 | 65536 | 2125348844 | 21224417 | 0 | 8503136340 | 17019961304345 | 17019961226232 | 17019963216147 | 17019963288077 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7fd4a7223f00 | 0x7fd4a6826880 | 2672360 | 2672360 | 143522 | 21378888 | 65536 | 2126093067 | 21259179 | 0 | 8506114380 | 17019963299897 | 17019963216147 | 17019965167982 | 17019965235301 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 188242 | 188242 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7fd4a7223d80 | 0x7fd4a68268c0 | 5257989 | 5257989 | 273624 | 42063920 | 65536 | 4230758330 | 41923563 | 0 | 16924775100 | 17019965246801 | 17019965167982 | 17019968796454 | 17019968867607 |