41 KiB
41 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | SQ_INSTS_SMEM | SQ_INST_LEVEL_SMEM | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 223075 | 223075 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7f931ec04280 | 3670016 | 2924224 | 327281248 | 17597154367976 | 17588719430319 | 17597306738811 | 17597306856651 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 223075 | 223075 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7f931ec23f80 | 512 | 96990 | 10865032 | 17597311964571 | 17597306738811 | 17597312097854 | 17597312102767 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7f9321c13380 | 0x7f931ec23fc0 | 65536 | 635542 | 71138720 | 17597312138116 | 17597312097854 | 17597312468574 | 17597312471268 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7f9321c13200 | 0x7f931ec24000 | 65536 | 668954 | 74844872 | 17597312508957 | 17597312468574 | 17597312880734 | 17597312883107 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7f9321c13080 | 0x7f931ec24040 | 65536 | 665030 | 74552216 | 17597312916436 | 17597312880734 | 17597313280574 | 17597313282907 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7f931f46df00 | 0x7f931ec24080 | 65536 | 664266 | 74264696 | 17597313316306 | 17597313280574 | 17597313587455 | 17597313589829 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7f931f46dd80 | 0x7f931ec240c0 | 65536 | 662688 | 74184792 | 17597313622909 | 17597313587455 | 17597313898815 | 17597313901412 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7f931f46dc00 | 0x7f931ec24100 | 131072 | 674174 | 75457840 | 17597313946930 | 17597313898815 | 17597314213215 | 17597314215744 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7f931f46da80 | 0x7f931ec24140 | 131072 | 726098 | 81306128 | 17597314248903 | 17597314213215 | 17597314618655 | 17597314621123 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7f931f46d900 | 0x7f931ec24180 | 65536 | 679034 | 76165256 | 17597314652482 | 17597314618655 | 17597315014976 | 17597315017543 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7f931f46d780 | 0x7f931ec241c0 | 131072 | 712554 | 79823496 | 17597315047612 | 17597315014976 | 17597315336576 | 17597315338935 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7f931f46d600 | 0x7f931ec24200 | 131072 | 703346 | 78696448 | 17597315372044 | 17597315336576 | 17597315646976 | 17597315649507 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7f9321c13480 | 0x7f931ec24240 | 131072 | 704280 | 78756160 | 17597315689836 | 17597315646976 | 17597315959136 | 17597315961459 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7f9321c13300 | 0x7f931ec24280 | 131072 | 714192 | 79980280 | 17597315994668 | 17597315959136 | 17597316355616 | 17597316358149 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7f9321c13180 | 0x7f931ec242c0 | 65536 | 674066 | 75458304 | 17597316390698 | 17597316355616 | 17597316750817 | 17597316753269 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7f9321c13000 | 0x7f931ec24300 | 131072 | 706866 | 79057552 | 17597316786328 | 17597316750817 | 17597317057377 | 17597317059851 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7f931f46de80 | 0x7f931ec24340 | 131072 | 718248 | 80420472 | 17597317091891 | 17597317057377 | 17597317362657 | 17597317365124 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7f931f46dd00 | 0x7f931ec24380 | 131072 | 703250 | 78853504 | 17597317404783 | 17597317362657 | 17597317667937 | 17597317670476 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7f931f46db80 | 0x7f931ec243c0 | 131072 | 714636 | 79960808 | 17597317703385 | 17597317667937 | 17597318060577 | 17597318062946 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7f931f46da00 | 0x7f931ec24400 | 65536 | 630326 | 70626920 | 17597318105805 | 17597318060577 | 17597318506178 | 17597318508775 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7f931f46d880 | 0x7f931ec24440 | 131072 | 715790 | 80058024 | 17597318540724 | 17597318506178 | 17597318813698 | 17597318816247 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7f931f46d700 | 0x7f931ec24480 | 131072 | 691454 | 77402272 | 17597318850086 | 17597318813698 | 17597319118178 | 17597319120109 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7f9321c13580 | 0x7f931ec244c0 | 131072 | 669112 | 74898928 | 17597319159448 | 17597319118178 | 17597319397378 | 17597319399412 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7f9321c13400 | 0x7f931ec24500 | 131072 | 708748 | 79261640 | 17597319432951 | 17597319397378 | 17597319761858 | 17597319763613 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7f9321c13280 | 0x7f931ec24540 | 65536 | 688240 | 77087656 | 17597319796522 | 17597319761858 | 17597320130979 | 17597320132803 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7f9321c13100 | 0x7f931ec24580 | 131072 | 678180 | 75974336 | 17597320165302 | 17597320130979 | 17597320407939 | 17597320410176 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7f931f46df80 | 0x7f931ec245c0 | 131072 | 660320 | 74001800 | 17597320442495 | 17597320407939 | 17597320685539 | 17597320687419 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7f931f46de00 | 0x7f931ec24600 | 131072 | 694760 | 77826152 | 17597320725998 | 17597320685539 | 17597320971939 | 17597320973862 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7f931f46dc80 | 0x7f931ec24640 | 131072 | 652222 | 73024600 | 17597321006161 | 17597320971939 | 17597321339779 | 17597321341672 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7f931f46db00 | 0x7f931ec24680 | 65536 | 644760 | 72175248 | 17597321373252 | 17597321339779 | 17597321712100 | 17597321713953 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7f931f46d980 | 0x7f931ec246c0 | 131072 | 697950 | 78224064 | 17597321744992 | 17597321712100 | 17597321996580 | 17597321998466 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7f931f46d800 | 0x7f931ec24700 | 131072 | 715062 | 80079536 | 17597322030445 | 17597321996580 | 17597322285540 | 17597322287398 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7f931f46d680 | 0x7f931ec24740 | 131072 | 697808 | 78194000 | 17597322326607 | 17597322285540 | 17597322567620 | 17597322569481 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7f9321c13500 | 0x7f931ec24780 | 131072 | 682792 | 76451232 | 17597322600290 | 17597322567620 | 17597322935940 | 17597322937742 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7f9321c13380 | 0x7f931ec247c0 | 65536 | 664222 | 74436624 | 17597322970181 | 17597322935940 | 17597323304901 | 17597323306962 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7f9321c13200 | 0x7f931ec24800 | 131072 | 735872 | 82313560 | 17597323338562 | 17597323304901 | 17597323584421 | 17597323586475 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7f9321c13080 | 0x7f931ec24840 | 131072 | 697810 | 78129336 | 17597323618265 | 17597323584421 | 17597323864421 | 17597323866248 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7f931f46df00 | 0x7f931ec24880 | 131072 | 694898 | 77830464 | 17597323905857 | 17597323864421 | 17597324147781 | 17597324149601 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7f931f46dd80 | 0x7f931ec248c0 | 131072 | 702560 | 78715112 | 17597324181220 | 17597324147781 | 17597324518021 | 17597324519812 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7f931f46dc00 | 0x7f931ec24900 | 65536 | 634644 | 70977992 | 17597324551461 | 17597324518021 | 17597324889862 | 17597324891632 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7f931f46da80 | 0x7f931ec24940 | 131072 | 697140 | 78131152 | 17597324922462 | 17597324889862 | 17597325169382 | 17597325171185 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7f931f46d900 | 0x7f931ec24980 | 131072 | 697980 | 78084744 | 17597325203334 | 17597325169382 | 17597325449542 | 17597325451328 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7f931f46d780 | 0x7f931ec249c0 | 131072 | 696226 | 78049968 | 17597325489587 | 17597325449542 | 17597325728582 | 17597325730501 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7f931f46d600 | 0x7f931ec24a00 | 131072 | 702108 | 78737352 | 17597325762170 | 17597325728582 | 17597326091302 | 17597326093172 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7f9321c13480 | 0x7f931ec24a40 | 65536 | 666410 | 74655072 | 17597326126661 | 17597326091302 | 17597326462503 | 17597326464312 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7f9321c13300 | 0x7f931ec24a80 | 131072 | 673530 | 75430064 | 17597326496362 | 17597326462503 | 17597326746023 | 17597326747925 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7f9321c13180 | 0x7f931ec24ac0 | 131072 | 667014 | 74670760 | 17597326780364 | 17597326746023 | 17597327028903 | 17597327030658 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7f9321c13000 | 0x7f931ec24b00 | 131072 | 671252 | 75264880 | 17597327069437 | 17597327028903 | 17597327319143 | 17597327320991 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7f931f46de80 | 0x7f931ec24b40 | 131072 | 712228 | 79799792 | 17597327352480 | 17597327319143 | 17597327684743 | 17597327686711 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7f931f46dd00 | 0x7f931ec24b80 | 65536 | 658750 | 73677624 | 17597327718170 | 17597327684743 | 17597328048424 | 17597328050372 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7f931f46db80 | 0x7f931ec24bc0 | 131072 | 697100 | 78223472 | 17597328081711 | 17597328048424 | 17597328327144 | 17597328329005 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7f931f46da00 | 0x7f931ec24c00 | 131072 | 710644 | 79686320 | 17597328361274 | 17597328327144 | 17597328610504 | 17597328612358 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7f931f46d880 | 0x7f931ec24c40 | 131072 | 710408 | 79587520 | 17597328651187 | 17597328610504 | 17597328889224 | 17597328891190 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7f931f46d700 | 0x7f931ec24c80 | 131072 | 672038 | 75223808 | 17597328922200 | 17597328889224 | 17597329257704 | 17597329259461 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7f9321c13580 | 0x7f931ec24cc0 | 65536 | 662710 | 74304592 | 17597329291530 | 17597329257704 | 17597329622665 | 17597329624542 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7f9321c13400 | 0x7f931ec24d00 | 131072 | 706096 | 79082776 | 17597329656121 | 17597329622665 | 17597329903945 | 17597329905965 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7f9321c13280 | 0x7f931ec24d40 | 131072 | 702730 | 78712760 | 17597329937524 | 17597329903945 | 17597330201385 | 17597330203447 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7f9321c13100 | 0x7f931ec24d80 | 131072 | 716614 | 80258024 | 17597330242846 | 17597330201385 | 17597330484425 | 17597330486270 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7f931f46df80 | 0x7f931ec24dc0 | 131072 | 656912 | 73598504 | 17597330519099 | 17597330484425 | 17597330848105 | 17597330850041 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7f931f46de00 | 0x7f931ec24e00 | 65536 | 633070 | 70869888 | 17597330882520 | 17597330848105 | 17597331212106 | 17597331213981 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7f931f46dc80 | 0x7f931ec24e40 | 131072 | 705818 | 79022760 | 17597331245461 | 17597331212106 | 17597331490506 | 17597331492484 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7f931f46db00 | 0x7f931ec24e80 | 131072 | 718288 | 80554376 | 17597331523804 | 17597331490506 | 17597331778346 | 17597331780317 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7f931f46d980 | 0x7f931ec24ec0 | 131072 | 661874 | 74136848 | 17597331818476 | 17597331778346 | 17597332056586 | 17597332058540 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7f931f46d800 | 0x7f931ec24f00 | 131072 | 703060 | 78572800 | 17597332089789 | 17597332056586 | 17597332424266 | 17597332426101 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7f931f46d680 | 0x7f931ec24f40 | 65536 | 662214 | 74344912 | 17597332457410 | 17597332424266 | 17597332790346 | 17597332792111 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7f9321c13500 | 0x7f931ec24f80 | 131072 | 667848 | 74811800 | 17597332823461 | 17597332790346 | 17597333076107 | 17597333078104 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7f9321c13380 | 0x7f931ec24fc0 | 131072 | 670202 | 75058656 | 17597333109323 | 17597333076107 | 17597333368267 | 17597333370227 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7f9321c13200 | 0x7f931ec25000 | 131072 | 708088 | 79246456 | 17597333409146 | 17597333368267 | 17597333653547 | 17597333655430 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7f9321c13080 | 0x7f931ec25040 | 131072 | 704406 | 78916808 | 17597333688409 | 17597333653547 | 17597334019627 | 17597334021430 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7f931f46df00 | 0x7f931ec25080 | 65536 | 676510 | 75787792 | 17597334053709 | 17597334019627 | 17597334404587 | 17597334406740 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7f931f46dd80 | 0x7f931ec250c0 | 131072 | 708676 | 79361680 | 17597334438370 | 17597334404587 | 17597334688428 | 17597334690223 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7f931f46dc00 | 0x7f931ec25100 | 131072 | 703188 | 78758032 | 17597334721262 | 17597334688428 | 17597334986828 | 17597334988716 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7f931f46da80 | 0x7f931ec25140 | 131072 | 711374 | 79750704 | 17597335038064 | 17597334986828 | 17597335266988 | 17597335269488 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7f931f46d900 | 0x7f931ec25180 | 131072 | 709356 | 79350424 | 17597335302398 | 17597335266988 | 17597335641228 | 17597335643189 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7f931f46d780 | 0x7f931ec251c0 | 65536 | 665750 | 74682744 | 17597335674408 | 17597335641228 | 17597336012428 | 17597336014399 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7f931f46d600 | 0x7f931ec25200 | 131072 | 692582 | 77599992 | 17597336045289 | 17597336012428 | 17597336290989 | 17597336293122 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7f9321c13480 | 0x7f931ec25240 | 131072 | 702280 | 78569912 | 17597336324782 | 17597336290989 | 17597336592269 | 17597336594275 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7f9321c13300 | 0x7f931ec25280 | 131072 | 693860 | 77791912 | 17597336633174 | 17597336592269 | 17597336871629 | 17597336873568 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7f9321c13180 | 0x7f931ec252c0 | 131072 | 706080 | 79064344 | 17597336905237 | 17597336871629 | 17597337239629 | 17597337241428 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7f9321c13000 | 0x7f931ec25300 | 65536 | 666258 | 74630208 | 17597337273267 | 17597337239629 | 17597337603309 | 17597337605369 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7f931f46de80 | 0x7f931ec25340 | 131072 | 710070 | 79682480 | 17597337636328 | 17597337603309 | 17597337882670 | 17597337884502 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7f931f46dd00 | 0x7f931ec25380 | 131072 | 702104 | 78648408 | 17597337916431 | 17597337882670 | 17597338197070 | 17597338198944 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7f931f46db80 | 0x7f931ec253c0 | 131072 | 700538 | 78454816 | 17597338239503 | 17597338197070 | 17597338489870 | 17597338491926 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7f931f46da00 | 0x7f931ec25400 | 131072 | 666856 | 74761672 | 17597338524835 | 17597338489870 | 17597338860910 | 17597338862717 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7f931f46d880 | 0x7f931ec25440 | 65536 | 659098 | 73784752 | 17597338894486 | 17597338860910 | 17597339223950 | 17597339225938 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7f931f46d700 | 0x7f931ec25480 | 131072 | 662732 | 74236680 | 17597339257507 | 17597339223950 | 17597339502511 | 17597339504391 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7f9321c13580 | 0x7f931ec254c0 | 131072 | 667880 | 74684280 | 17597339536040 | 17597339502511 | 17597339817871 | 17597339819773 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7f9321c13400 | 0x7f931ec25500 | 131072 | 661066 | 74072560 | 17597339859702 | 17597339817871 | 17597340101391 | 17597340103275 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7f9321c13280 | 0x7f931ec25540 | 131072 | 710230 | 79482104 | 17597340135205 | 17597340101391 | 17597340468591 | 17597340470596 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7f9321c13100 | 0x7f931ec25580 | 65536 | 661678 | 74174808 | 17597340502315 | 17597340468591 | 17597340835951 | 17597340838057 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7f931f46df80 | 0x7f931ec255c0 | 131072 | 707212 | 79293872 | 17597340870236 | 17597340835951 | 17597341117872 | 17597341119770 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7f931f46de00 | 0x7f931ec25600 | 131072 | 699874 | 78369792 | 17597341151399 | 17597341117872 | 17597341439152 | 17597341441202 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7f931f46dc80 | 0x7f931ec25640 | 131072 | 725092 | 81096840 | 17597341479951 | 17597341439152 | 17597341719312 | 17597341721264 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7f931f46db00 | 0x7f931ec25680 | 131072 | 698688 | 78273480 | 17597341752264 | 17597341719312 | 17597342088272 | 17597342090355 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7f931f46d980 | 0x7f931ec256c0 | 65536 | 656586 | 73608176 | 17597342122474 | 17597342088272 | 17597342457712 | 17597342459566 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7f931f46d800 | 0x7f931ec25700 | 131072 | 698516 | 78338248 | 17597342490885 | 17597342457712 | 17597342740273 | 17597342742229 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7f931f46d680 | 0x7f931ec25740 | 131072 | 700370 | 78477592 | 17597342773698 | 17597342740273 | 17597343068753 | 17597343070740 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7f9321c13500 | 0x7f931ec25780 | 131072 | 730982 | 81860504 | 17597343108739 | 17597343068753 | 17597343346033 | 17597343347943 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7f9321c13380 | 0x7f931ec257c0 | 131072 | 703298 | 78797712 | 17597343380002 | 17597343346033 | 17597343712593 | 17597343714574 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7f9321c13200 | 0x7f931ec25800 | 65536 | 665594 | 74649432 | 17597343746363 | 17597343712593 | 17597344077713 | 17597344079695 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7f9321c13080 | 0x7f931ec25840 | 131072 | 660658 | 73990392 | 17597344110364 | 17597344077713 | 17597344363314 | 17597344365207 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7f931f46df00 | 0x7f931ec25880 | 131072 | 666714 | 74697072 | 17597344396947 | 17597344363314 | 17597344708914 | 17597344710799 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7f931f46dd80 | 0x7f931ec258c0 | 131072 | 1038386 | 116257656 | 17597344749948 | 17597344708914 | 17597345001554 | 17597345003581 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7f931f46dc00 | 0x7f931ec25900 | 131072 | 670534 | 75076112 | 17597345033950 | 17597345001554 | 17597345368114 | 17597345370072 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7f931f46da80 | 0x7f931ec25940 | 65536 | 666894 | 74621088 | 17597345400881 | 17597345368114 | 17597345735794 | 17597345737533 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7f931f46d900 | 0x7f931ec25980 | 131072 | 718126 | 80443832 | 17597345769252 | 17597345735794 | 17597346028915 | 17597346030965 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7f931f46d780 | 0x7f931ec259c0 | 131072 | 697842 | 78253680 | 17597346062644 | 17597346028915 | 17597346391315 | 17597346393496 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7f931f46d600 | 0x7f931ec25a00 | 131072 | 1031090 | 115861136 | 17597346433055 | 17597346391315 | 17597346675795 | 17597346677779 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7f9321c13480 | 0x7f931ec25a40 | 131072 | 705648 | 79054560 | 17597346708888 | 17597346675795 | 17597347044435 | 17597347046459 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7f9321c13300 | 0x7f931ec25a80 | 65536 | 670954 | 75064088 | 17597347078618 | 17597347044435 | 17597347409715 | 17597347411750 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7f9321c13180 | 0x7f931ec25ac0 | 131072 | 663496 | 74294224 | 17597347443289 | 17597347409715 | 17597347707476 | 17597347709542 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7f9321c13000 | 0x7f931ec25b00 | 131072 | 668400 | 74793240 | 17597347741332 | 17597347707476 | 17597348082676 | 17597348084693 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7f931f46de80 | 0x7f931ec25b40 | 131072 | 1026636 | 114897616 | 17597348123932 | 17597348082676 | 17597348373556 | 17597348375415 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7f931f46dd00 | 0x7f931ec25b80 | 131072 | 698430 | 78182680 | 17597348407765 | 17597348373556 | 17597348741236 | 17597348743166 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7f931f46db80 | 0x7f931ec25bc0 | 65536 | 683402 | 76514448 | 17597348774895 | 17597348741236 | 17597349113237 | 17597349115207 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7f931f46da00 | 0x7f931ec25c00 | 131072 | 672808 | 75413400 | 17597349146026 | 17597349113237 | 17597349420437 | 17597349422399 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7f931f46d880 | 0x7f931ec25c40 | 131072 | 671530 | 75195136 | 17597349454338 | 17597349420437 | 17597349812757 | 17597349833198 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7f931f46d700 | 0x7f931ec25c80 | 131072 | 1032970 | 115454920 | 17597349854798 | 17597349812757 | 17597350118357 | 17597350120291 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7f9321c13580 | 0x7f931ec25cc0 | 131072 | 676368 | 75721968 | 17597350151800 | 17597350118357 | 17597350490517 | 17597350492541 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7f9321c13400 | 0x7f931ec25d00 | 65536 | 669610 | 74897784 | 17597350524561 | 17597350490517 | 17597350858518 | 17597350860582 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7f9321c13280 | 0x7f931ec25d40 | 131072 | 668750 | 74900584 | 17597350892281 | 17597350858518 | 17597351182358 | 17597351184154 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7f9321c13100 | 0x7f931ec25d80 | 131072 | 670176 | 75023824 | 17597351216313 | 17597351182358 | 17597351598518 | 17597351620443 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7f931f46df80 | 0x7f931ec25dc0 | 131072 | 1001158 | 111996720 | 17597351639712 | 17597351598518 | 17597351922358 | 17597351924465 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7f931f46de00 | 0x7f931ec25e00 | 131072 | 697152 | 78221344 | 17597351955654 | 17597351922358 | 17597352300919 | 17597352304986 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7f931f46dc80 | 0x7f931ec25e40 | 65536 | 672452 | 75382408 | 17597352334805 | 17597352300919 | 17597352682039 | 17597352703415 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7f931f46db00 | 0x7f931ec25e80 | 131072 | 672120 | 75272112 | 17597352714855 | 17597352682039 | 17597353037559 | 17597353039557 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7f931f46d980 | 0x7f931ec25ec0 | 131072 | 670680 | 75082576 | 17597353070026 | 17597353037559 | 17597353507319 | 17597353526105 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7f931f46d800 | 0x7f931ec25f00 | 131072 | 1040348 | 116659016 | 17597353549374 | 17597353507319 | 17597353851959 | 17597353853856 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7f931f46d680 | 0x7f931ec25f40 | 131072 | 1006542 | 112700832 | 17597353885225 | 17597353851959 | 17597354245720 | 17597354269046 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7f9321c13500 | 0x7f931ec25f80 | 65536 | 671122 | 75258728 | 17597354281075 | 17597354245720 | 17597354660920 | 17597354680075 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7f9321c13380 | 0x7f931ec25fc0 | 131072 | 653696 | 73301256 | 17597354694815 | 17597354660920 | 17597355044280 | 17597355046316 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7f9321c13200 | 0x7f931ec26000 | 131072 | 666582 | 74693536 | 17597355078635 | 17597355044280 | 17597355565881 | 17597355608712 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7f9321c13080 | 0x7f931ec26040 | 131072 | 1041874 | 116597504 | 17597355629221 | 17597355565881 | 17597355946361 | 17597355948133 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7f931f46df00 | 0x7f931ec26080 | 131072 | 1032236 | 115775712 | 17597355980002 | 17597355946361 | 17597356360441 | 17597356403071 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7f931f46dd80 | 0x7f931ec260c0 | 65536 | 665294 | 74496584 | 17597356415051 | 17597356360441 | 17597356807481 | 17597356826960 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7f931f46dc00 | 0x7f931ec26100 | 131072 | 664030 | 74379976 | 17597356840870 | 17597356807481 | 17597357213242 | 17597357230970 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7f931f46da80 | 0x7f931ec26140 | 131072 | 681610 | 76317440 | 17597357247050 | 17597357213242 | 17597357791962 | 17597357810505 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7f931f46d900 | 0x7f931ec26180 | 131072 | 1042806 | 116904424 | 17597357833835 | 17597357791962 | 17597358175322 | 17597358177346 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7f931f46d780 | 0x7f931ec261c0 | 131072 | 1011952 | 113558168 | 17597358208925 | 17597358175322 | 17597358622682 | 17597358669334 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7f931f46d600 | 0x7f931ec26200 | 65536 | 664286 | 74368744 | 17597358681623 | 17597358622682 | 17597359095643 | 17597359137992 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7f9321c13480 | 0x7f931ec26240 | 131072 | 666756 | 74648400 | 17597359149211 | 17597359095643 | 17597359551643 | 17597359594280 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7f9321c13300 | 0x7f931ec26280 | 131072 | 1038062 | 116465224 | 17597359606080 | 17597359551643 | 17597360223003 | 17597360265703 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7f9321c13180 | 0x7f931ec262c0 | 131072 | 1045256 | 117014992 | 17597360286333 | 17597360223003 | 17597360665244 | 17597360707782 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7f9321c13000 | 0x7f931ec26300 | 131072 | 1007058 | 112558008 | 17597360719592 | 17597360665244 | 17597361182524 | 17597361224979 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7f931f46de80 | 0x7f931ec26340 | 65536 | 657532 | 73680936 | 17597361237358 | 17597361182524 | 17597361699164 | 17597361717576 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7f931f46dd00 | 0x7f931ec26380 | 131072 | 1005954 | 112684560 | 17597361732206 | 17597361699164 | 17597362190845 | 17597362239043 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7f931f46db80 | 0x7f931ec263c0 | 131072 | 1042374 | 116961312 | 17597362251443 | 17597362190845 | 17597362972445 | 17597363015383 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7f931f46da00 | 0x7f931ec26400 | 131072 | 1064520 | 119203776 | 17597363035773 | 17597362972445 | 17597363460285 | 17597363504371 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7f931f46d880 | 0x7f931ec26440 | 131072 | 1042964 | 116718240 | 17597363515870 | 17597363460285 | 17597364027806 | 17597364070626 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7f931f46d700 | 0x7f931ec26480 | 65536 | 663618 | 74381656 | 17597364083626 | 17597364027806 | 17597364592766 | 17597364635562 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7f9321c13580 | 0x7f931ec264c0 | 131072 | 1000220 | 112098968 | 17597364647432 | 17597364592766 | 17597365157886 | 17597365200478 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7f9321c13400 | 0x7f931ec26500 | 131072 | 1043906 | 116970336 | 17597365212197 | 17597365157886 | 17597366032927 | 17597366080735 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7f9321c13280 | 0x7f931ec26540 | 131072 | 1039030 | 116234576 | 17597366103624 | 17597366032927 | 17597366708287 | 17597366753068 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7f9321c13100 | 0x7f931ec26580 | 131072 | 1029336 | 115203056 | 17597366765068 | 17597366708287 | 17597367397408 | 17597367439831 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7f931f46df80 | 0x7f931ec265c0 | 65536 | 676850 | 75914936 | 17597367452270 | 17597367397408 | 17597368079328 | 17597368123053 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7f931f46de00 | 0x7f931ec26600 | 131072 | 1030904 | 115374280 | 17597368134303 | 17597368079328 | 17597368745249 | 17597368788626 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7f931f46dc80 | 0x7f931ec26640 | 131072 | 1030312 | 115314640 | 17597368800216 | 17597368745099 | 17597369840139 | 17597369888059 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7f931f46db00 | 0x7f931ec26680 | 131072 | 1030648 | 115399864 | 17597369908628 | 17597369840139 | 17597370924619 | 17597370974181 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7f931f46d980 | 0x7f931ec266c0 | 131072 | 1028750 | 115070680 | 17597370986871 | 17597370924619 | 17597372057579 | 17597372122792 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7f931f46d800 | 0x7f931ec26700 | 65536 | 667858 | 74772640 | 17597372135112 | 17597372057579 | 17597373192780 | 17597373258383 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7f931f46d680 | 0x7f931ec26740 | 131072 | 1048612 | 117538728 | 17597373270383 | 17597373192780 | 17597374307340 | 17597374377395 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7f9321c13500 | 0x7f931ec26780 | 131072 | 1042638 | 117104624 | 17597374390544 | 17597374307340 | 17597376275021 | 17597376340695 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7f9321c13380 | 0x7f931ec267c0 | 131072 | 1030956 | 115495896 | 17597376361114 | 17597376275021 | 17597378203661 | 17597378279105 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7f9321c13200 | 0x7f931ec26800 | 131072 | 1032982 | 115519584 | 17597378292145 | 17597378203661 | 17597380199502 | 17597380268425 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7f9321c13080 | 0x7f931ec26840 | 65536 | 672240 | 75212416 | 17597380281674 | 17597380199502 | 17597382174223 | 17597382243035 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7f931f46df00 | 0x7f931ec26880 | 131072 | 1041268 | 116482736 | 17597382255654 | 17597382174223 | 17597384122543 | 17597384191705 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 223075 | 223075 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7f931f46dd80 | 0x7f931ec268c0 | 131072 | 1045480 | 116818840 | 17597384204405 | 17597384122543 | 17597387742704 | 17597387818633 |