43 KiB
43 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | SQ_INSTS_VMEM | SQ_INST_LEVEL_VMEM | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBuffer.kd | 0 | 0 | 0 | 936686 | 936691 | 33554432 | 256 | 0 | 0 | 8 | 32 | 6464 | 0x0 | 0x7fa3b8c04180 | 1048576 | 11096456 | 1419911252 | 12076631726864889 | 12076631974434106 | 12076631974755065 | 12076631974864438 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 936686 | 936691 | 32768 | 256 | 0 | 0 | 24 | 24 | 12480 | 0x0 | 0x7fa3b8c35100 | 4096 | 107784 | 13788356 | 12076631989518086 | 12076631989806097 | 12076631989812497 | 12076631989817693 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 4 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 12928 | 0x7fa4c491a900 | 0x7fa3b8c35140 | 524288 | 10667896 | 1365491840 | 12076631989877063 | 12076631990100976 | 12076631990238896 | 12076631990242964 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 6 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 36 | 24 | 13632 | 0x7fa4c491a800 | 0x7fa3b8c35180 | 524288 | 13037531 | 1668759720 | 12076631990314367 | 12076631990488335 | 12076631990742414 | 12076631990810750 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 8 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 14080 | 0x7fa4c491a700 | 0x7fa3b8c351c0 | 524288 | 13959441 | 1786798668 | 12076631990847188 | 12076631991030093 | 12076631991286732 | 12076631991355774 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 10 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14528 | 0x7fa4c491a600 | 0x7fa3b8c35200 | 524288 | 10689784 | 1368193348 | 12076631991381402 | 12076631991568812 | 12076631991707211 | 12076631991710684 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 12 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14976 | 0x7fa4c491a500 | 0x7fa3b8c35240 | 524288 | 10655940 | 1363974456 | 12076631991762390 | 12076631991925130 | 12076631992064170 | 12076631992067828 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 14 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 15424 | 0x7fa4c491a400 | 0x7fa3b8c35280 | 524288 | 11186260 | 1431745012 | 12076631992148108 | 12076631992322569 | 12076631992459369 | 12076631992462773 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 16 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16128 | 0x7fa4c491a300 | 0x7fa3b8c352c0 | 524288 | 13594400 | 1740078036 | 12076631992511934 | 12076631992691208 | 12076631992944807 | 12076631992987780 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 18 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16832 | 0x7fa4c491aa00 | 0x7fa3b8c35300 | 524288 | 14091881 | 1803759428 | 12076631993018276 | 12076631993203366 | 12076631993497925 | 12076631993540698 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 20 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 17536 | 0x7fa4c491a900 | 0x7fa3b8c35340 | 524288 | 12434664 | 1591612184 | 12076631993566897 | 12076631993763365 | 12076631993894724 | 12076631993898233 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 22 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18240 | 0x7fa4c491a800 | 0x7fa3b8c35380 | 524288 | 13287858 | 1700833736 | 12076631993952885 | 12076631994123684 | 12076631994252003 | 12076631994255778 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 24 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18944 | 0x7fa4c491a700 | 0x7fa3b8c353c0 | 524288 | 12675209 | 1622335436 | 12076631994322272 | 12076631994486722 | 12076631994617762 | 12076631994621148 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 26 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 19904 | 0x7fa4c491a600 | 0x7fa3b8c35400 | 524288 | 13780254 | 1763880268 | 12076631994671482 | 12076631994836801 | 12076631995091841 | 12076631995161984 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 28 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 20608 | 0x7fa4c491a500 | 0x7fa3b8c35440 | 524288 | 14284271 | 1828348304 | 12076631995189024 | 12076631995374080 | 12076631995622399 | 12076631995689605 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 30 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 21312 | 0x7fa4c491a400 | 0x7fa3b8c35480 | 524288 | 12727172 | 1629027216 | 12076631995716886 | 12076631995897598 | 12076631996026878 | 12076631996030650 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 32 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22016 | 0x7fa4c491a300 | 0x7fa3b8c354c0 | 524288 | 11350987 | 1452996020 | 12076631996079160 | 12076631996249757 | 12076631996385277 | 12076631996388806 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 34 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22720 | 0x7fa4c491aa00 | 0x7fa3b8c35500 | 524288 | 12579972 | 1610252068 | 12076631996452134 | 12076631996616476 | 12076631996747355 | 12076631996750779 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 36 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 23680 | 0x7fa4c491a900 | 0x7fa3b8c35540 | 524288 | 12812013 | 1639861484 | 12076631996800953 | 12076631996964635 | 12076631997225914 | 12076631997294401 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 38 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 24384 | 0x7fa4c491a800 | 0x7fa3b8c35580 | 524288 | 13955090 | 1786187824 | 12076631997317964 | 12076631997507513 | 12076631997761112 | 12076631997828504 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 40 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25088 | 0x7fa4c491a700 | 0x7fa3b8c355c0 | 524288 | 12648248 | 1618952704 | 12076631997855043 | 12076631998038071 | 12076631998168471 | 12076631998172133 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 42 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25792 | 0x7fa4c491a600 | 0x7fa3b8c35600 | 524288 | 11189762 | 1432283564 | 12076631998221645 | 12076631998396150 | 12076631998532150 | 12076631998535780 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 44 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 26496 | 0x7fa4c491a500 | 0x7fa3b8c35640 | 524288 | 13050016 | 1670295384 | 12076631998597074 | 12076631998758549 | 12076631998887829 | 12076631998891311 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 46 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 27712 | 0x7fa4c491a400 | 0x7fa3b8c35680 | 524288 | 13693562 | 1752750104 | 12076631998942657 | 12076631999114228 | 12076631999373427 | 12076631999443258 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 48 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 28416 | 0x7fa4c491a300 | 0x7fa3b8c356c0 | 524288 | 13879294 | 1776540664 | 12076631999467823 | 12076631999648466 | 12076631999905266 | 12076631999972562 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 50 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 29120 | 0x7fa4c491aa00 | 0x7fa3b8c35700 | 524288 | 12094408 | 1547985556 | 12076631999999783 | 12076632000180625 | 12076632000313424 | 12076632000317183 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 52 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30080 | 0x7fa4c491a900 | 0x7fa3b8c35740 | 524288 | 12382294 | 1584924164 | 12076632000369150 | 12076632000527984 | 12076632000660783 | 12076632000664299 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 54 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30784 | 0x7fa4c491a800 | 0x7fa3b8c35780 | 524288 | 12566523 | 1608501928 | 12076632000726465 | 12076632000889582 | 12076632001020462 | 12076632001024289 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 56 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32000 | 0x7fa4c491a700 | 0x7fa3b8c357c0 | 524288 | 13388619 | 1713662940 | 12076632001073971 | 12076632001253581 | 12076632001515181 | 12076632001582848 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 58 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32960 | 0x7fa4c491a600 | 0x7fa3b8c35800 | 524288 | 13637840 | 1745632680 | 12076632001609788 | 12076632001788940 | 12076632002041419 | 12076632002112032 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 60 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 33920 | 0x7fa4c491a500 | 0x7fa3b8c35840 | 524288 | 12761042 | 1633355396 | 12076632002136287 | 12076632002318218 | 12076632002449418 | 12076632002452956 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 62 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 34880 | 0x7fa4c491a400 | 0x7fa3b8c35880 | 524288 | 11217114 | 1435872640 | 12076632002504522 | 12076632002667817 | 12076632002804457 | 12076632002807966 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 64 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 35840 | 0x7fa4c491a300 | 0x7fa3b8c358c0 | 524288 | 12495035 | 1599387404 | 12076632002871154 | 12076632003039816 | 12076632003171175 | 12076632003175119 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 66 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 37312 | 0x7fa4c491aa00 | 0x7fa3b8c35900 | 524288 | 13371610 | 1711527468 | 12076632003225263 | 12076632003396935 | 12076632003654534 | 12076632003722938 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 68 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 38272 | 0x7fa4c491a900 | 0x7fa3b8c35940 | 524288 | 13837964 | 1771234508 | 12076632003750319 | 12076632003928293 | 12076632004184292 | 12076632004253135 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 70 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 39232 | 0x7fa4c491a800 | 0x7fa3b8c35980 | 524288 | 11566995 | 1480559520 | 12076632004281047 | 12076632004459811 | 12076632004595651 | 12076632004599128 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 72 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 40192 | 0x7fa4c491a700 | 0x7fa3b8c359c0 | 524288 | 12757724 | 1633023048 | 12076632004649241 | 12076632004829410 | 12076632004961250 | 12076632004964899 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 74 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 41152 | 0x7fa4c491a600 | 0x7fa3b8c35a00 | 524288 | 12429876 | 1590980968 | 12076632005032524 | 12076632005197249 | 12076632005327329 | 12076632005331040 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 76 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 42624 | 0x7fa4c491a500 | 0x7fa3b8c35a40 | 524288 | 13457016 | 1722474288 | 12076632005381123 | 12076632005545568 | 12076632005801887 | 12076632005870243 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 78 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 43584 | 0x7fa4c491a400 | 0x7fa3b8c35a80 | 524288 | 13657110 | 1748062052 | 12076632005893145 | 12076632006076446 | 12076632006336766 | 12076632006406029 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 80 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 44544 | 0x7fa4c491a300 | 0x7fa3b8c35ac0 | 524288 | 12748746 | 1631856924 | 12076632006432769 | 12076632006608285 | 12076632006739324 | 12076632006742946 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 82 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 45760 | 0x7fa4c491aa00 | 0x7fa3b8c35b00 | 524288 | 10426734 | 1334713616 | 12076632006792678 | 12076632006956444 | 12076632007096923 | 12076632007100561 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 84 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 46720 | 0x7fa4c491a900 | 0x7fa3b8c35b40 | 524288 | 12588625 | 1611260212 | 12076632007163057 | 12076632007324762 | 12076632007455162 | 12076632007458918 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 86 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 48448 | 0x7fa4c491a800 | 0x7fa3b8c35b80 | 524288 | 13875290 | 1776031308 | 12076632007510233 | 12076632007673401 | 12076632007938201 | 12076632008013810 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 88 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 49408 | 0x7fa4c491a700 | 0x7fa3b8c35bc0 | 524288 | 14085119 | 1802903820 | 12076632008038195 | 12076632008219640 | 12076632008474999 | 12076632008545379 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 90 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 50368 | 0x7fa4c491a600 | 0x7fa3b8c35c00 | 524288 | 13172884 | 1686138416 | 12076632008567961 | 12076632008750518 | 12076632008878358 | 12076632008881915 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 92 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 51584 | 0x7fa4c491a500 | 0x7fa3b8c35c40 | 524288 | 10440186 | 1336242800 | 12076632008932238 | 12076632009099157 | 12076632009238677 | 12076632009242375 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 94 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 52544 | 0x7fa4c491a400 | 0x7fa3b8c35c80 | 524288 | 12648685 | 1619016092 | 12076632009305503 | 12076632009466676 | 12076632009597075 | 12076632009600642 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 96 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 54272 | 0x7fa4c491a300 | 0x7fa3b8c35cc0 | 524288 | 13896022 | 1778697304 | 12076632009650184 | 12076632009812115 | 12076632010083474 | 12076632010152879 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 98 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 55488 | 0x7fa4c491aa00 | 0x7fa3b8c35d00 | 524288 | 13695447 | 1753024176 | 12076632010178286 | 12076632010361073 | 12076632010657072 | 12076632010724733 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 100 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 56704 | 0x7fa4c491a900 | 0x7fa3b8c35d40 | 524288 | 11033413 | 1412272048 | 12076632010749959 | 12076632010926031 | 12076632011063791 | 12076632011067530 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 102 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 58176 | 0x7fa4c491a800 | 0x7fa3b8c35d80 | 524288 | 9420400 | 1205790712 | 12076632011118144 | 12076632011282030 | 12076632011424750 | 12076632011428281 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 104 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 59392 | 0x7fa4c491a700 | 0x7fa3b8c35dc0 | 524288 | 12316996 | 1576606928 | 12076632011489926 | 12076632011651469 | 12076632011784749 | 12076632011788612 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 106 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 61376 | 0x7fa4c491a600 | 0x7fa3b8c35e00 | 524288 | 13748793 | 1759803552 | 12076632011838214 | 12076632012000748 | 12076632012271627 | 12076632012314850 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 108 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 62592 | 0x7fa4c491a500 | 0x7fa3b8c35e40 | 524288 | 13590756 | 1739682560 | 12076632012338805 | 12076632012523946 | 12076632012781865 | 12076632012847862 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 110 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 63808 | 0x7fa4c491a400 | 0x7fa3b8c35e80 | 524288 | 11638260 | 1489764796 | 12076632012876605 | 12076632013057385 | 12076632013191624 | 12076632013195368 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 112 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 65280 | 0x7fa4c491a300 | 0x7fa3b8c35ec0 | 524288 | 8879909 | 1136630552 | 12076632013244410 | 12076632013414664 | 12076632013553863 | 12076632013557342 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 114 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 66496 | 0x7fa4c491aa00 | 0x7fa3b8c35f00 | 524288 | 12450878 | 1593642436 | 12076632013619327 | 12076632013782502 | 12076632013914022 | 12076632013917592 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 116 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 68480 | 0x7fa4c491a900 | 0x7fa3b8c35f40 | 524288 | 13561968 | 1735908564 | 12076632013966843 | 12076632014138341 | 12076632014398660 | 12076632014467595 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 118 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 69696 | 0x7fa4c491a800 | 0x7fa3b8c35f80 | 524288 | 13479846 | 1725387392 | 12076632014493673 | 12076632014671140 | 12076632014928259 | 12076632014995086 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 120 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 70912 | 0x7fa4c491a700 | 0x7fa3b8c35fc0 | 524288 | 11674039 | 1494197704 | 12076632015027055 | 12076632015203458 | 12076632015338978 | 12076632015342612 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 122 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 72384 | 0x7fa4c491a600 | 0x7fa3b8c36000 | 524288 | 7078457 | 906093676 | 12076632015391303 | 12076632015556257 | 12076632015695616 | 12076632015699256 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 124 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 73600 | 0x7fa4c491a500 | 0x7fa3b8c36040 | 524288 | 12426427 | 1590556356 | 12076632015761031 | 12076632015922496 | 12076632016054335 | 12076632016058193 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 126 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 75840 | 0x7fa4c491a400 | 0x7fa3b8c36080 | 524288 | 12975973 | 1660968428 | 12076632016108226 | 12076632016285695 | 12076632016554494 | 12076632016603939 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 128 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 77056 | 0x7fa4c491a300 | 0x7fa3b8c360c0 | 524288 | 13050721 | 1670492132 | 12076632016628494 | 12076632016805693 | 12076632017062332 | 12076632017113046 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 130 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 78272 | 0x7fa4c491aa00 | 0x7fa3b8c36100 | 524288 | 12464778 | 1595380240 | 12076632017137361 | 12076632017318171 | 12076632017450171 | 12076632017453789 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 132 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 80000 | 0x7fa4c491a900 | 0x7fa3b8c36140 | 524288 | 7302888 | 934678224 | 12076632017502510 | 12076632017665210 | 12076632017809850 | 12076632017813499 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 134 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 81216 | 0x7fa4c491a800 | 0x7fa3b8c36180 | 524288 | 11572968 | 1481327076 | 12076632017875514 | 12076632018041049 | 12076632018175609 | 12076632018179459 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 136 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 83456 | 0x7fa4c491a700 | 0x7fa3b8c361c0 | 524288 | 12964342 | 1659505604 | 12076632018229482 | 12076632018400248 | 12076632018662807 | 12076632018712851 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 138 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 84928 | 0x7fa4c491a600 | 0x7fa3b8c36200 | 524288 | 13652339 | 1747483944 | 12076632018736005 | 12076632018914966 | 12076632019171606 | 12076632019222810 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 140 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 86400 | 0x7fa4c491a500 | 0x7fa3b8c36240 | 524288 | 11193312 | 1432687492 | 12076632019250552 | 12076632019427445 | 12076632019563604 | 12076632019567371 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 142 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 88128 | 0x7fa4c491a400 | 0x7fa3b8c36280 | 524288 | 5695137 | 728931472 | 12076632019618155 | 12076632019777844 | 12076632019928883 | 12076632019932670 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 144 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 89600 | 0x7fa4c491a300 | 0x7fa3b8c362c0 | 524288 | 10959406 | 1402768040 | 12076632020023449 | 12076632020184722 | 12076632020322482 | 12076632020326072 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 146 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 92096 | 0x7fa4c491aa00 | 0x7fa3b8c36300 | 524288 | 12813072 | 1640044404 | 12076632020376556 | 12076632020546321 | 12076632020815280 | 12076632020865185 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 148 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 93568 | 0x7fa4c491a900 | 0x7fa3b8c36340 | 524288 | 13523973 | 1730967548 | 12076632020890813 | 12076632021071920 | 12076632021327119 | 12076632021377628 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 150 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 95040 | 0x7fa4c491a800 | 0x7fa3b8c36380 | 524288 | 11713883 | 1499301460 | 12076632021405300 | 12076632021581678 | 12076632021716558 | 12076632021720466 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 152 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 96768 | 0x7fa4c491a700 | 0x7fa3b8c363c0 | 524288 | 4941367 | 632540184 | 12076632021771761 | 12076632021934157 | 12076632022093836 | 12076632022097567 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 154 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 98240 | 0x7fa4c491a600 | 0x7fa3b8c36400 | 524288 | 10799652 | 1382412612 | 12076632022161166 | 12076632022331916 | 12076632022469195 | 12076632022472986 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 156 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 100736 | 0x7fa4c491a500 | 0x7fa3b8c36440 | 524288 | 11637447 | 1489586852 | 12076632022522528 | 12076632022686955 | 12076632022955594 | 12076632022979057 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 158 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 102208 | 0x7fa4c491a400 | 0x7fa3b8c36480 | 524288 | 12905568 | 1651914172 | 12076632023026165 | 12076632023186793 | 12076632023443592 | 12076632023494265 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 160 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 103680 | 0x7fa4c491a300 | 0x7fa3b8c364c0 | 524288 | 11704822 | 1498183668 | 12076632023519052 | 12076632023693352 | 12076632023827911 | 12076632023831653 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 162 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 105664 | 0x7fa4c491aa00 | 0x7fa3b8c36500 | 524288 | 3762652 | 481574592 | 12076632023882107 | 12076632024057190 | 12076632024222470 | 12076632024226297 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 164 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 107136 | 0x7fa4c491a900 | 0x7fa3b8c36540 | 524288 | 12605205 | 1613459792 | 12076632024292961 | 12076632024473029 | 12076632024604069 | 12076632024607827 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 166 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 109888 | 0x7fa4c491a800 | 0x7fa3b8c36580 | 524288 | 10444034 | 1336771500 | 12076632024656838 | 12076632024826308 | 12076632025090787 | 12076632025141429 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 168 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 111360 | 0x7fa4c491a700 | 0x7fa3b8c365c0 | 524288 | 13406164 | 1715990536 | 12076632025164843 | 12076632025347266 | 12076632025605986 | 12076632025653522 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 170 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 112832 | 0x7fa4c491a600 | 0x7fa3b8c36600 | 524288 | 11540052 | 1477134588 | 12076632025682526 | 12076632025854945 | 12076632025989344 | 12076632025993064 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 172 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 114816 | 0x7fa4c491a500 | 0x7fa3b8c36640 | 524288 | 3620430 | 463424412 | 12076632026044579 | 12076632026209184 | 12076632026383263 | 12076632026387066 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 174 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 116288 | 0x7fa4c491a400 | 0x7fa3b8c36680 | 524288 | 11668692 | 1493571988 | 12076632026449573 | 12076632026609982 | 12076632026745982 | 12076632026749681 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 176 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 119040 | 0x7fa4c491a300 | 0x7fa3b8c366c0 | 524288 | 8056353 | 1031230972 | 12076632026798572 | 12076632026965501 | 12076632027230941 | 12076632027282121 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 178 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 120768 | 0x7fa4c491aa00 | 0x7fa3b8c36700 | 524288 | 13749320 | 1759956576 | 12076632027305415 | 12076632027492220 | 12076632027752699 | 12076632027799995 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 180 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 122496 | 0x7fa4c491a900 | 0x7fa3b8c36740 | 524288 | 10784351 | 1380429000 | 12076632027826113 | 12076632028002458 | 12076632028141818 | 12076632028145487 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 182 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 124736 | 0x7fa4c491a800 | 0x7fa3b8c36780 | 524288 | 3311186 | 423791844 | 12076632028195270 | 12076632028364217 | 12076632028547096 | 12076632028550881 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 184 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 126464 | 0x7fa4c491a700 | 0x7fa3b8c367c0 | 524288 | 11121544 | 1423671032 | 12076632028615211 | 12076632028774776 | 12076632028912055 | 12076632028915730 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 186 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 127936 | 0x7fa4c491a600 | 0x7fa3b8c36800 | 524288 | 4286397 | 548630380 | 12076632028964851 | 12076632029138615 | 12076632029404534 | 12076632029428644 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 188 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 129664 | 0x7fa4c491a500 | 0x7fa3b8c36840 | 524288 | 13462371 | 1723138352 | 12076632029470582 | 12076632029629973 | 12076632029893652 | 12076632029940606 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 190 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 131392 | 0x7fa4c491a400 | 0x7fa3b8c36880 | 524288 | 12055338 | 1543171640 | 12076632029965813 | 12076632030148691 | 12076632030281971 | 12076632030285869 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 192 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 133632 | 0x7fa4c491a300 | 0x7fa3b8c368c0 | 524288 | 3580745 | 458347708 | 12076632030335832 | 12076632030500690 | 12076632030693010 | 12076632030740785 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 194 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 135360 | 0x7fa4c491aa00 | 0x7fa3b8c36900 | 524288 | 10762855 | 1377632076 | 12076632030778806 | 12076632030936049 | 12076632031074929 | 12076632031078844 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 196 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 136832 | 0x7fa4c491a900 | 0x7fa3b8c36940 | 524288 | 2965668 | 379544784 | 12076632031129438 | 12076632031301968 | 12076632031587567 | 12076632031637383 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 198 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 138560 | 0x7fa4c491a800 | 0x7fa3b8c36980 | 524288 | 13724870 | 1756829964 | 12076632031664984 | 12076632031841006 | 12076632032101005 | 12076632032149555 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 200 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 140288 | 0x7fa4c491a700 | 0x7fa3b8c369c0 | 524288 | 12556783 | 1607226172 | 12076632032177487 | 12076632032353645 | 12076632032486924 | 12076632032490890 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 202 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 142784 | 0x7fa4c491a600 | 0x7fa3b8c36a00 | 524288 | 3509537 | 449168532 | 12076632032541094 | 12076632032703083 | 12076632032913163 | 12076632032960313 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 204 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 144768 | 0x7fa4c491a500 | 0x7fa3b8c36a40 | 524288 | 9577535 | 1225947856 | 12076632032998785 | 12076632033167082 | 12076632033310442 | 12076632033314402 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 206 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 145728 | 0x7fa4c491a400 | 0x7fa3b8c36a80 | 524288 | 2549341 | 326373608 | 12076632033365447 | 12076632033528041 | 12076632033835560 | 12076632033882228 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 208 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 147712 | 0x7fa4c491a300 | 0x7fa3b8c36ac0 | 524288 | 13938329 | 1784048764 | 12076632033904650 | 12076632034089479 | 12076632034352038 | 12076632034402696 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 210 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 149696 | 0x7fa4c491aa00 | 0x7fa3b8c36b00 | 524288 | 9647066 | 1234926464 | 12076632034426060 | 12076632034604838 | 12076632034744357 | 12076632034748249 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 212 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 152192 | 0x7fa4c491a900 | 0x7fa3b8c36b40 | 524288 | 3497597 | 447756936 | 12076632034796669 | 12076632034959076 | 12076632035187236 | 12076632035237569 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 214 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 154176 | 0x7fa4c491a800 | 0x7fa3b8c36b80 | 524288 | 10935167 | 1399592344 | 12076632035275720 | 12076632035441315 | 12076632035577155 | 12076632035581098 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 216 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 155648 | 0x7fa4c491a700 | 0x7fa3b8c36bc0 | 524288 | 2487821 | 318415480 | 12076632035630039 | 12076632035796354 | 12076632036126913 | 12076632036176236 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 218 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 157632 | 0x7fa4c491a600 | 0x7fa3b8c36c00 | 524288 | 13487975 | 1726388348 | 12076632036200771 | 12076632036381632 | 12076632036638911 | 12076632036686435 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 220 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 159616 | 0x7fa4c491a500 | 0x7fa3b8c36c40 | 524288 | 10837100 | 1387119932 | 12076632036712363 | 12076632036887390 | 12076632037028510 | 12076632037032228 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 222 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 162368 | 0x7fa4c491a400 | 0x7fa3b8c36c80 | 524288 | 3418032 | 437393740 | 12076632037082782 | 12076632037247576 | 12076632037493816 | 12076632037520967 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 224 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 164608 | 0x7fa4c491a300 | 0x7fa3b8c36cc0 | 524288 | 9739267 | 1246664408 | 12076632037571831 | 12076632037734934 | 12076632037875574 | 12076632037878542 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 226 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 166336 | 0x7fa4c491aa00 | 0x7fa3b8c36d00 | 524288 | 2392954 | 306166508 | 12076632037926591 | 12076632038102133 | 12076632038479893 | 12076632038529072 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 228 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 168576 | 0x7fa4c491a900 | 0x7fa3b8c36d40 | 524288 | 11973629 | 1532529168 | 12076632038558877 | 12076632038733492 | 12076632038999891 | 12076632039047356 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 230 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 170816 | 0x7fa4c491a800 | 0x7fa3b8c36d80 | 524288 | 9364067 | 1198516552 | 12076632039084305 | 12076632039248691 | 12076632039388531 | 12076632039391546 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 232 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 174080 | 0x7fa4c491a700 | 0x7fa3b8c36dc0 | 524288 | 3430122 | 439102892 | 12076632039440808 | 12076632039615090 | 12076632039895090 | 12076632039917334 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 234 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 176576 | 0x7fa4c491a600 | 0x7fa3b8c36e00 | 524288 | 8700235 | 1113566308 | 12076632039971595 | 12076632040143409 | 12076632040283249 | 12076632040286551 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 236 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 177792 | 0x7fa4c491a500 | 0x7fa3b8c36e40 | 524288 | 2361529 | 302112880 | 12076632040336604 | 12076632040499408 | 12076632040947727 | 12076632040994448 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 238 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 180288 | 0x7fa4c491a400 | 0x7fa3b8c36e80 | 524288 | 10828654 | 1386005372 | 12076632041026187 | 12076632041206767 | 12076632041475406 | 12076632041522701 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 240 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 182784 | 0x7fa4c491a300 | 0x7fa3b8c36ec0 | 524288 | 7486533 | 958334076 | 12076632041549200 | 12076632041729006 | 12076632041869006 | 12076632041871770 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 242 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 186304 | 0x7fa4c491aa00 | 0x7fa3b8c36f00 | 524288 | 3449786 | 441526416 | 12076632041920781 | 12076632042089965 | 12076632042405644 | 12076632042455185 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 244 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 189312 | 0x7fa4c491a900 | 0x7fa3b8c36f40 | 524288 | 4153049 | 531489656 | 12076632042496352 | 12076632042660524 | 12076632042814124 | 12076632042817058 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 246 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 190784 | 0x7fa4c491a800 | 0x7fa3b8c36f80 | 524288 | 2386279 | 305359020 | 12076632042866139 | 12076632043043563 | 12076632043563402 | 12076632043613570 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 248 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 193792 | 0x7fa4c491a700 | 0x7fa3b8c36fc0 | 524288 | 7969875 | 1020139468 | 12076632043638085 | 12076632043818442 | 12076632044118121 | 12076632044167029 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 250 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 196800 | 0x7fa4c491a600 | 0x7fa3b8c37000 | 524288 | 3407015 | 435995508 | 12076632044190914 | 12076632044376840 | 12076632044532040 | 12076632044535024 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 252 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 201088 | 0x7fa4c491a500 | 0x7fa3b8c37040 | 524288 | 3473919 | 444763716 | 12076632044584306 | 12076632044752360 | 12076632045163879 | 12076632045187578 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 254 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 204608 | 0x7fa4c491a400 | 0x7fa3b8c37080 | 524288 | 3272315 | 418740372 | 12076632045246337 | 12076632045413478 | 12076632045590598 | 12076632045594014 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 256 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 206080 | 0x7fa4c491a300 | 0x7fa3b8c370c0 | 524288 | 2294983 | 293732696 | 12076632045643756 | 12076632045807557 | 12076632046418916 | 12076632046469482 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 258 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 209600 | 0x7fa4c491aa00 | 0x7fa3b8c37100 | 524288 | 4396336 | 562643820 | 12076632046492745 | 12076632046680036 | 12076632047007875 | 12076632047056684 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 260 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 213120 | 0x7fa4c491a900 | 0x7fa3b8c37140 | 524288 | 3356672 | 429650728 | 12076632047089546 | 12076632047260994 | 12076632047440194 | 12076632047443404 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 262 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 218176 | 0x7fa4c491a800 | 0x7fa3b8c37180 | 524288 | 3698088 | 473353416 | 12076632047493357 | 12076632047655714 | 12076632048111233 | 12076632048160708 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 264 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 222208 | 0x7fa4c491a700 | 0x7fa3b8c371c0 | 524288 | 3115363 | 398663524 | 12076632048197096 | 12076632048360512 | 12076632048560352 | 12076632048608731 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 266 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 223936 | 0x7fa4c491a600 | 0x7fa3b8c37200 | 524288 | 2353399 | 301326212 | 12076632048638747 | 12076632048819391 | 12076632049524030 | 12076632049574578 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 268 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 227968 | 0x7fa4c491a500 | 0x7fa3b8c37240 | 524288 | 3759297 | 481240984 | 12076632049597982 | 12076632049780989 | 12076632050154908 | 12076632050204870 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 270 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 232000 | 0x7fa4c491a400 | 0x7fa3b8c37280 | 524288 | 3337562 | 427130436 | 12076632050230498 | 12076632050409788 | 12076632050614107 | 12076632050661219 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 272 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 237824 | 0x7fa4c491a300 | 0x7fa3b8c372c0 | 524288 | 4483183 | 573876308 | 12076632050687679 | 12076632050863067 | 12076632051389626 | 12076632051440479 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 274 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 242368 | 0x7fa4c491aa00 | 0x7fa3b8c37300 | 524288 | 3191474 | 408441500 | 12076632051481154 | 12076632051645305 | 12076632051870265 | 12076632051916845 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 276 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 243584 | 0x7fa4c491a900 | 0x7fa3b8c37340 | 524288 | 2314303 | 296064368 | 12076632051943294 | 12076632052123864 | 12076632052925143 | 12076632052974532 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 278 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 248128 | 0x7fa4c491a800 | 0x7fa3b8c37380 | 524288 | 3330637 | 426356880 | 12076632052998307 | 12076632053183222 | 12076632053605461 | 12076632053655018 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 280 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 252672 | 0x7fa4c491a700 | 0x7fa3b8c373c0 | 524288 | 3178098 | 406760076 | 12076632053678402 | 12076632053858101 | 12076632054084020 | 12076632054134019 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 282 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 259264 | 0x7fa4c491a600 | 0x7fa3b8c37400 | 524288 | 4681601 | 599231332 | 12076632054161791 | 12076632054342900 | 12076632054940659 | 12076632054989581 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 284 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 264832 | 0x7fa4c491a500 | 0x7fa3b8c37440 | 524288 | 3300771 | 422651168 | 12076632055030657 | 12076632055198738 | 12076632055468177 | 12076632055518154 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 286 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 266304 | 0x7fa4c491a400 | 0x7fa3b8c37480 | 524288 | 2318734 | 296756940 | 12076632055546176 | 12076632055725617 | 12076632056713135 | 12076632056783137 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 288 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 28 | 24 | 271872 | 0x7fa4c491a300 | 0x7fa3b8c374c0 | 524288 | 3537473 | 452802788 | 12076632056818092 | 12076632056985934 | 12076632057502733 | 12076632057571854 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 290 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 277440 | 0x7fa4c491aa00 | 0x7fa3b8c37500 | 524288 | 3306185 | 423158436 | 12076632057603863 | 12076632057780493 | 12076632058053772 | 12076632058122468 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 292 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 12 | 24 | 279936 | 0x7fa4c491a900 | 0x7fa3b8c37540 | 524288 | 2211182 | 283065684 | 12076632058155329 | 12076632058324332 | 12076632059063530 | 12076632059131936 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 294 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 286528 | 0x7fa4c491a800 | 0x7fa3b8c37580 | 524288 | 3343527 | 427946244 | 12076632059175547 | 12076632059338729 | 12076632059655529 | 12076632059722444 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 296 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 288000 | 0x7fa4c491a700 | 0x7fa3b8c375c0 | 524288 | 2272972 | 290999932 | 12076632059747401 | 12076632059928968 | 12076632061102246 | 12076632061171640 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 298 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 32 | 24 | 294592 | 0x7fa4c491a600 | 0x7fa3b8c37600 | 524288 | 3455071 | 442240716 | 12076632061201365 | 12076632061387525 | 12076632061996164 | 12076632062064481 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 300 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 301184 | 0x7fa4c491a500 | 0x7fa3b8c37640 | 524288 | 3344160 | 428037120 | 12076632062093996 | 12076632062276483 | 12076632062596643 | 12076632062663014 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 302 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 12 | 24 | 304960 | 0x7fa4c491a400 | 0x7fa3b8c37680 | 524288 | 2215325 | 283556952 | 12076632062686568 | 12076632062871682 | 12076632063751680 | 12076632063820357 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 304 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 24 | 24 | 313600 | 0x7fa4c491a300 | 0x7fa3b8c376c0 | 524288 | 3332364 | 426460868 | 12076632063861203 | 12076632064032160 | 12076632064444959 | 12076632064513807 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 306 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 314816 | 0x7fa4c491aa00 | 0x7fa3b8c37700 | 524288 | 2296507 | 293956708 | 12076632064536629 | 12076632064719038 | 12076632066269595 | 12076632066338411 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 308 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 317568 | 0x7fa4c491a900 | 0x7fa3b8c37740 | 524288 | 2267842 | 290215000 | 12076632066369378 | 12076632066552955 | 12076632067348313 | 12076632067416947 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 310 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 12 | 24 | 320320 | 0x7fa4c491a800 | 0x7fa3b8c37780 | 524288 | 2156090 | 275898460 | 12076632067446322 | 12076632067628632 | 12076632068067031 | 12076632068135273 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 312 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 12 | 24 | 324096 | 0x7fa4c491a700 | 0x7fa3b8c377c0 | 524288 | 2232883 | 285813132 | 12076632068165610 | 12076632068346391 | 12076632069505588 | 12076632069574180 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 314 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 12 | 24 | 328896 | 0x7fa4c491a600 | 0x7fa3b8c37800 | 524288 | 2225959 | 285007468 | 12076632069618492 | 12076632069786388 | 12076632070573266 | 12076632070643479 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 316 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 330112 | 0x7fa4c491a500 | 0x7fa3b8c37840 | 524288 | 2662622 | 340672136 | 12076632070676410 | 12076632070851826 | 12076632073906059 | 12076632073976108 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 318 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 332864 | 0x7fa4c491a400 | 0x7fa3b8c37880 | 524288 | 2315165 | 296215488 | 12076632074010582 | 12076632074194539 | 12076632075739016 | 12076632075809107 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 320 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 12 | 24 | 335616 | 0x7fa4c491a300 | 0x7fa3b8c378c0 | 524288 | 2180249 | 278951920 | 12076632075842059 | 12076632076032295 | 12076632076822053 | 12076632076890990 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 322 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 12 | 24 | 339392 | 0x7fa4c491aa00 | 0x7fa3b8c37900 | 524288 | 2566313 | 328514036 | 12076632076915155 | 12076632077120613 | 12076632079403168 | 12076632079473193 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 324 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 12 | 24 | 344192 | 0x7fa4c491a900 | 0x7fa3b8c37940 | 524288 | 2340991 | 299613432 | 12076632079518137 | 12076632079686847 | 12076632081222524 | 12076632081291946 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 326 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 345408 | 0x7fa4c491a800 | 0x7fa3b8c37980 | 524288 | 2837649 | 363088816 | 12076632081322042 | 12076632081503164 | 12076632087560911 | 12076632087632931 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 328 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 20 | 24 | 348160 | 0x7fa4c491a700 | 0x7fa3b8c379c0 | 524288 | 3308509 | 423416964 | 12076632087658479 | 12076632087838991 | 12076632090885384 | 12076632090958577 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 330 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 12 | 24 | 350912 | 0x7fa4c491a600 | 0x7fa3b8c37a00 | 524288 | 2303191 | 294805748 | 12076632090985548 | 12076632091177224 | 12076632092716581 | 12076632092788411 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 332 | 936686 | 936691 | 4194304 | 256 | 0 | 0 | 12 | 24 | 0 | 0x7fa4c491a500 | 0x7fa3b8c37a40 | 524288 | 2535117 | 324431768 | 12076632092814990 | 12076632093004740 | 12076632097533531 | 12076632097603959 |