50 KiB
50 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | GRBM_COUNT | GRBM_GUI_ACTIVE | CPC_ME1_BUSY_FOR_PACKET_DECODE | SQ_CYCLES | SQ_WAVES | SQ_WAVE_CYCLES | SQ_BUSY_CYCLES | SQ_LEVEL_WAVES | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBuffer.kd | 0 | 0 | 0 | 921529 | 921534 | 33554432 | 256 | 0 | 0 | 8 | 32 | 6464 | 0x0 | 0x7f6f26204180 | 502695 | 502695 | 17046 | 4021568 | 524288 | 372600279 | 3816924 | 0 | 1505167052 | 12076327135265660 | 12076327381325743 | 12076327381649102 | 12076327381757735 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 921529 | 921534 | 32768 | 256 | 0 | 0 | 24 | 24 | 12480 | 0x0 | 0x7f6f26235100 | 27819 | 27819 | 20311 | 222560 | 512 | 1122712 | 74488 | 0 | 4504968 | 12076327396356075 | 12076327396679513 | 12076327396685593 | 12076327396695125 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 4 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 12928 | 0x7f7031f1d900 | 0x7f6f26235140 | 219204 | 219204 | 20615 | 1753640 | 65536 | 131444628 | 1582707 | 0 | 527592892 | 12076327396760457 | 12076327397000951 | 12076327397134071 | 12076327397138189 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 6 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 36 | 24 | 13632 | 0x7f7031f1d800 | 0x7f6f26235180 | 393764 | 393764 | 29108 | 3150120 | 65536 | 273156985 | 2982062 | 0 | 1094444912 | 12076327397217927 | 12076327397422229 | 12076327397672148 | 12076327397741230 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 8 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 14080 | 0x7f7031f1d700 | 0x7f6f262351c0 | 395572 | 395572 | 29591 | 3164584 | 65536 | 329910429 | 2975811 | 0 | 1321457988 | 12076327397777507 | 12076327397981747 | 12076327398231986 | 12076327398301691 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 10 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14528 | 0x7f7031f1d600 | 0x7f6f26235200 | 218644 | 218644 | 19473 | 1749160 | 65536 | 142658733 | 1577012 | 0 | 572449732 | 12076327398326708 | 12076327398535344 | 12076327398668944 | 12076327398672611 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 12 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14976 | 0x7f7031f1d500 | 0x7f6f26235240 | 223812 | 223812 | 21749 | 1790504 | 65536 | 129076135 | 1616347 | 0 | 518113844 | 12076327398733073 | 12076327398925743 | 12076327399061742 | 12076327399065290 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 14 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 15424 | 0x7f7031f1d400 | 0x7f6f26235280 | 214716 | 214716 | 21675 | 1717736 | 65536 | 156951182 | 1550654 | 0 | 629619912 | 12076327399159065 | 12076327399352781 | 12076327399483820 | 12076327399487345 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 16 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16128 | 0x7f7031f1d300 | 0x7f6f262352c0 | 410276 | 410276 | 35397 | 3282216 | 65536 | 251123097 | 3107336 | 0 | 1006308440 | 12076327399545924 | 12076327399746699 | 12076327400007178 | 12076327400048898 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 18 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16832 | 0x7f7031f1da00 | 0x7f6f26235300 | 402596 | 402596 | 32151 | 3220776 | 65536 | 344690180 | 3048123 | 0 | 1380576460 | 12076327400084054 | 12076327400278697 | 12076327400534855 | 12076327400600644 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 20 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 17536 | 0x7f7031f1d900 | 0x7f6f26235340 | 212812 | 212812 | 20992 | 1702504 | 65536 | 158222018 | 1522110 | 0 | 634707908 | 12076327400625730 | 12076327400831974 | 12076327400960773 | 12076327400964410 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 22 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18240 | 0x7f7031f1d800 | 0x7f6f26235380 | 220165 | 220165 | 19547 | 1761328 | 65536 | 130366679 | 1592966 | 0 | 523283296 | 12076327401031384 | 12076327401226212 | 12076327401360932 | 12076327401364714 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 24 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18944 | 0x7f7031f1d700 | 0x7f6f262353c0 | 211117 | 211117 | 23784 | 1688944 | 65536 | 161737692 | 1514441 | 0 | 648770336 | 12076327401438120 | 12076327401618050 | 12076327401745730 | 12076327401749449 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 26 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 19904 | 0x7f7031f1d600 | 0x7f6f26235400 | 390460 | 390460 | 32628 | 3123688 | 65536 | 354858086 | 2954174 | 0 | 1421250132 | 12076327401809110 | 12076327402004129 | 12076327402252448 | 12076327402320219 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 28 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 20608 | 0x7f7031f1d500 | 0x7f6f26235440 | 394516 | 394516 | 24590 | 3156136 | 65536 | 283285198 | 2973684 | 0 | 1134958092 | 12076327402348241 | 12076327402558526 | 12076327402808765 | 12076327402875511 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 30 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 21312 | 0x7f7031f1d400 | 0x7f6f26235480 | 217573 | 217573 | 21130 | 1740592 | 65536 | 153580056 | 1576273 | 0 | 616131828 | 12076327402899105 | 12076327403106044 | 12076327403239163 | 12076327403242664 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 32 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22016 | 0x7f7031f1d300 | 0x7f6f262354c0 | 225605 | 225605 | 22467 | 1804848 | 65536 | 131000276 | 1631073 | 0 | 525813924 | 12076327403301754 | 12076327403496282 | 12076327403633881 | 12076327403637518 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 34 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22720 | 0x7f7031f1da00 | 0x7f6f26235500 | 217076 | 217076 | 22910 | 1736616 | 65536 | 149158415 | 1571313 | 0 | 598450084 | 12076327403711806 | 12076327403894680 | 12076327404027480 | 12076327404031019 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 36 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 23680 | 0x7f7031f1d900 | 0x7f6f26235540 | 404245 | 404245 | 28723 | 3233968 | 65536 | 304219837 | 3050101 | 0 | 1218693512 | 12076327404091441 | 12076327404286678 | 12076327404543957 | 12076327404609955 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 38 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 24384 | 0x7f7031f1d800 | 0x7f6f26235580 | 403804 | 403804 | 32386 | 3230440 | 65536 | 310926216 | 3042740 | 0 | 1245520580 | 12076327404635522 | 12076327404835956 | 12076327405091795 | 12076327405160448 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 40 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25088 | 0x7f7031f1d700 | 0x7f6f262355c0 | 216180 | 216180 | 22874 | 1729448 | 65536 | 158862653 | 1556802 | 0 | 637268020 | 12076327405185514 | 12076327405387953 | 12076327405519473 | 12076327405522942 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 42 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25792 | 0x7f7031f1d600 | 0x7f6f26235600 | 217501 | 217501 | 21934 | 1740016 | 65536 | 147479529 | 1568848 | 0 | 591739008 | 12076327405580599 | 12076327405776112 | 12076327405909071 | 12076327405912806 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 44 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 26496 | 0x7f7031f1d500 | 0x7f6f26235640 | 210060 | 210060 | 23028 | 1680488 | 65536 | 164043640 | 1511714 | 0 | 657992736 | 12076327405985571 | 12076327406168270 | 12076327406295949 | 12076327406299665 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 46 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 27712 | 0x7f7031f1d400 | 0x7f6f26235680 | 393477 | 393477 | 32926 | 3147824 | 65536 | 357396499 | 2976003 | 0 | 1431403828 | 12076327406360127 | 12076327406545388 | 12076327406796107 | 12076327406862571 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 48 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 28416 | 0x7f7031f1d300 | 0x7f6f262356c0 | 398429 | 398429 | 33952 | 3187440 | 65536 | 332660786 | 3007281 | 0 | 1332456112 | 12076327406887347 | 12076327407098186 | 12076327407351304 | 12076327407418034 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 50 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 29120 | 0x7f7031f1da00 | 0x7f6f26235700 | 216244 | 216244 | 22358 | 1729960 | 65536 | 157383696 | 1557729 | 0 | 631354700 | 12076327407442800 | 12076327407643783 | 12076327407776103 | 12076327407779575 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 52 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30080 | 0x7f7031f1d900 | 0x7f6f26235740 | 217580 | 217580 | 24233 | 1740648 | 65536 | 150988090 | 1559666 | 0 | 605769248 | 12076327407840849 | 12076327408034501 | 12076327408167141 | 12076327408170622 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 54 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30784 | 0x7f7031f1d800 | 0x7f6f26235780 | 210893 | 210893 | 22265 | 1687152 | 65536 | 149125876 | 1519036 | 0 | 598327684 | 12076327408242526 | 12076327408421700 | 12076327408550659 | 12076327408554225 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 56 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32000 | 0x7f7031f1d700 | 0x7f6f262357c0 | 409284 | 409284 | 25773 | 3274280 | 65536 | 292572722 | 3093447 | 0 | 1172118292 | 12076327408611902 | 12076327408807618 | 12076327409069217 | 12076327409137980 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 58 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32960 | 0x7f7031f1d600 | 0x7f6f26235800 | 408380 | 408380 | 28494 | 3267048 | 65536 | 299768216 | 3087224 | 0 | 1200888340 | 12076327409163868 | 12076327409364255 | 12076327409624734 | 12076327409691719 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 60 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 33920 | 0x7f7031f1d500 | 0x7f6f26235840 | 213756 | 213756 | 20522 | 1710056 | 65536 | 152821004 | 1532412 | 0 | 613119968 | 12076327409714421 | 12076327409916093 | 12076327410046012 | 12076327410049744 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 62 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 34880 | 0x7f7031f1d400 | 0x7f6f26235880 | 218309 | 218309 | 24528 | 1746480 | 65536 | 149435080 | 1579429 | 0 | 599589488 | 12076327410109516 | 12076327410298011 | 12076327410432091 | 12076327410435742 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 64 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 35840 | 0x7f7031f1d300 | 0x7f6f262358c0 | 215316 | 215316 | 23307 | 1722536 | 65536 | 163066672 | 1547928 | 0 | 654085080 | 12076327410507655 | 12076327410681529 | 12076327410812729 | 12076327410816469 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 66 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 37312 | 0x7f7031f1da00 | 0x7f6f26235900 | 397596 | 397596 | 34004 | 3180776 | 65536 | 339692340 | 3011197 | 0 | 1360585612 | 12076327410876621 | 12076327411063448 | 12076327411318167 | 12076327411367904 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 68 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 38272 | 0x7f7031f1d900 | 0x7f6f26235940 | 405661 | 405661 | 25737 | 3245296 | 65536 | 299813626 | 3067280 | 0 | 1201063276 | 12076327411394413 | 12076327411595605 | 12076327411854164 | 12076327411874325 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 70 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 39232 | 0x7f7031f1d800 | 0x7f6f26235980 | 226668 | 226668 | 23868 | 1813352 | 65536 | 132811821 | 1636779 | 0 | 533068744 | 12076327411933886 | 12076327412106323 | 12076327412245522 | 12076327412249032 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 72 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 40192 | 0x7f7031f1d700 | 0x7f6f262359c0 | 230268 | 230268 | 25125 | 1842152 | 65536 | 143495999 | 1669554 | 0 | 575821568 | 12076327412308292 | 12076327412496241 | 12076327412637841 | 12076327412641491 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 74 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 41152 | 0x7f7031f1d600 | 0x7f6f26235a00 | 218252 | 218252 | 22378 | 1746024 | 65536 | 155191739 | 1582506 | 0 | 622584292 | 12076327412713294 | 12076327412889039 | 12076327413022959 | 12076327413026697 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 76 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 42624 | 0x7f7031f1d500 | 0x7f6f26235a40 | 413413 | 413413 | 32653 | 3307312 | 65536 | 316670030 | 3129785 | 0 | 1268499144 | 12076327413087500 | 12076327413278478 | 12076327413543276 | 12076327413610221 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 78 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 43584 | 0x7f7031f1d400 | 0x7f6f26235a80 | 399837 | 399837 | 32660 | 3198704 | 65536 | 338705455 | 3027094 | 0 | 1356637164 | 12076327413634026 | 12076327413830955 | 12076327414086474 | 12076327414155715 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 80 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 44544 | 0x7f7031f1d300 | 0x7f6f26235ac0 | 218965 | 218965 | 22655 | 1751728 | 65536 | 153280811 | 1578906 | 0 | 614938856 | 12076327414180111 | 12076327414379593 | 12076327414513032 | 12076327414516636 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 82 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 45760 | 0x7f7031f1da00 | 0x7f6f26235b00 | 223740 | 223740 | 25739 | 1789928 | 65536 | 154857430 | 1610991 | 0 | 621254560 | 12076327414576868 | 12076327414766151 | 12076327414904070 | 12076327414907853 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 84 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 46720 | 0x7f7031f1d900 | 0x7f6f26235b40 | 213637 | 213637 | 23276 | 1709104 | 65536 | 154593955 | 1534868 | 0 | 620206840 | 12076327414979075 | 12076327415161349 | 12076327415291589 | 12076327415295213 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 86 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 48448 | 0x7f7031f1d800 | 0x7f6f26235b80 | 422453 | 422453 | 31736 | 3379632 | 65536 | 347170319 | 3198706 | 0 | 1390498552 | 12076327415352569 | 12076327415540387 | 12076327415811106 | 12076327415877134 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 88 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 49408 | 0x7f7031f1d700 | 0x7f6f26235bc0 | 402364 | 402364 | 27621 | 3218920 | 65536 | 295437547 | 3043653 | 0 | 1183568840 | 12076327415901850 | 12076327416100545 | 12076327416357664 | 12076327416424562 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 90 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 50368 | 0x7f7031f1d600 | 0x7f6f26235c00 | 212053 | 212053 | 21868 | 1696432 | 65536 | 167095985 | 1525051 | 0 | 670203184 | 12076327416448827 | 12076327416651742 | 12076327416781662 | 12076327416785302 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 92 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 51584 | 0x7f7031f1d500 | 0x7f6f26235c40 | 222060 | 222060 | 27474 | 1776488 | 65536 | 153260821 | 1586295 | 0 | 614878272 | 12076327416843450 | 12076327417037821 | 12076327417173980 | 12076327417177762 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 94 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 52544 | 0x7f7031f1d400 | 0x7f6f26235c80 | 220788 | 220788 | 25033 | 1766312 | 65536 | 154861311 | 1578134 | 0 | 621263124 | 12076327417249405 | 12076327417427739 | 12076327417561658 | 12076327417565572 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 96 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 54272 | 0x7f7031f1d300 | 0x7f6f26235cc0 | 424573 | 424573 | 33241 | 3396592 | 65536 | 315580726 | 3210664 | 0 | 1264140496 | 12076327417628589 | 12076327417817497 | 12076327418089176 | 12076327418157532 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 98 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 55488 | 0x7f7031f1da00 | 0x7f6f26235d00 | 407037 | 407037 | 25976 | 3256304 | 65536 | 270289769 | 3083323 | 0 | 1082974556 | 12076327418183921 | 12076327418383894 | 12076327418644373 | 12076327418685403 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 100 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 56704 | 0x7f7031f1d900 | 0x7f6f26235d40 | 217708 | 217708 | 23341 | 1741672 | 65536 | 156839408 | 1568149 | 0 | 629187568 | 12076327418717453 | 12076327418904532 | 12076327419037492 | 12076327419041255 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 102 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 58176 | 0x7f7031f1d800 | 0x7f6f26235d80 | 228813 | 228813 | 28100 | 1830512 | 65536 | 154939878 | 1639042 | 0 | 621630896 | 12076327419100204 | 12076327419287090 | 12076327419428530 | 12076327419432662 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 104 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 59392 | 0x7f7031f1d700 | 0x7f6f26235dc0 | 215820 | 215820 | 23377 | 1726568 | 65536 | 153362587 | 1548163 | 0 | 615282076 | 12076327419503885 | 12076327419677009 | 12076327419809008 | 12076327419812538 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 106 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 61376 | 0x7f7031f1d600 | 0x7f6f26235e00 | 409525 | 409525 | 32150 | 3276208 | 65536 | 301364347 | 3089841 | 0 | 1207276568 | 12076327419871979 | 12076327420063407 | 12076327420326606 | 12076327420392746 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 108 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 62592 | 0x7f7031f1d500 | 0x7f6f26235e40 | 406124 | 406124 | 31722 | 3249000 | 65536 | 310573904 | 3068570 | 0 | 1244112300 | 12076327420417472 | 12076327420615884 | 12076327420875243 | 12076327420941486 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 110 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 63808 | 0x7f7031f1d400 | 0x7f6f26235e80 | 217965 | 217965 | 22411 | 1743728 | 65536 | 150401905 | 1576953 | 0 | 603452992 | 12076327420965751 | 12076327421174122 | 12076327421308201 | 12076327421312155 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 112 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 65280 | 0x7f7031f1d300 | 0x7f6f26235ec0 | 223125 | 223125 | 29767 | 1785008 | 65536 | 165065178 | 1589301 | 0 | 662106268 | 12076327421372577 | 12076327421560520 | 12076327421697959 | 12076327421701499 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 114 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 66496 | 0x7f7031f1da00 | 0x7f6f26235f00 | 218885 | 218885 | 22790 | 1751088 | 65536 | 148990112 | 1583444 | 0 | 597783068 | 12076327421773042 | 12076327421946598 | 12076327422081158 | 12076327422085011 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 116 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 68480 | 0x7f7031f1d900 | 0x7f6f26235f40 | 411148 | 411148 | 33901 | 3289192 | 65536 | 338400769 | 3104057 | 0 | 1355437308 | 12076327422144492 | 12076327422334757 | 12076327422598115 | 12076327422665029 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 118 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 69696 | 0x7f7031f1d800 | 0x7f6f26235f80 | 408093 | 408093 | 27376 | 3264752 | 65536 | 283857796 | 3074190 | 0 | 1137242732 | 12076327422690376 | 12076327422885634 | 12076327423146753 | 12076327423213539 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 120 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 70912 | 0x7f7031f1d700 | 0x7f6f26235fc0 | 212516 | 212516 | 25414 | 1700136 | 65536 | 163318892 | 1522937 | 0 | 655110428 | 12076327423239517 | 12076327423436832 | 12076327423566431 | 12076327423570091 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 122 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 72384 | 0x7f7031f1d600 | 0x7f6f26236000 | 222780 | 222780 | 27440 | 1782248 | 65536 | 184868604 | 1601401 | 0 | 741343652 | 12076327423627638 | 12076327423818110 | 12076327423956189 | 12076327423959836 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 124 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 73600 | 0x7f7031f1d500 | 0x7f6f26236040 | 220364 | 220364 | 24433 | 1762920 | 65536 | 149119121 | 1581565 | 0 | 598323544 | 12076327424037430 | 12076327424214268 | 12076327424348667 | 12076327424352355 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 126 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 75840 | 0x7f7031f1d400 | 0x7f6f26236080 | 408988 | 408988 | 32263 | 3271912 | 65536 | 320979092 | 3083789 | 0 | 1285733124 | 12076327424410684 | 12076327424598266 | 12076327424861305 | 12076327424901776 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 128 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 77056 | 0x7f7031f1d300 | 0x7f6f262360c0 | 391132 | 391132 | 32409 | 3129064 | 65536 | 353412992 | 2963613 | 0 | 1415469032 | 12076327424942843 | 12076327425126584 | 12076327425377463 | 12076327425418577 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 130 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 78272 | 0x7f7031f1da00 | 0x7f6f26236100 | 217293 | 217293 | 22948 | 1738352 | 65536 | 155239009 | 1565948 | 0 | 622791596 | 12076327425451177 | 12076327425639862 | 12076327425773461 | 12076327425777273 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 132 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 80000 | 0x7f7031f1d900 | 0x7f6f26236140 | 232428 | 232428 | 27876 | 1859432 | 65536 | 195594787 | 1679946 | 0 | 784230672 | 12076327425836784 | 12076327426028660 | 12076327426171859 | 12076327426175674 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 134 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 81216 | 0x7f7031f1d800 | 0x7f6f26236180 | 223645 | 223645 | 23883 | 1789168 | 65536 | 145183396 | 1617226 | 0 | 582602460 | 12076327426247878 | 12076327426426418 | 12076327426564337 | 12076327426568073 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 136 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 83456 | 0x7f7031f1d700 | 0x7f6f262361c0 | 414460 | 414460 | 32555 | 3315688 | 65536 | 305746233 | 3117629 | 0 | 1224808600 | 12076327426624498 | 12076327426818096 | 12076327427085135 | 12076327427152028 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 138 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 84928 | 0x7f7031f1d600 | 0x7f6f26236200 | 401477 | 401477 | 34196 | 3211824 | 65536 | 335221921 | 3041646 | 0 | 1342703124 | 12076327427176985 | 12076327427376494 | 12076327427634413 | 12076327427700878 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 140 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 86400 | 0x7f7031f1d500 | 0x7f6f26236240 | 227021 | 227021 | 26580 | 1816176 | 65536 | 138787551 | 1632726 | 0 | 556996696 | 12076327427725213 | 12076327427923371 | 12076327428062571 | 12076327428066197 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 142 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 88128 | 0x7f7031f1d400 | 0x7f6f26236280 | 242348 | 242348 | 27594 | 1938792 | 65536 | 209708783 | 1767698 | 0 | 840693360 | 12076327428126770 | 12076327428313129 | 12076327428463689 | 12076327428467433 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 144 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 89600 | 0x7f7031f1d300 | 0x7f6f262362c0 | 225845 | 225845 | 25029 | 1806768 | 65536 | 137865768 | 1635760 | 0 | 553284708 | 12076327428561548 | 12076327428734728 | 12076327428873287 | 12076327428876904 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 146 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 92096 | 0x7f7031f1da00 | 0x7f6f26236300 | 419101 | 419101 | 32113 | 3352816 | 65536 | 296978305 | 3151701 | 0 | 1189729116 | 12076327428934922 | 12076327429126886 | 12076327429397605 | 12076327429455048 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 148 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 93568 | 0x7f7031f1d900 | 0x7f6f26236340 | 402333 | 402333 | 31713 | 3218672 | 65536 | 334236171 | 3045584 | 0 | 1338758204 | 12076327429479895 | 12076327429675363 | 12076327429933922 | 12076327429979904 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 150 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 95040 | 0x7f7031f1d800 | 0x7f6f26236380 | 227940 | 227940 | 25948 | 1823528 | 65536 | 141446042 | 1624412 | 0 | 567649260 | 12076327430012294 | 12076327430211521 | 12076327430350560 | 12076327430354440 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 152 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 96768 | 0x7f7031f1d700 | 0x7f6f262363c0 | 252172 | 252172 | 28691 | 2017384 | 65536 | 219587427 | 1851182 | 0 | 880202016 | 12076327430415323 | 12076327430600959 | 12076327430758078 | 12076327430761807 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 154 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 98240 | 0x7f7031f1d600 | 0x7f6f26236400 | 225357 | 225357 | 24327 | 1802864 | 65536 | 149769581 | 1633947 | 0 | 600952260 | 12076327430832588 | 12076327431005117 | 12076327431144157 | 12076327431148135 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 156 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 100736 | 0x7f7031f1d500 | 0x7f6f26236440 | 409412 | 409412 | 33883 | 3275304 | 65536 | 315787504 | 3088788 | 0 | 1264966996 | 12076327431206664 | 12076327431396156 | 12076327431660634 | 12076327431708196 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 158 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 102208 | 0x7f7031f1d400 | 0x7f6f26236480 | 400348 | 400348 | 29983 | 3202792 | 65536 | 324847309 | 3032320 | 0 | 1301216560 | 12076327431734034 | 12076327431926393 | 12076327432184632 | 12076327432233041 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 160 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 103680 | 0x7f7031f1d300 | 0x7f6f262364c0 | 221956 | 221956 | 25582 | 1775656 | 65536 | 147481606 | 1594631 | 0 | 591802116 | 12076327432257046 | 12076327432457751 | 12076327432593910 | 12076327432597729 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 162 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 105664 | 0x7f7031f1da00 | 0x7f6f26236500 | 263724 | 263724 | 28572 | 2109800 | 65536 | 235041528 | 1943765 | 0 | 942025504 | 12076327432654835 | 12076327432848469 | 12076327433014068 | 12076327433017749 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 164 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 107136 | 0x7f7031f1d900 | 0x7f6f26236540 | 219060 | 219060 | 23687 | 1752488 | 65536 | 152404572 | 1576119 | 0 | 611446008 | 12076327433090545 | 12076327433271027 | 12076327433405266 | 12076327433408886 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 166 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 109888 | 0x7f7031f1d800 | 0x7f6f26236580 | 419340 | 419340 | 36699 | 3354728 | 65536 | 324040229 | 3156233 | 0 | 1297980316 | 12076327433465331 | 12076327433656145 | 12076327433927184 | 12076327433949251 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 168 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 111360 | 0x7f7031f1d700 | 0x7f6f262365c0 | 409181 | 409181 | 31598 | 3273456 | 65536 | 292613348 | 3085096 | 0 | 1172280348 | 12076327434009422 | 12076327434189103 | 12076327434451662 | 12076327434503731 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 170 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 112832 | 0x7f7031f1d600 | 0x7f6f26236600 | 222981 | 222981 | 24024 | 1783856 | 65536 | 149896144 | 1612689 | 0 | 601442240 | 12076327434528377 | 12076327434728940 | 12076327434866060 | 12076327434869801 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 172 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 114816 | 0x7f7031f1d500 | 0x7f6f26236640 | 277020 | 277020 | 31065 | 2216168 | 65536 | 248052652 | 2044666 | 0 | 994052548 | 12076327434931306 | 12076327435124939 | 12076327435298058 | 12076327435301924 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 174 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 116288 | 0x7f7031f1d400 | 0x7f6f26236680 | 220573 | 220573 | 22459 | 1764592 | 65536 | 165346140 | 1588658 | 0 | 663226476 | 12076327435374459 | 12076327435549737 | 12076327435685416 | 12076327435689505 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 176 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 119040 | 0x7f7031f1d300 | 0x7f6f262366c0 | 404628 | 404628 | 37892 | 3237032 | 65536 | 315795617 | 3035555 | 0 | 1265015904 | 12076327435745910 | 12076327435939015 | 12076327436199654 | 12076327436249676 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 178 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 120768 | 0x7f7031f1da00 | 0x7f6f26236700 | 457901 | 457901 | 15291 | 3663216 | 65536 | 296982808 | 3065379 | 0 | 1189746456 | 12076327436273169 | 12076327436474212 | 12076327436770371 | 12076327436818583 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 180 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 122496 | 0x7f7031f1d900 | 0x7f6f26236740 | 223005 | 223005 | 25216 | 1784048 | 65536 | 150815369 | 1604902 | 0 | 605136716 | 12076327436842538 | 12076327437043330 | 12076327437179809 | 12076327437183842 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 182 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 124736 | 0x7f7031f1d800 | 0x7f6f26236780 | 290572 | 290572 | 30899 | 2324584 | 65536 | 260280880 | 2154890 | 0 | 1042972684 | 12076327437242010 | 12076327437432928 | 12076327437616287 | 12076327437622207 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 184 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 126464 | 0x7f7031f1d700 | 0x7f6f262367c0 | 223317 | 223317 | 25702 | 1786544 | 65536 | 143093189 | 1615056 | 0 | 574262752 | 12076327437704730 | 12076327437881726 | 12076327438019805 | 12076327438023893 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 186 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 127936 | 0x7f7031f1d600 | 0x7f6f26236800 | 413908 | 413908 | 36504 | 3311272 | 65536 | 380760177 | 3142546 | 0 | 1524861416 | 12076327438080578 | 12076327438271484 | 12076327438539643 | 12076327438589374 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 188 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 129664 | 0x7f7031f1d500 | 0x7f6f26236840 | 395004 | 395004 | 34433 | 3160040 | 65536 | 334017531 | 2985646 | 0 | 1337889236 | 12076327438615022 | 12076327438814362 | 12076327439068281 | 12076327439117596 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 190 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 131392 | 0x7f7031f1d400 | 0x7f6f26236880 | 220508 | 220508 | 25162 | 1764072 | 65536 | 160293233 | 1584140 | 0 | 643006552 | 12076327439141300 | 12076327439340600 | 12076327439476599 | 12076327439480370 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 192 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 133632 | 0x7f7031f1d300 | 0x7f6f262368c0 | 303348 | 303348 | 32459 | 2426792 | 65536 | 272397563 | 2253283 | 0 | 1091431836 | 12076327439539269 | 12076327439725078 | 12076327439916757 | 12076327439968387 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 194 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 135360 | 0x7f7031f1da00 | 0x7f6f26236900 | 218932 | 218932 | 26009 | 1751464 | 65536 | 154615993 | 1567950 | 0 | 620325540 | 12076327440012309 | 12076327440194516 | 12076327440329715 | 12076327440333576 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 196 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 136832 | 0x7f7031f1d900 | 0x7f6f26236940 | 438060 | 438060 | 40923 | 3504488 | 65536 | 406700091 | 3333517 | 0 | 1628620276 | 12076327440391784 | 12076327440580914 | 12076327440865233 | 12076327440914295 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 198 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 138560 | 0x7f7031f1d800 | 0x7f6f26236980 | 404189 | 404189 | 32075 | 3233520 | 65536 | 320696391 | 3056109 | 0 | 1284604624 | 12076327440937508 | 12076327441141391 | 12076327441402190 | 12076327441452836 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 200 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 140288 | 0x7f7031f1d700 | 0x7f6f262369c0 | 222933 | 222933 | 26446 | 1783472 | 65536 | 151298942 | 1601376 | 0 | 607076608 | 12076327441476319 | 12076327441672109 | 12076327441809068 | 12076327441812935 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 202 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 142784 | 0x7f7031f1d600 | 0x7f6f26236a00 | 331445 | 331445 | 33780 | 2651568 | 65536 | 299751261 | 2483426 | 0 | 1200858452 | 12076327441874970 | 12076327442068587 | 12076327442279146 | 12076327442330086 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 204 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 144768 | 0x7f7031f1d500 | 0x7f6f26236a40 | 223189 | 223189 | 26144 | 1785520 | 65536 | 146378075 | 1608324 | 0 | 587388236 | 12076327442365472 | 12076327442551945 | 12076327442689544 | 12076327442693351 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 206 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 145728 | 0x7f7031f1d400 | 0x7f6f26236a80 | 472444 | 472444 | 43233 | 3779560 | 65536 | 439173511 | 3590778 | 0 | 1758514404 | 12076327442750828 | 12076327442936263 | 12076327443242982 | 12076327443290020 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 208 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 147712 | 0x7f7031f1d300 | 0x7f6f26236ac0 | 407284 | 407284 | 31468 | 3258280 | 65536 | 261914357 | 3056209 | 0 | 1049494120 | 12076327443327690 | 12076327443513701 | 12076327443775779 | 12076327443821929 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 210 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 149696 | 0x7f7031f1da00 | 0x7f6f26236b00 | 222084 | 222084 | 24880 | 1776680 | 65536 | 153353024 | 1592647 | 0 | 615268220 | 12076327443854429 | 12076327444048418 | 12076327444185858 | 12076327444189762 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 212 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 152192 | 0x7f7031f1d900 | 0x7f6f26236b40 | 358669 | 358669 | 36823 | 2869360 | 65536 | 327245960 | 2696314 | 0 | 1310831392 | 12076327444249323 | 12076327444436377 | 12076327444664696 | 12076327444714257 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 214 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 154176 | 0x7f7031f1d800 | 0x7f6f26236b80 | 222588 | 222588 | 27050 | 1780712 | 65536 | 161613304 | 1600887 | 0 | 648323568 | 12076327444756666 | 12076327444933974 | 12076327445071733 | 12076327445075488 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 216 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 155648 | 0x7f7031f1d700 | 0x7f6f26236bc0 | 504180 | 504180 | 44136 | 4033448 | 65536 | 471469664 | 3865220 | 0 | 1887698484 | 12076327445132975 | 12076327445328852 | 12076327445657650 | 12076327445705068 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 218 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 157632 | 0x7f7031f1d600 | 0x7f6f26236c00 | 401748 | 401748 | 30490 | 3213992 | 65536 | 300767866 | 2999630 | 0 | 1204893592 | 12076327445734894 | 12076327445926449 | 12076327446186288 | 12076327446237468 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 220 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 159616 | 0x7f7031f1d500 | 0x7f6f26236c40 | 225429 | 225429 | 27825 | 1803440 | 65536 | 157817115 | 1620370 | 0 | 633136516 | 12076327446262274 | 12076327446461167 | 12076327446600046 | 12076327446603889 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 222 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 162368 | 0x7f7031f1d400 | 0x7f6f26236c80 | 383100 | 383100 | 36758 | 3064808 | 65536 | 352102369 | 2898986 | 0 | 1410263924 | 12076327446662367 | 12076327446846125 | 12076327447091244 | 12076327447140817 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 224 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 164608 | 0x7f7031f1d300 | 0x7f6f26236cc0 | 219500 | 219500 | 27388 | 1756008 | 65536 | 162354413 | 1569011 | 0 | 651287132 | 12076327447177034 | 12076327447364523 | 12076327447499882 | 12076327447503651 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 226 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 166336 | 0x7f7031f1da00 | 0x7f6f26236d00 | 575309 | 575309 | 48139 | 4602480 | 65536 | 541767186 | 4429341 | 0 | 2168889116 | 12076327447560727 | 12076327447745641 | 12076327448122280 | 12076327448173185 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 228 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 168576 | 0x7f7031f1d900 | 0x7f6f26236d40 | 409644 | 409644 | 33505 | 3277160 | 65536 | 300693997 | 3067599 | 0 | 1204605360 | 12076327448197100 | 12076327448412038 | 12076327448676677 | 12076327448695205 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 230 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 170816 | 0x7f7031f1d800 | 0x7f6f26236d80 | 225909 | 225909 | 27312 | 1807280 | 65536 | 166754503 | 1630258 | 0 | 668896656 | 12076327448754706 | 12076327448931876 | 12076327449072515 | 12076327449076334 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 232 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 174080 | 0x7f7031f1d700 | 0x7f6f26236dc0 | 434821 | 434821 | 40942 | 3478576 | 65536 | 400645665 | 3305378 | 0 | 1604433640 | 12076327449136656 | 12076327449334914 | 12076327449613953 | 12076327449663064 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 234 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 176576 | 0x7f7031f1d600 | 0x7f6f26236e00 | 227580 | 227580 | 26972 | 1820648 | 65536 | 182547740 | 1649162 | 0 | 732089040 | 12076327449698790 | 12076327449881472 | 12076327450023071 | 12076327450027361 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 236 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 177792 | 0x7f7031f1d500 | 0x7f6f26236e40 | 644196 | 644196 | 51967 | 5153576 | 65536 | 611537704 | 4986023 | 0 | 2447971452 | 12076327450085429 | 12076327450275550 | 12076327450698588 | 12076327450744474 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 238 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 180288 | 0x7f7031f1d400 | 0x7f6f26236e80 | 414684 | 414684 | 33984 | 3317480 | 65536 | 325679697 | 3126541 | 0 | 1304555352 | 12076327450772917 | 12076327450963227 | 12076327451232346 | 12076327451280169 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 240 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 182784 | 0x7f7031f1d300 | 0x7f6f26236ec0 | 225124 | 225124 | 27994 | 1801000 | 65536 | 183537361 | 1620656 | 0 | 736035852 | 12076327451305567 | 12076327451502745 | 12076327451642584 | 12076327451646250 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 242 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 186304 | 0x7f7031f1da00 | 0x7f6f26236f00 | 489029 | 489029 | 42650 | 3912240 | 65536 | 456665273 | 3746571 | 0 | 1828511312 | 12076327451704007 | 12076327451896983 | 12076327452212982 | 12076327452257826 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 244 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 189312 | 0x7f7031f1d900 | 0x7f6f26236f40 | 242156 | 242156 | 28169 | 1937256 | 65536 | 214219388 | 1772586 | 0 | 858759044 | 12076327452307599 | 12076327452487220 | 12076327452638900 | 12076327452642591 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 246 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 190784 | 0x7f7031f1d800 | 0x7f6f26236f80 | 784476 | 784476 | 59291 | 6275816 | 65536 | 751137040 | 6109488 | 0 | 3006369528 | 12076327452700128 | 12076327452887699 | 12076327453404016 | 12076327453428251 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 248 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 193792 | 0x7f7031f1d700 | 0x7f6f26236fc0 | 457189 | 457189 | 40278 | 3657520 | 65536 | 377118755 | 3475801 | 0 | 1510304444 | 12076327453482212 | 12076327453663215 | 12076327453960654 | 12076327453980718 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 250 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 196800 | 0x7f7031f1d600 | 0x7f6f26237000 | 245468 | 245468 | 27285 | 1963752 | 65536 | 217867234 | 1800044 | 0 | 873357636 | 12076327454042623 | 12076327454221453 | 12076327454375372 | 12076327454379098 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 252 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 201088 | 0x7f7031f1d500 | 0x7f6f26237040 | 632789 | 632789 | 16512 | 5062320 | 65536 | 561747940 | 4589196 | 0 | 2248845944 | 12076327454439972 | 12076327454626411 | 12076327455036969 | 12076327455080602 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 254 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 204608 | 0x7f7031f1d400 | 0x7f6f26237080 | 279837 | 279837 | 30251 | 2238704 | 65536 | 249828270 | 2068744 | 0 | 1001199200 | 12076327455130315 | 12076327455310728 | 12076327455487207 | 12076327455490915 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 256 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 206080 | 0x7f7031f1d300 | 0x7f6f262370c0 | 924461 | 924461 | 67066 | 7395696 | 65536 | 889569140 | 7231932 | 0 | 3560097332 | 12076327455548562 | 12076327455743206 | 12076327456352163 | 12076327456399433 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 258 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 209600 | 0x7f7031f1da00 | 0x7f6f26237100 | 500637 | 500637 | 44537 | 4005104 | 65536 | 464298889 | 3830255 | 0 | 1859052364 | 12076327456432445 | 12076327456631202 | 12076327456958561 | 12076327457010679 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 260 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 213120 | 0x7f7031f1d900 | 0x7f6f26237140 | 282037 | 282037 | 29556 | 2256304 | 65536 | 254101760 | 2092270 | 0 | 1018291448 | 12076327457043851 | 12076327457242400 | 12076327457421599 | 12076327457425330 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 262 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 218176 | 0x7f7031f1d800 | 0x7f6f26237180 | 700772 | 700772 | 57754 | 5606184 | 65536 | 664650009 | 5415350 | 0 | 2660446968 | 12076327457486584 | 12076327457672958 | 12076327458127996 | 12076327458177217 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 264 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 222208 | 0x7f7031f1d700 | 0x7f6f262371c0 | 313669 | 313669 | 31681 | 2509360 | 65536 | 285350498 | 2346446 | 0 | 1143297024 | 12076327458223734 | 12076327458403675 | 12076327458603994 | 12076327458649986 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 266 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 223936 | 0x7f7031f1d600 | 0x7f6f26237200 | 1066581 | 1066581 | 77332 | 8532656 | 65536 | 1028208571 | 8356608 | 0 | 4114654956 | 12076327458681735 | 12076327458873752 | 12076327459576149 | 12076327459627533 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 268 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 227968 | 0x7f7031f1d500 | 0x7f6f26237240 | 566956 | 566956 | 47385 | 4535656 | 65536 | 532587577 | 4365736 | 0 | 2132192884 | 12076327459652649 | 12076327459855508 | 12076327460227667 | 12076327460277090 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 270 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 232000 | 0x7f7031f1d400 | 0x7f6f26237280 | 319468 | 319468 | 32704 | 2555752 | 65536 | 289506099 | 2387498 | 0 | 1159913240 | 12076327460300694 | 12076327460500785 | 12076327460704304 | 12076327460752473 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 272 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 237824 | 0x7f7031f1d300 | 0x7f6f262372c0 | 803221 | 803221 | 60806 | 6425776 | 65536 | 767733220 | 6255591 | 0 | 3072775544 | 12076327460775676 | 12076327460970223 | 12076327461496141 | 12076327461546389 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 274 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 242368 | 0x7f7031f1da00 | 0x7f6f26237300 | 351500 | 351500 | 36540 | 2812008 | 65536 | 320014175 | 2630801 | 0 | 1281961004 | 12076327461582325 | 12076327461768140 | 12076327461992299 | 12076327462044635 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 276 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 243584 | 0x7f7031f1d900 | 0x7f6f26237340 | 1207757 | 1207757 | 85294 | 9662064 | 65536 | 1169193706 | 9490895 | 0 | 4678594368 | 12076327462068589 | 12076327462268778 | 12076327463067974 | 12076327463135792 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 278 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 248128 | 0x7f7031f1d800 | 0x7f6f26237380 | 673884 | 673884 | 16747 | 5391080 | 65536 | 602526433 | 4945484 | 0 | 2411943540 | 12076327463162242 | 12076327463366213 | 12076327463810051 | 12076327463877281 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 280 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 252672 | 0x7f7031f1d700 | 0x7f6f262373c0 | 355796 | 355796 | 35489 | 2846376 | 65536 | 325671565 | 2669737 | 0 | 1304577388 | 12076327463900183 | 12076327464119489 | 12076327464346688 | 12076327464415721 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 282 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 259264 | 0x7f7031f1d600 | 0x7f6f26237400 | 911021 | 911021 | 67086 | 7288176 | 65536 | 875199644 | 7120624 | 0 | 3502644540 | 12076327464440567 | 12076327464642047 | 12076327465239805 | 12076327465308110 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 284 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 264832 | 0x7f7031f1d500 | 0x7f6f26237440 | 419516 | 419516 | 40855 | 3356136 | 65536 | 386941796 | 3175295 | 0 | 1549661548 | 12076327465343636 | 12076327465540123 | 12076327465809082 | 12076327465875684 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 286 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 266304 | 0x7f7031f1d400 | 0x7f6f26237480 | 1487725 | 1487725 | 100754 | 11901808 | 65536 | 1447187792 | 11735182 | 0 | 5790571912 | 12076327465900080 | 12076327466105401 | 12076327467090836 | 12076327467160192 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 288 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 28 | 24 | 271872 | 0x7f7031f1d300 | 0x7f6f262374c0 | 804020 | 804020 | 16254 | 6432168 | 65536 | 737761527 | 6055813 | 0 | 2952886016 | 12076327467185128 | 12076327467397075 | 12076327467928273 | 12076327467996005 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 290 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 277440 | 0x7f7031f1da00 | 0x7f6f26237500 | 422949 | 422949 | 40497 | 3383600 | 65536 | 390751573 | 3206117 | 0 | 1564894460 | 12076327468027784 | 12076327468232751 | 12076327468504750 | 12076327468574039 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 292 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 12 | 24 | 279936 | 0x7f7031f1d900 | 0x7f6f26237540 | 1126132 | 1126132 | 79445 | 9009064 | 65536 | 1089845165 | 8842241 | 0 | 4361203736 | 12076327468600158 | 12076327468792269 | 12076327469530026 | 12076327469598864 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 294 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 286528 | 0x7f7031f1d800 | 0x7f6f26237580 | 493468 | 493468 | 45315 | 3947752 | 65536 | 459603534 | 3772007 | 0 | 1840310892 | 12076327469635692 | 12076327469821864 | 12076327470140103 | 12076327470208767 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 296 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 288000 | 0x7f7031f1d700 | 0x7f6f262375c0 | 1768844 | 1768844 | 118324 | 14150760 | 65536 | 1723639655 | 13982118 | 0 | 6896378308 | 12076327470234154 | 12076327470433222 | 12076327471602497 | 12076327471670614 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 298 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 32 | 24 | 294592 | 0x7f7031f1d600 | 0x7f6f26237600 | 922484 | 922484 | 66355 | 7379880 | 65536 | 808434371 | 7201184 | 0 | 3235580684 | 12076327471698857 | 12076327471899615 | 12076327472510493 | 12076327472581256 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 300 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 301184 | 0x7f7031f1d500 | 0x7f6f26237640 | 491701 | 491701 | 43190 | 3933616 | 65536 | 459379596 | 3766902 | 0 | 1839417628 | 12076327472604209 | 12076327472814171 | 12076327473133050 | 12076327473199926 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 302 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 12 | 24 | 304960 | 0x7f7031f1d400 | 0x7f6f26237680 | 1338989 | 1338989 | 94366 | 10711920 | 65536 | 1297305485 | 10531704 | 0 | 5191044600 | 12076327473226145 | 12076327473430009 | 12076327474308405 | 12076327474377084 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 304 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 24 | 24 | 313600 | 0x7f7031f1d300 | 0x7f6f262376c0 | 631181 | 631181 | 53286 | 5049456 | 65536 | 596092182 | 4874212 | 0 | 2386266096 | 12076327474422088 | 12076327474602804 | 12076327475013522 | 12076327475081834 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 306 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 314816 | 0x7f7031f1da00 | 0x7f6f26237700 | 2333732 | 2333732 | 151312 | 18669864 | 65536 | 2284938455 | 18503363 | 0 | 9141574476 | 12076327475110126 | 12076327475310960 | 12076327476858474 | 12076327476931651 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 308 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 317568 | 0x7f7031f1d900 | 0x7f6f26237740 | 1202364 | 1202364 | 15250 | 9618920 | 65536 | 1162048908 | 9433323 | 0 | 4650017668 | 12076327476964272 | 12076327477174632 | 12076327477969029 | 12076327478288343 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 310 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 12 | 24 | 320320 | 0x7f7031f1d800 | 0x7f6f26237780 | 644389 | 644389 | 54450 | 5155120 | 65536 | 608696803 | 4969808 | 0 | 2436613984 | 12076327478312357 | 12076327478521906 | 12076327478937105 | 12076327479012028 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 312 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 12 | 24 | 324096 | 0x7f7031f1d700 | 0x7f6f262377c0 | 1757796 | 1757796 | 46114 | 14062376 | 65536 | 1715011761 | 13896501 | 0 | 6861870600 | 12076327479042625 | 12076327479239503 | 12076327480398058 | 12076327480466140 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 314 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 12 | 24 | 328896 | 0x7f7031f1d600 | 0x7f6f26237800 | 1200124 | 1200124 | 85398 | 9601000 | 65536 | 1160737821 | 9420660 | 0 | 4644781084 | 12076327480509340 | 12076327480689737 | 12076327481475013 | 12076327481543342 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 316 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 330112 | 0x7f7031f1d500 | 0x7f6f26237840 | 4586309 | 4586309 | 282847 | 36690480 | 65536 | 4514982965 | 36501638 | 0 | 18061753356 | 12076327481570933 | 12076327481773892 | 12076327484823959 | 12076327484892897 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 318 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 332864 | 0x7f7031f1d400 | 0x7f6f26237880 | 2325189 | 2325189 | 150804 | 18601520 | 65536 | 2276865554 | 18430717 | 0 | 9109285784 | 12076327484921430 | 12076327485134197 | 12076327486677231 | 12076327486746191 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 320 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 12 | 24 | 335616 | 0x7f7031f1d300 | 0x7f6f262378c0 | 1203813 | 1203813 | 84257 | 9630512 | 65536 | 1165562290 | 9458642 | 0 | 4664073264 | 12076327486771038 | 12076327486980109 | 12076327487769706 | 12076327487838231 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 322 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 12 | 24 | 339392 | 0x7f7031f1da00 | 0x7f6f26237900 | 3443652 | 3443652 | 145637 | 27549224 | 65536 | 3383207326 | 27379437 | 0 | 13534654516 | 12076327487863708 | 12076327488074664 | 12076327490355454 | 12076327490423525 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 324 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 12 | 24 | 344192 | 0x7f7031f1d900 | 0x7f6f26237940 | 2325508 | 2325508 | 152068 | 18604072 | 65536 | 2274678312 | 18420484 | 0 | 9100535904 | 12076327490468168 | 12076327490646973 | 12076327492182326 | 12076327492249860 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 326 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 345408 | 0x7f7031f1d800 | 0x7f6f26237980 | 9087333 | 9087333 | 544171 | 72698672 | 65536 | 8977280861 | 72531278 | 0 | 35910944660 | 12076327492280386 | 12076327492477365 | 12076327498530299 | 12076327498598388 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 328 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 20 | 24 | 348160 | 0x7f7031f1d700 | 0x7f6f262379c0 | 4574436 | 4574436 | 284141 | 36595496 | 65536 | 4502597830 | 36411997 | 0 | 18012214892 | 12076327498627422 | 12076327498826777 | 12076327501868524 | 12076327501942032 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 330 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 12 | 24 | 350912 | 0x7f7031f1d600 | 0x7f6f26237a00 | 2329572 | 2329572 | 150766 | 18636584 | 65536 | 2280499819 | 18463002 | 0 | 9123823536 | 12076327501966948 | 12076327502177803 | 12076327503717156 | 12076327503790938 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 332 | 921529 | 921534 | 4194304 | 256 | 0 | 0 | 12 | 24 | 0 | 0x7f7031f1d500 | 0x7f6f26237a40 | 6814428 | 6814428 | 414267 | 54515432 | 65536 | 6722407797 | 54333595 | 0 | 26891453672 | 12076327503817648 | 12076327504026421 | 12076327508552803 | 12076327508625613 |