43 KiB
43 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | SQ_INSTS_VMEM | SQ_INST_LEVEL_VMEM | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBuffer.kd | 0 | 0 | 0 | 926143 | 926148 | 33554432 | 256 | 0 | 0 | 8 | 32 | 6464 | 0x0 | 0x7f15cfa04180 | 1048576 | 11235576 | 1438147260 | 12076419454465812 | 12076419701214917 | 12076419701539876 | 12076419701649649 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 926143 | 926148 | 32768 | 256 | 0 | 0 | 24 | 24 | 12480 | 0x0 | 0x7f15cfa35100 | 4096 | 113930 | 14569884 | 12076419716046811 | 12076419716351528 | 12076419716357928 | 12076419716368830 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 4 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 12928 | 0x7f16ffbde900 | 0x7f15cfa35140 | 524288 | 9932637 | 1271377396 | 12076419716430033 | 12076419716641287 | 12076419716781447 | 12076419716785163 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 6 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 36 | 24 | 13632 | 0x7f16ffbde800 | 0x7f15cfa35180 | 524288 | 12650009 | 1619133560 | 12076419716858309 | 12076419717036805 | 12076419717293764 | 12076419717361805 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 8 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 14080 | 0x7f16ffbde700 | 0x7f15cfa351c0 | 524288 | 14218994 | 1819959540 | 12076419717394686 | 12076419717580963 | 12076419717836002 | 12076419717900566 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 10 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14528 | 0x7f16ffbde600 | 0x7f15cfa35200 | 524288 | 10134990 | 1297298864 | 12076419717927867 | 12076419718122560 | 12076419718263680 | 12076419718267338 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 12 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14976 | 0x7f16ffbde500 | 0x7f15cfa35240 | 524288 | 10522452 | 1346830292 | 12076419718315237 | 12076419718496959 | 12076419718635838 | 12076419718639199 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 14 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 15424 | 0x7f16ffbde400 | 0x7f15cfa35280 | 524288 | 12575047 | 1609534080 | 12076419718722002 | 12076419718892637 | 12076419719023196 | 12076419719026829 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 16 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16128 | 0x7f16ffbde300 | 0x7f15cfa352c0 | 524288 | 13499725 | 1727935092 | 12076419719082873 | 12076419719248635 | 12076419719507354 | 12076419719548739 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 18 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16832 | 0x7f16ffbdea00 | 0x7f15cfa35300 | 524288 | 13945398 | 1784989992 | 12076419719577081 | 12076419719754873 | 12076419720010232 | 12076419720048998 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 20 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 17536 | 0x7f16ffbde900 | 0x7f15cfa35340 | 524288 | 12025815 | 1539260420 | 12076419720073384 | 12076419720266231 | 12076419720399670 | 12076419720403016 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 22 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18240 | 0x7f16ffbde800 | 0x7f15cfa35380 | 524288 | 10151841 | 1299452388 | 12076419720453660 | 12076419720625109 | 12076419720765909 | 12076419720769277 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 24 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18944 | 0x7f16ffbde700 | 0x7f15cfa353c0 | 524288 | 12422833 | 1590058864 | 12076419720832394 | 12076419720997268 | 12076419721127667 | 12076419721131219 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 26 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 19904 | 0x7f16ffbde600 | 0x7f15cfa35400 | 524288 | 14359223 | 1837934960 | 12076419721175461 | 12076419721366706 | 12076419721622545 | 12076419721688936 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 28 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 20608 | 0x7f16ffbde500 | 0x7f15cfa35440 | 524288 | 13616119 | 1742818184 | 12076419721715104 | 12076419721903183 | 12076419722163182 | 12076419722229380 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 30 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 21312 | 0x7f16ffbde400 | 0x7f15cfa35480 | 524288 | 11963320 | 1531205796 | 12076419722255639 | 12076419722439341 | 12076419722573260 | 12076419722576665 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 32 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22016 | 0x7f16ffbde300 | 0x7f15cfa354c0 | 524288 | 11971440 | 1532310640 | 12076419722627249 | 12076419722797099 | 12076419722930379 | 12076419722933789 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 34 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22720 | 0x7f16ffbdea00 | 0x7f15cfa35500 | 524288 | 12526194 | 1603316120 | 12076419722997968 | 12076419723171658 | 12076419723302537 | 12076419723305930 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 36 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 23680 | 0x7f16ffbde900 | 0x7f15cfa35540 | 524288 | 13579446 | 1738117372 | 12076419723361614 | 12076419723522856 | 12076419723779335 | 12076419723818994 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 38 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 24384 | 0x7f16ffbde800 | 0x7f15cfa35580 | 524288 | 13634272 | 1745161624 | 12076419723843128 | 12076419724035014 | 12076419724288773 | 12076419724354088 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 40 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25088 | 0x7f16ffbde700 | 0x7f15cfa355c0 | 524288 | 12791268 | 1637275336 | 12076419724380597 | 12076419724566852 | 12076419724696291 | 12076419724699770 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 42 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25792 | 0x7f16ffbde600 | 0x7f15cfa35600 | 524288 | 12614511 | 1614587116 | 12076419724750875 | 12076419724919170 | 12076419725050209 | 12076419725053648 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 44 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 26496 | 0x7f16ffbde500 | 0x7f15cfa35640 | 524288 | 10832190 | 1386395268 | 12076419725118218 | 12076419725286528 | 12076419725425408 | 12076419725428815 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 46 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 27712 | 0x7f16ffbde400 | 0x7f15cfa35680 | 524288 | 13632238 | 1744907120 | 12076419725484148 | 12076419725645567 | 12076419725907165 | 12076419725971413 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 48 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 28416 | 0x7f16ffbde300 | 0x7f15cfa356c0 | 524288 | 13771485 | 1762706476 | 12076419725998924 | 12076419726185404 | 12076419726475483 | 12076419726541643 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 50 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 29120 | 0x7f16ffbdea00 | 0x7f15cfa35700 | 524288 | 13303305 | 1702877092 | 12076419726567631 | 12076419726744922 | 12076419726872761 | 12076419726876144 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 52 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30080 | 0x7f16ffbde900 | 0x7f15cfa35740 | 524288 | 12550002 | 1606301404 | 12076419726928572 | 12076419727120600 | 12076419727253079 | 12076419727256762 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 54 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30784 | 0x7f16ffbde800 | 0x7f15cfa35780 | 524288 | 11732690 | 1501738368 | 12076419727321452 | 12076419727485398 | 12076419727618678 | 12076419727622151 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 56 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32000 | 0x7f16ffbde700 | 0x7f15cfa357c0 | 524288 | 13594804 | 1740117220 | 12076419727672434 | 12076419727854197 | 12076419728115476 | 12076419728182041 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 58 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32960 | 0x7f16ffbde600 | 0x7f15cfa35800 | 524288 | 14002558 | 1792280688 | 12076419728206246 | 12076419728394034 | 12076419728650353 | 12076419728714731 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 60 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 33920 | 0x7f16ffbde500 | 0x7f15cfa35840 | 524288 | 13297888 | 1702194480 | 12076419728740398 | 12076419728918992 | 12076419729046191 | 12076419729049663 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 62 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 34880 | 0x7f16ffbde400 | 0x7f15cfa35880 | 524288 | 11036975 | 1412656480 | 12076419729101870 | 12076419729274830 | 12076419729414190 | 12076419729417627 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 64 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 35840 | 0x7f16ffbde300 | 0x7f15cfa358c0 | 524288 | 12064695 | 1544174712 | 12076419729481355 | 12076419729643789 | 12076419729777388 | 12076419729781012 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 66 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 37312 | 0x7f16ffbdea00 | 0x7f15cfa35900 | 524288 | 13992599 | 1791038892 | 12076419729832929 | 12076419729999307 | 12076419730264266 | 12076419730331876 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 68 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 38272 | 0x7f16ffbde900 | 0x7f15cfa35940 | 524288 | 14148259 | 1810968936 | 12076419730357393 | 12076419730541705 | 12076419730800904 | 12076419730865147 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 70 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 39232 | 0x7f16ffbde800 | 0x7f15cfa35980 | 524288 | 11125993 | 1424117500 | 12076419730892608 | 12076419731072902 | 12076419731210342 | 12076419731214336 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 72 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 40192 | 0x7f16ffbde700 | 0x7f15cfa359c0 | 524288 | 10084763 | 1290837788 | 12076419731265290 | 12076419731445861 | 12076419731587620 | 12076419731591076 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 74 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 41152 | 0x7f16ffbde600 | 0x7f15cfa35a00 | 524288 | 12558509 | 1607538740 | 12076419731652129 | 12076419731814979 | 12076419731944898 | 12076419731948430 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 76 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 42624 | 0x7f16ffbde500 | 0x7f15cfa35a40 | 524288 | 13082130 | 1674490432 | 12076419731999465 | 12076419732170497 | 12076419732428416 | 12076419732494144 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 78 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 43584 | 0x7f16ffbde400 | 0x7f15cfa35a80 | 524288 | 13847702 | 1772499852 | 12076419732520312 | 12076419732699295 | 12076419732957534 | 12076419732996277 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 80 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 44544 | 0x7f16ffbde300 | 0x7f15cfa35ac0 | 524288 | 11468388 | 1467834704 | 12076419733026553 | 12076419733209693 | 12076419733346492 | 12076419733350495 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 82 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 45760 | 0x7f16ffbdea00 | 0x7f15cfa35b00 | 524288 | 12082807 | 1546534344 | 12076419733401630 | 12076419733568571 | 12076419733702010 | 12076419733705735 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 84 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 46720 | 0x7f16ffbde900 | 0x7f15cfa35b40 | 524288 | 12626036 | 1616066040 | 12076419733768943 | 12076419733934649 | 12076419734065369 | 12076419734069211 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 86 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 48448 | 0x7f16ffbde800 | 0x7f15cfa35b80 | 524288 | 13597815 | 1740456364 | 12076419734123141 | 12076419734289528 | 12076419734547767 | 12076419734613873 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 88 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 49408 | 0x7f16ffbde700 | 0x7f15cfa35bc0 | 524288 | 13489008 | 1726536356 | 12076419734640001 | 12076419734817845 | 12076419735076084 | 12076419735144909 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 90 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 50368 | 0x7f16ffbde600 | 0x7f15cfa35c00 | 524288 | 11695156 | 1496917184 | 12076419735168814 | 12076419735356243 | 12076419735491442 | 12076419735494890 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 92 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 51584 | 0x7f16ffbde500 | 0x7f15cfa35c40 | 524288 | 10806002 | 1383095088 | 12076419735544171 | 12076419735718961 | 12076419735857841 | 12076419735861231 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 94 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 52544 | 0x7f16ffbde400 | 0x7f15cfa35c80 | 524288 | 11546421 | 1477881944 | 12076419735925420 | 12076419736099120 | 12076419736233679 | 12076419736237209 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 96 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 54272 | 0x7f16ffbde300 | 0x7f15cfa35cc0 | 524288 | 13282244 | 1700109596 | 12076419736289176 | 12076419736458638 | 12076419736724877 | 12076419736764098 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 98 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 55488 | 0x7f16ffbdea00 | 0x7f15cfa35d00 | 524288 | 13800773 | 1766498772 | 12076419736790928 | 12076419736967596 | 12076419737227115 | 12076419737292550 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 100 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 56704 | 0x7f16ffbde900 | 0x7f15cfa35d40 | 524288 | 10684886 | 1367631768 | 12076419737320763 | 12076419737498633 | 12076419737677833 | 12076419737681353 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 102 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 58176 | 0x7f16ffbde800 | 0x7f15cfa35d80 | 524288 | 9240099 | 1182787640 | 12076419737730654 | 12076419737903112 | 12076419738046471 | 12076419738050198 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 104 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 59392 | 0x7f16ffbde700 | 0x7f15cfa35dc0 | 524288 | 10612981 | 1358397244 | 12076419738111913 | 12076419738279270 | 12076419738417989 | 12076419738421438 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 106 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 61376 | 0x7f16ffbde600 | 0x7f15cfa35e00 | 524288 | 13014361 | 1665823616 | 12076419738476370 | 12076419738638628 | 12076419738906467 | 12076419738970027 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 108 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 62592 | 0x7f16ffbde500 | 0x7f15cfa35e40 | 524288 | 13630352 | 1744659328 | 12076419738992188 | 12076419739183586 | 12076419739442785 | 12076419739507085 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 110 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 63808 | 0x7f16ffbde400 | 0x7f15cfa35e80 | 524288 | 12468798 | 1596038064 | 12076419739530358 | 12076419739716383 | 12076419739847423 | 12076419739850884 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 112 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 65280 | 0x7f16ffbde300 | 0x7f15cfa35ec0 | 524288 | 8904529 | 1139698516 | 12076419739899504 | 12076419740082142 | 12076419740223901 | 12076419740227554 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 114 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 66496 | 0x7f16ffbdea00 | 0x7f15cfa35f00 | 524288 | 12370887 | 1583431280 | 12076419740290230 | 12076419740453500 | 12076419740584860 | 12076419740588314 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 116 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 68480 | 0x7f16ffbde900 | 0x7f15cfa35f40 | 524288 | 13110109 | 1678148832 | 12076419740636744 | 12076419740807899 | 12076419741072057 | 12076419741120583 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 118 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 69696 | 0x7f16ffbde800 | 0x7f15cfa35f80 | 524288 | 13741493 | 1758862948 | 12076419741144608 | 12076419741329176 | 12076419741588535 | 12076419741653844 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 120 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 70912 | 0x7f16ffbde700 | 0x7f15cfa35fc0 | 524288 | 11624397 | 1487900776 | 12076419741679472 | 12076419741859094 | 12076419741993813 | 12076419741997222 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 122 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 72384 | 0x7f16ffbde600 | 0x7f15cfa36000 | 524288 | 7568327 | 968789468 | 12076419742052585 | 12076419742216692 | 12076419742356692 | 12076419742360077 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 124 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 73600 | 0x7f16ffbde500 | 0x7f15cfa36040 | 524288 | 12602644 | 1613187088 | 12076419742422933 | 12076419742591091 | 12076419742722290 | 12076419742725666 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 126 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 75840 | 0x7f16ffbde400 | 0x7f15cfa36080 | 524288 | 12822906 | 1641339488 | 12076419742774978 | 12076419742954449 | 12076419743224688 | 12076419743270098 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 128 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 77056 | 0x7f16ffbde300 | 0x7f15cfa360c0 | 524288 | 13272155 | 1698845652 | 12076419743295224 | 12076419743480527 | 12076419743738285 | 12076419743783522 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 130 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 78272 | 0x7f16ffbdea00 | 0x7f15cfa36100 | 524288 | 12357104 | 1581714688 | 12076419743811033 | 12076419743986924 | 12076419744161803 | 12076419744165421 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 132 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 80000 | 0x7f16ffbde900 | 0x7f15cfa36140 | 524288 | 7452354 | 953935248 | 12076419744216146 | 12076419744384042 | 12076419744528522 | 12076419744532243 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 134 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 81216 | 0x7f16ffbde800 | 0x7f15cfa36180 | 524288 | 10799160 | 1382315056 | 12076419744594849 | 12076419744756521 | 12076419744894280 | 12076419744897902 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 136 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 83456 | 0x7f16ffbde700 | 0x7f15cfa361c0 | 524288 | 11621612 | 1487492088 | 12076419744947595 | 12076419745123239 | 12076419745390118 | 12076419745438617 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 138 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 84928 | 0x7f16ffbde600 | 0x7f15cfa36200 | 524288 | 14245893 | 1823434328 | 12076419745464305 | 12076419745644837 | 12076419745898756 | 12076419745944277 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 140 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 86400 | 0x7f16ffbde500 | 0x7f15cfa36240 | 524288 | 12767954 | 1634375672 | 12076419745970616 | 12076419746153635 | 12076419746283074 | 12076419746286723 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 142 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 88128 | 0x7f16ffbde400 | 0x7f15cfa36280 | 524288 | 5697241 | 729125280 | 12076419746333620 | 12076419746510273 | 12076419746659872 | 12076419746663443 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 144 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 89600 | 0x7f16ffbde300 | 0x7f15cfa362c0 | 524288 | 10216473 | 1307689068 | 12076419746746287 | 12076419746906111 | 12076419747046111 | 12076419747050011 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 146 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 92096 | 0x7f16ffbdea00 | 0x7f15cfa36300 | 524288 | 13382971 | 1713031608 | 12076419747101237 | 12076419747273149 | 12076419747543548 | 12076419747587470 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 148 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 93568 | 0x7f16ffbde900 | 0x7f15cfa36340 | 524288 | 13468522 | 1723959132 | 12076419747613338 | 12076419747788827 | 12076419748052506 | 12076419748076549 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 150 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 95040 | 0x7f16ffbde800 | 0x7f15cfa36380 | 524288 | 10807028 | 1383189828 | 12076419748120330 | 12076419748281785 | 12076419748419704 | 12076419748423464 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 152 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 96768 | 0x7f16ffbde700 | 0x7f15cfa363c0 | 524288 | 4922915 | 630018076 | 12076419748474558 | 12076419748638103 | 12076419748796663 | 12076419748800103 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 154 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 98240 | 0x7f16ffbde600 | 0x7f15cfa36400 | 524288 | 11576770 | 1481758252 | 12076419748863241 | 12076419749028342 | 12076419749163061 | 12076419749166705 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 156 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 100736 | 0x7f16ffbde500 | 0x7f15cfa36440 | 524288 | 10739718 | 1374671612 | 12076419749218120 | 12076419749388180 | 12076419749654259 | 12076419749677354 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 158 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 102208 | 0x7f16ffbde400 | 0x7f15cfa36480 | 524288 | 13403285 | 1715657016 | 12076419749720904 | 12076419749882098 | 12076419750145457 | 12076419750171822 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 160 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 103680 | 0x7f16ffbde300 | 0x7f15cfa364c0 | 524288 | 11599650 | 1484735640 | 12076419750214993 | 12076419750375856 | 12076419750510895 | 12076419750514509 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 162 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 105664 | 0x7f16ffbdea00 | 0x7f15cfa36500 | 524288 | 4176806 | 534666028 | 12076419750564502 | 12076419750736654 | 12076419750902893 | 12076419750906417 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 164 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 107136 | 0x7f16ffbde900 | 0x7f15cfa36540 | 524288 | 11916952 | 1525457836 | 12076419750967451 | 12076419751135852 | 12076419751311851 | 12076419751315888 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 166 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 109888 | 0x7f16ffbde800 | 0x7f15cfa36580 | 524288 | 9783081 | 1252203708 | 12076419751370660 | 12076419751550890 | 12076419751816489 | 12076419751834071 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 168 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 111360 | 0x7f16ffbde700 | 0x7f15cfa365c0 | 524288 | 13787281 | 1764732572 | 12076419751879996 | 12076419752045608 | 12076419752302887 | 12076419752327889 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 170 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 112832 | 0x7f16ffbde600 | 0x7f15cfa36600 | 524288 | 10574874 | 1353548796 | 12076419752371330 | 12076419752533286 | 12076419752674565 | 12076419752678300 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 172 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 114816 | 0x7f16ffbde500 | 0x7f15cfa36640 | 524288 | 3663019 | 468760404 | 12076419752728694 | 12076419752895524 | 12076419753069603 | 12076419753073064 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 174 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 116288 | 0x7f16ffbde400 | 0x7f15cfa36680 | 524288 | 10296488 | 1317928156 | 12076419753139617 | 12076419753300802 | 12076419753440162 | 12076419753444013 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 176 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 119040 | 0x7f16ffbde300 | 0x7f15cfa366c0 | 524288 | 8792622 | 1125398008 | 12076419753497653 | 12076419753656961 | 12076419753920800 | 12076419753941738 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 178 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 120768 | 0x7f16ffbdea00 | 0x7f15cfa36700 | 524288 | 13463530 | 1723278100 | 12076419753987032 | 12076419754151839 | 12076419754409597 | 12076419754434093 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 180 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 122496 | 0x7f16ffbde900 | 0x7f15cfa36740 | 524288 | 11360430 | 1454099464 | 12076419754480980 | 12076419754639996 | 12076419754778556 | 12076419754782410 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 182 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 124736 | 0x7f16ffbde800 | 0x7f15cfa36780 | 524288 | 3289089 | 421102728 | 12076419754833715 | 12076419755000155 | 12076419755183674 | 12076419755187573 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 184 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 126464 | 0x7f16ffbde700 | 0x7f15cfa367c0 | 524288 | 10857078 | 1389600764 | 12076419755250600 | 12076419755411833 | 12076419755552312 | 12076419755555697 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 186 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 127936 | 0x7f16ffbde600 | 0x7f15cfa36800 | 524288 | 4296045 | 549827380 | 12076419755606271 | 12076419755772311 | 12076419756038870 | 12076419756060805 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 188 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 129664 | 0x7f16ffbde500 | 0x7f15cfa36840 | 524288 | 12559210 | 1607562724 | 12076419756111780 | 12076419756275189 | 12076419756532148 | 12076419756553160 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 190 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 131392 | 0x7f16ffbde400 | 0x7f15cfa36880 | 524288 | 11018463 | 1410468844 | 12076419756601290 | 12076419756762707 | 12076419756900146 | 12076419756904132 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 192 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 133632 | 0x7f16ffbde300 | 0x7f15cfa368c0 | 524288 | 3286275 | 420710296 | 12076419756954696 | 12076419757125425 | 12076419757316784 | 12076419757342487 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 194 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 135360 | 0x7f16ffbdea00 | 0x7f15cfa36900 | 524288 | 10931657 | 1399263692 | 12076419757401026 | 12076419757564303 | 12076419757701423 | 12076419757705311 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 196 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 136832 | 0x7f16ffbde900 | 0x7f15cfa36940 | 524288 | 2882634 | 369029716 | 12076419757758119 | 12076419757929742 | 12076419758213260 | 12076419758237710 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 198 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 138560 | 0x7f16ffbde800 | 0x7f15cfa36980 | 524288 | 13539606 | 1733047088 | 12076419758280350 | 12076419758439499 | 12076419758700298 | 12076419758722070 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 200 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 140288 | 0x7f16ffbde700 | 0x7f15cfa369c0 | 524288 | 10858837 | 1389900844 | 12076419758766162 | 12076419758925737 | 12076419759063497 | 12076419759067192 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 202 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 142784 | 0x7f16ffbde600 | 0x7f15cfa36a00 | 524288 | 3492710 | 447156220 | 12076419759116764 | 12076419759286696 | 12076419759497095 | 12076419759518120 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 204 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 144768 | 0x7f16ffbde500 | 0x7f15cfa36a40 | 524288 | 10311426 | 1319845012 | 12076419759583742 | 12076419759747173 | 12076419759887813 | 12076419759891654 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 206 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 145728 | 0x7f16ffbde400 | 0x7f15cfa36a80 | 524288 | 2584237 | 330650512 | 12076419759941657 | 12076419760113732 | 12076419760421250 | 12076419760443098 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 208 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 147712 | 0x7f16ffbde300 | 0x7f15cfa36ac0 | 524288 | 13582899 | 1738623920 | 12076419760489094 | 12076419760651809 | 12076419760909728 | 12076419760931306 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 210 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 149696 | 0x7f16ffbdea00 | 0x7f15cfa36b00 | 524288 | 10290712 | 1317106924 | 12076419760975468 | 12076419761141887 | 12076419761280927 | 12076419761284973 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 212 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 152192 | 0x7f16ffbde900 | 0x7f15cfa36b40 | 524288 | 3256102 | 416808376 | 12076419761329235 | 12076419761503326 | 12076419761730685 | 12076419761752221 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 214 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 154176 | 0x7f16ffbde800 | 0x7f15cfa36b80 | 524288 | 9672407 | 1238099976 | 12076419761812072 | 12076419761972763 | 12076419762115003 | 12076419762118912 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 216 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 155648 | 0x7f16ffbde700 | 0x7f15cfa36bc0 | 524288 | 2470691 | 316154976 | 12076419762169797 | 12076419762340922 | 12076419762699000 | 12076419762720430 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 218 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 157632 | 0x7f16ffbde600 | 0x7f15cfa36c00 | 524288 | 14169863 | 1813664860 | 12076419762766887 | 12076419762933079 | 12076419763194838 | 12076419763216732 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 220 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 159616 | 0x7f16ffbde500 | 0x7f15cfa36c40 | 524288 | 9597579 | 1228425524 | 12076419763262888 | 12076419763434997 | 12076419763576116 | 12076419763580068 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 222 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 162368 | 0x7f16ffbde400 | 0x7f15cfa36c80 | 524288 | 3247764 | 415764752 | 12076419763630201 | 12076419763810035 | 12076419764054354 | 12076419764076530 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 224 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 164608 | 0x7f16ffbde300 | 0x7f15cfa36cc0 | 524288 | 9742968 | 1247132976 | 12076419764144847 | 12076419764315346 | 12076419764454866 | 12076419764462197 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 226 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 166336 | 0x7f16ffbdea00 | 0x7f15cfa36d00 | 524288 | 2413434 | 308894408 | 12076419764508533 | 12076419764686384 | 12076419765063822 | 12076419765085605 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 228 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 168576 | 0x7f16ffbde900 | 0x7f15cfa36d40 | 524288 | 13213049 | 1691347596 | 12076419765136149 | 12076419765305261 | 12076419765567020 | 12076419765587678 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 230 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 170816 | 0x7f16ffbde800 | 0x7f15cfa36d80 | 524288 | 9364538 | 1198648088 | 12076419765632572 | 12076419765799819 | 12076419765937739 | 12076419765941355 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 232 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 174080 | 0x7f16ffbde700 | 0x7f15cfa36dc0 | 524288 | 3163886 | 404905764 | 12076419765999223 | 12076419766172618 | 12076419766453416 | 12076419766478223 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 234 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 176576 | 0x7f16ffbde600 | 0x7f15cfa36e00 | 524288 | 8618968 | 1103276532 | 12076419766541871 | 12076419766711015 | 12076419766851655 | 12076419766855233 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 236 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 177792 | 0x7f16ffbde500 | 0x7f15cfa36e40 | 524288 | 2397778 | 306754452 | 12076419766899225 | 12076419767096774 | 12076419767545412 | 12076419767569561 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 238 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 180288 | 0x7f16ffbde400 | 0x7f15cfa36e80 | 524288 | 10266435 | 1314143496 | 12076419767611499 | 12076419767782851 | 12076419768048610 | 12076419768075591 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 240 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 182784 | 0x7f16ffbde300 | 0x7f15cfa36ec0 | 524288 | 7286336 | 932679168 | 12076419768119002 | 12076419768290049 | 12076419768430048 | 12076419768433687 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 242 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 186304 | 0x7f16ffbdea00 | 0x7f15cfa36f00 | 524288 | 3334545 | 426849952 | 12076419768484070 | 12076419768658848 | 12076419768974526 | 12076419768995360 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 244 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 189312 | 0x7f16ffbde900 | 0x7f15cfa36f40 | 524288 | 3565255 | 456377332 | 12076419769064699 | 12076419769236125 | 12076419769388445 | 12076419769392148 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 246 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 190784 | 0x7f16ffbde800 | 0x7f15cfa36f80 | 524288 | 2317698 | 296530068 | 12076419769442952 | 12076419769619484 | 12076419770137082 | 12076419770159113 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 248 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 193792 | 0x7f16ffbde700 | 0x7f15cfa36fc0 | 524288 | 7938901 | 1016173972 | 12076419770208314 | 12076419770374201 | 12076419770672919 | 12076419770693666 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 250 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 196800 | 0x7f16ffbde600 | 0x7f15cfa37000 | 524288 | 3104864 | 397385924 | 12076419770746274 | 12076419770915798 | 12076419771071158 | 12076419771074744 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 252 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 201088 | 0x7f16ffbde500 | 0x7f15cfa37040 | 524288 | 3440160 | 440354712 | 12076419771120720 | 12076419771313877 | 12076419771700115 | 12076419771722878 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 254 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 204608 | 0x7f16ffbde400 | 0x7f15cfa37080 | 524288 | 3499569 | 447761804 | 12076419771781948 | 12076419771951474 | 12076419772129073 | 12076419772132750 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 256 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 206080 | 0x7f16ffbde300 | 0x7f15cfa370c0 | 524288 | 2322279 | 297382816 | 12076419772183164 | 12076419772361713 | 12076419772972110 | 12076419772993229 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 258 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 209600 | 0x7f16ffbdea00 | 0x7f15cfa37100 | 524288 | 4687471 | 599967236 | 12076419773044895 | 12076419773213389 | 12076419773542828 | 12076419773565172 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 260 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 213120 | 0x7f16ffbde900 | 0x7f15cfa37140 | 524288 | 3134445 | 401100748 | 12076419773615485 | 12076419773776747 | 12076419773956586 | 12076419773959905 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 262 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 218176 | 0x7f16ffbde800 | 0x7f15cfa37180 | 524288 | 3449600 | 441565632 | 12076419774020248 | 12076419774179145 | 12076419774634503 | 12076419774660347 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 264 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 222208 | 0x7f16ffbde700 | 0x7f15cfa371c0 | 524288 | 3012688 | 385553424 | 12076419774719026 | 12076419774880262 | 12076419775080422 | 12076419775103671 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 266 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 223936 | 0x7f16ffbde600 | 0x7f15cfa37200 | 524288 | 2317675 | 296629780 | 12076419775152782 | 12076419775315461 | 12076419776025378 | 12076419776049869 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 268 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 227968 | 0x7f16ffbde500 | 0x7f15cfa37240 | 524288 | 3582948 | 458553456 | 12076419776098469 | 12076419776258657 | 12076419776632735 | 12076419776654853 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 270 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 232000 | 0x7f16ffbde400 | 0x7f15cfa37280 | 524288 | 3372621 | 431587368 | 12076419776702752 | 12076419776865214 | 12076419777069853 | 12076419777091965 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 272 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 237824 | 0x7f16ffbde300 | 0x7f15cfa372c0 | 524288 | 4235767 | 542137048 | 12076419777138372 | 12076419777299613 | 12076419777825690 | 12076419777848812 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 274 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 242368 | 0x7f16ffbdea00 | 0x7f15cfa37300 | 524288 | 3227945 | 413095592 | 12076419777907691 | 12076419778082009 | 12076419778306808 | 12076419778331819 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 276 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 243584 | 0x7f16ffbde900 | 0x7f15cfa37340 | 524288 | 2331359 | 298276120 | 12076419778375040 | 12076419778535768 | 12076419779334484 | 12076419779381650 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 278 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 248128 | 0x7f16ffbde800 | 0x7f15cfa37380 | 524288 | 3646321 | 466650632 | 12076419779413249 | 12076419779594643 | 12076419780016242 | 12076419780062846 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 280 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 252672 | 0x7f16ffbde700 | 0x7f15cfa373c0 | 524288 | 3069373 | 392860752 | 12076419780099003 | 12076419780275760 | 12076419780501360 | 12076419780545653 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 282 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 259264 | 0x7f16ffbde600 | 0x7f15cfa37400 | 524288 | 4498714 | 575853036 | 12076419780571691 | 12076419780747439 | 12076419781357676 | 12076419781407464 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 284 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 264832 | 0x7f16ffbde500 | 0x7f15cfa37440 | 524288 | 3250239 | 415946660 | 12076419781446307 | 12076419781619115 | 12076419781887274 | 12076419781932660 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 286 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 266304 | 0x7f16ffbde400 | 0x7f15cfa37480 | 524288 | 2348635 | 300565248 | 12076419781965291 | 12076419782147593 | 12076419783132069 | 12076419783201117 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 288 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 28 | 24 | 271872 | 0x7f16ffbde300 | 0x7f15cfa374c0 | 524288 | 3258044 | 417055000 | 12076419783231344 | 12076419783412708 | 12076419783926626 | 12076419783991366 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 290 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 277440 | 0x7f16ffbdea00 | 0x7f15cfa37500 | 524288 | 3331003 | 426407044 | 12076419784024598 | 12076419784204865 | 12076419784476863 | 12076419784542811 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 292 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 12 | 24 | 279936 | 0x7f16ffbde900 | 0x7f15cfa37540 | 524288 | 2203008 | 281996940 | 12076419784567226 | 12076419784753982 | 12076419785492379 | 12076419785558758 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 294 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 286528 | 0x7f16ffbde800 | 0x7f15cfa37580 | 524288 | 3427540 | 438670524 | 12076419785606818 | 12076419785769818 | 12076419786087097 | 12076419786152942 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 296 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 288000 | 0x7f16ffbde700 | 0x7f15cfa375c0 | 524288 | 2305235 | 294976492 | 12076419786181996 | 12076419786362936 | 12076419787532051 | 12076419787598639 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 298 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 32 | 24 | 294592 | 0x7f16ffbde600 | 0x7f15cfa37600 | 524288 | 3328555 | 426059916 | 12076419787633474 | 12076419787805490 | 12076419788415248 | 12076419788487230 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 300 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 301184 | 0x7f16ffbde500 | 0x7f15cfa37640 | 524288 | 3282040 | 420187656 | 12076419788523107 | 12076419788686446 | 12076419789005325 | 12076419789051328 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 302 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 12 | 24 | 304960 | 0x7f16ffbde400 | 0x7f15cfa37680 | 524288 | 2209680 | 282870116 | 12076419789081705 | 12076419789266764 | 12076419790145481 | 12076419790212626 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 304 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 24 | 24 | 313600 | 0x7f16ffbde300 | 0x7f15cfa376c0 | 524288 | 3285912 | 420519976 | 12076419790259744 | 12076419790424359 | 12076419790836038 | 12076419790900945 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 306 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 314816 | 0x7f16ffbdea00 | 0x7f15cfa37700 | 524288 | 2347010 | 300316852 | 12076419790935770 | 12076419791117157 | 12076419792666110 | 12076419792735033 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 308 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 317568 | 0x7f16ffbde900 | 0x7f15cfa37740 | 524288 | 2260873 | 289337444 | 12076419792765239 | 12076419792945309 | 12076419793740346 | 12076419793810231 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 310 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 12 | 24 | 320320 | 0x7f16ffbde800 | 0x7f15cfa37780 | 524288 | 2154223 | 275598132 | 12076419793839095 | 12076419794022265 | 12076419794437143 | 12076419794503389 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 312 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 12 | 24 | 324096 | 0x7f16ffbde700 | 0x7f15cfa377c0 | 524288 | 2258729 | 289016756 | 12076419794529287 | 12076419794707062 | 12076419795866097 | 12076419795933397 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 314 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 12 | 24 | 328896 | 0x7f16ffbde600 | 0x7f15cfa37800 | 524288 | 2232048 | 285605348 | 12076419795977028 | 12076419796144496 | 12076419796930413 | 12076419796997905 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 316 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 330112 | 0x7f16ffbde500 | 0x7f15cfa37840 | 524288 | 2667957 | 341497048 | 12076419797040504 | 12076419797202892 | 12076419800250560 | 12076419800318495 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 318 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 332864 | 0x7f16ffbde400 | 0x7f15cfa37880 | 524288 | 2328695 | 298075784 | 12076419800348060 | 12076419800530238 | 12076419802070552 | 12076419802137084 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 320 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 12 | 24 | 335616 | 0x7f16ffbde300 | 0x7f15cfa378c0 | 524288 | 2257633 | 289029596 | 12076419802171899 | 12076419802354711 | 12076419803144468 | 12076419803211461 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 322 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 12 | 24 | 339392 | 0x7f16ffbdea00 | 0x7f15cfa37900 | 524288 | 2540342 | 325203204 | 12076419803246916 | 12076419803419347 | 12076419805700778 | 12076419805767961 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 324 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 12 | 24 | 344192 | 0x7f16ffbde900 | 0x7f15cfa37940 | 524288 | 2385726 | 305461640 | 12076419805816361 | 12076419805980616 | 12076419807516450 | 12076419807585779 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 326 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 345408 | 0x7f16ffbde800 | 0x7f15cfa37980 | 524288 | 2908924 | 372222596 | 12076419807619912 | 12076419807793089 | 12076419813844585 | 12076419813913898 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 328 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 20 | 24 | 348160 | 0x7f16ffbde700 | 0x7f15cfa379c0 | 524288 | 3241827 | 414995268 | 12076419813943082 | 12076419814129383 | 12076419817170491 | 12076419817242613 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 330 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 12 | 24 | 350912 | 0x7f16ffbde600 | 0x7f15cfa37a00 | 524288 | 2393333 | 306301296 | 12076419817281385 | 12076419817450010 | 12076419818989204 | 12076419819055672 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 332 | 926143 | 926148 | 4194304 | 256 | 0 | 0 | 12 | 24 | 0 | 0x7f16ffbde500 | 0x7f15cfa37a40 | 524288 | 2515386 | 321843380 | 12076419819092290 | 12076419819259123 | 12076419823785664 | 12076419823852856 |