46 KiB
46 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | GRBM_COUNT | GRBM_GUI_ACTIVE | SQ_WAVES | SQ_IFETCH | SQ_IFETCH_LEVEL | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBuffer.kd | 0 | 0 | 0 | 919533 | 919538 | 33554432 | 256 | 0 | 0 | 8 | 32 | 6464 | 0x0 | 0x7f539a404180 | 510905 | 510905 | 524288 | 6291456 | 791255 | 101484656 | 12076299622617100 | 12076299868527949 | 12076299868855467 | 12076299868966179 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 919533 | 919538 | 32768 | 256 | 0 | 0 | 24 | 24 | 12480 | 0x0 | 0x7f539a435100 | 29103 | 29103 | 512 | 8192 | 11024 | 1421636 | 12076299883226411 | 12076299883536030 | 12076299883542910 | 12076299883550754 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 4 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 12928 | 0x7f54a6102900 | 0x7f539a435140 | 214348 | 214348 | 65536 | 917504 | 141051 | 18053272 | 12076299883612759 | 12076299883846109 | 12076299883977148 | 12076299883980823 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 6 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 36 | 24 | 13632 | 0x7f54a6102800 | 0x7f539a435180 | 393217 | 393217 | 65536 | 1245184 | 183556 | 23413388 | 12076299884057155 | 12076299884237467 | 12076299884488185 | 12076299884558838 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 8 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 14080 | 0x7f54a6102700 | 0x7f539a4351c0 | 398588 | 398588 | 65536 | 983040 | 136711 | 17472264 | 12076299884591839 | 12076299884784344 | 12076299885038582 | 12076299885110302 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 10 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14528 | 0x7f54a6102600 | 0x7f539a435200 | 214801 | 214801 | 65536 | 1048576 | 159691 | 20414844 | 12076299885131732 | 12076299885331861 | 12076299885463220 | 12076299885466665 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 12 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14976 | 0x7f54a6102500 | 0x7f539a435240 | 217772 | 217772 | 65536 | 983040 | 151837 | 19401912 | 12076299885514403 | 12076299885699699 | 12076299885832498 | 12076299885835941 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 14 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 15424 | 0x7f54a6102400 | 0x7f539a435280 | 213089 | 213089 | 65536 | 1048576 | 146940 | 18850908 | 12076299885918775 | 12076299886104337 | 12076299886234736 | 12076299886238199 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 16 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16128 | 0x7f54a6102300 | 0x7f539a4352c0 | 392820 | 392820 | 65536 | 1572864 | 229355 | 29302276 | 12076299886293581 | 12076299886473935 | 12076299886724174 | 12076299886768474 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 18 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16832 | 0x7f54a6102a00 | 0x7f539a435300 | 392001 | 392001 | 65536 | 1179648 | 157851 | 20274332 | 12076299886793070 | 12076299886995532 | 12076299887245771 | 12076299887287509 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 20 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 17536 | 0x7f54a6102900 | 0x7f539a435340 | 214059 | 214059 | 65536 | 1114112 | 163347 | 20901004 | 12076299887319879 | 12076299887507530 | 12076299887638569 | 12076299887641777 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 22 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18240 | 0x7f54a6102800 | 0x7f539a435380 | 213545 | 213545 | 65536 | 1114112 | 158333 | 20302232 | 12076299887686510 | 12076299887871688 | 12076299888002567 | 12076299888006064 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 24 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18944 | 0x7f54a6102700 | 0x7f539a4353c0 | 212651 | 212651 | 65536 | 1179648 | 178701 | 22843900 | 12076299888075042 | 12076299888246086 | 12076299888375525 | 12076299888379017 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 26 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 19904 | 0x7f54a6102600 | 0x7f539a435400 | 398465 | 398465 | 65536 | 1835008 | 254566 | 32610180 | 12076299888427387 | 12076299888607044 | 12076299888860963 | 12076299888929360 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 28 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 20608 | 0x7f54a6102500 | 0x7f539a435440 | 397484 | 397484 | 65536 | 1310720 | 177927 | 22757004 | 12076299888953455 | 12076299889151681 | 12076299889405280 | 12076299889475224 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 30 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 21312 | 0x7f54a6102400 | 0x7f539a435480 | 209321 | 209321 | 65536 | 1245184 | 181910 | 23327888 | 12076299889500501 | 12076299889689118 | 12076299889817278 | 12076299889820717 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 32 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22016 | 0x7f54a6102300 | 0x7f539a4354c0 | 213411 | 213411 | 65536 | 1310720 | 180276 | 23055180 | 12076299889872613 | 12076299890057756 | 12076299890188476 | 12076299890191896 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 34 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22720 | 0x7f54a6102a00 | 0x7f539a435500 | 220089 | 220089 | 65536 | 1310720 | 180034 | 23026544 | 12076299890256567 | 12076299890424475 | 12076299890559354 | 12076299890562736 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 36 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 23680 | 0x7f54a6102900 | 0x7f539a435540 | 398091 | 398091 | 65536 | 2097152 | 286809 | 36778484 | 12076299890615644 | 12076299890793913 | 12076299891048471 | 12076299891092440 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 38 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 24384 | 0x7f54a6102800 | 0x7f539a435580 | 399921 | 399921 | 65536 | 1441792 | 196270 | 25189740 | 12076299891117106 | 12076299891306070 | 12076299891561909 | 12076299891628837 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 40 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25088 | 0x7f54a6102700 | 0x7f539a4355c0 | 210100 | 210100 | 65536 | 1376256 | 190752 | 24365644 | 12076299891652300 | 12076299891837907 | 12076299891966067 | 12076299891969560 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 42 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25792 | 0x7f54a6102600 | 0x7f539a435600 | 208553 | 208553 | 65536 | 1507328 | 223099 | 28554880 | 12076299892027548 | 12076299892208945 | 12076299892336305 | 12076299892339918 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 44 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 26496 | 0x7f54a6102500 | 0x7f539a435640 | 212075 | 212075 | 65536 | 1441792 | 200081 | 25562192 | 12076299892403136 | 12076299892573263 | 12076299892702383 | 12076299892705808 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 46 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 27712 | 0x7f54a6102400 | 0x7f539a435680 | 398945 | 398945 | 65536 | 2359296 | 321994 | 41224232 | 12076299892749179 | 12076299892932942 | 12076299893188460 | 12076299893258766 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 48 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 28416 | 0x7f54a6102300 | 0x7f539a4356c0 | 394531 | 394531 | 65536 | 1572864 | 212336 | 27147804 | 12076299893282670 | 12076299893472299 | 12076299893723817 | 12076299893791165 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 50 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 29120 | 0x7f54a6102a00 | 0x7f539a435700 | 215913 | 215913 | 65536 | 1507328 | 209863 | 26846108 | 12076299893815110 | 12076299894006696 | 12076299894139015 | 12076299894142278 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 52 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30080 | 0x7f54a6102900 | 0x7f539a435740 | 211651 | 211651 | 65536 | 1703936 | 230651 | 29594612 | 12076299894195176 | 12076299894374854 | 12076299894504293 | 12076299894507787 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 54 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30784 | 0x7f54a6102800 | 0x7f539a435780 | 216225 | 216225 | 65536 | 1572864 | 213205 | 27280232 | 12076299894573189 | 12076299894740452 | 12076299894873412 | 12076299894876943 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 56 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32000 | 0x7f54a6102700 | 0x7f539a4357c0 | 391100 | 391100 | 65536 | 2621440 | 361835 | 46493032 | 12076299894928780 | 12076299895117410 | 12076299895367809 | 12076299895436623 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 58 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32960 | 0x7f54a6102600 | 0x7f539a435800 | 395977 | 395977 | 65536 | 1703936 | 230470 | 29523928 | 12076299895464836 | 12076299895648928 | 12076299895902526 | 12076299895969594 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 60 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 33920 | 0x7f54a6102500 | 0x7f539a435840 | 211483 | 211483 | 65536 | 1638400 | 227044 | 29065240 | 12076299895996444 | 12076299896188125 | 12076299896317404 | 12076299896321187 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 62 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 34880 | 0x7f54a6102400 | 0x7f539a435880 | 218505 | 218505 | 65536 | 1900544 | 268741 | 34343524 | 12076299896374006 | 12076299896548923 | 12076299896683802 | 12076299896687218 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 64 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 35840 | 0x7f54a6102300 | 0x7f539a4358c0 | 278476 | 278476 | 65536 | 1703936 | 232489 | 29686064 | 12076299896750916 | 12076299896920441 | 12076299897092280 | 12076299897096027 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 66 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 37312 | 0x7f54a6102a00 | 0x7f539a435900 | 400697 | 400697 | 65536 | 2883584 | 394892 | 50507760 | 12076299897149537 | 12076299897335319 | 12076299897592437 | 12076299897661218 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 68 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 38272 | 0x7f54a6102900 | 0x7f539a435940 | 389276 | 389276 | 65536 | 1835008 | 245721 | 31376504 | 12076299897684311 | 12076299897872916 | 12076299898121395 | 12076299898189369 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 70 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 39232 | 0x7f54a6102800 | 0x7f539a435980 | 216113 | 216113 | 65536 | 1769472 | 278643 | 35676384 | 12076299898214446 | 12076299898407633 | 12076299898540753 | 12076299898544099 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 72 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 40192 | 0x7f54a6102700 | 0x7f539a4359c0 | 223708 | 223708 | 65536 | 2097152 | 328429 | 42225068 | 12076299898595925 | 12076299898772751 | 12076299898908751 | 12076299898912052 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 74 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 41152 | 0x7f54a6102600 | 0x7f539a435a00 | 279257 | 279257 | 65536 | 1835008 | 248776 | 31844500 | 12076299898977955 | 12076299899151949 | 12076299899326669 | 12076299899330370 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 76 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 42624 | 0x7f54a6102500 | 0x7f539a435a40 | 396443 | 396443 | 65536 | 3145728 | 432501 | 55279636 | 12076299899374973 | 12076299899558667 | 12076299899812426 | 12076299899880893 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 78 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 43584 | 0x7f54a6102400 | 0x7f539a435a80 | 397537 | 397537 | 65536 | 1966080 | 269365 | 34482060 | 12076299899905459 | 12076299900098665 | 12076299900353703 | 12076299900423141 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 80 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 44544 | 0x7f54a6102300 | 0x7f539a435ac0 | 214636 | 214636 | 65536 | 1900544 | 271973 | 34786028 | 12076299900445933 | 12076299900640422 | 12076299900772101 | 12076299900775465 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 82 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 45760 | 0x7f54a6102a00 | 0x7f539a435b00 | 215705 | 215705 | 65536 | 2293760 | 305665 | 39246868 | 12076299900827522 | 12076299901005220 | 12076299901138659 | 12076299901142448 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 84 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 46720 | 0x7f54a6102900 | 0x7f539a435b40 | 276028 | 276028 | 65536 | 1966080 | 284612 | 36382880 | 12076299901206637 | 12076299901379298 | 12076299901551777 | 12076299901555385 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 86 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 48448 | 0x7f54a6102800 | 0x7f539a435b80 | 414577 | 414577 | 65536 | 3407872 | 461566 | 59220616 | 12076299901598976 | 12076299901782816 | 12076299902049374 | 12076299902118672 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 88 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 49408 | 0x7f54a6102700 | 0x7f539a435bc0 | 395507 | 395507 | 65536 | 2097152 | 276323 | 35383616 | 12076299902143187 | 12076299902331613 | 12076299902585052 | 12076299902626285 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 90 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 50368 | 0x7f54a6102600 | 0x7f539a435c00 | 213993 | 213993 | 65536 | 2031616 | 292874 | 37532392 | 12076299902655550 | 12076299902832890 | 12076299902964090 | 12076299902967529 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 92 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 51584 | 0x7f54a6102500 | 0x7f539a435c40 | 227012 | 227012 | 65536 | 2490368 | 335111 | 42932600 | 12076299903018795 | 12076299903201048 | 12076299903341528 | 12076299903345021 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 94 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 52544 | 0x7f54a6102400 | 0x7f539a435c80 | 211969 | 211969 | 65536 | 2097152 | 290284 | 37168948 | 12076299903410232 | 12076299903577687 | 12076299903707926 | 12076299903711522 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 96 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 54272 | 0x7f54a6102300 | 0x7f539a435cc0 | 405019 | 405019 | 65536 | 3670016 | 489204 | 62811988 | 12076299903766123 | 12076299903942645 | 12076299904203283 | 12076299904274047 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 98 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 55488 | 0x7f54a6102a00 | 0x7f539a435d00 | 387121 | 387121 | 65536 | 2228224 | 300500 | 38430084 | 12076299904299815 | 12076299904489682 | 12076299904738801 | 12076299904806727 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 100 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 56704 | 0x7f54a6102900 | 0x7f539a435d40 | 212323 | 212323 | 65536 | 2162688 | 296477 | 38039316 | 12076299904831223 | 12076299905016239 | 12076299905145678 | 12076299905149134 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 102 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 58176 | 0x7f54a6102800 | 0x7f539a435d80 | 227017 | 227017 | 65536 | 2686976 | 387552 | 49471624 | 12076299905201812 | 12076299905382957 | 12076299905524076 | 12076299905527427 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 104 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 59392 | 0x7f54a6102700 | 0x7f539a435dc0 | 208539 | 208539 | 65536 | 2228224 | 306254 | 39183484 | 12076299905592618 | 12076299905760395 | 12076299905888235 | 12076299905891694 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 106 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 61376 | 0x7f54a6102600 | 0x7f539a435e00 | 406425 | 406425 | 65536 | 3932160 | 532180 | 67960200 | 12076299905944893 | 12076299906131113 | 12076299906393352 | 12076299906437829 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 108 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 62592 | 0x7f54a6102500 | 0x7f539a435e40 | 402036 | 402036 | 65536 | 2359296 | 313357 | 40150908 | 12076299906463286 | 12076299906646311 | 12076299906904229 | 12076299906945743 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 110 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 63808 | 0x7f54a6102400 | 0x7f539a435e80 | 210913 | 210913 | 65536 | 2293760 | 340510 | 43490748 | 12076299906976740 | 12076299907159908 | 12076299907289827 | 12076299907293609 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 112 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 65280 | 0x7f54a6102300 | 0x7f539a435ec0 | 222268 | 222268 | 65536 | 2883584 | 431367 | 55156600 | 12076299907346998 | 12076299907529186 | 12076299907666785 | 12076299907670369 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 114 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 66496 | 0x7f54a6102a00 | 0x7f539a435f00 | 212353 | 212353 | 65536 | 2359296 | 349015 | 44610384 | 12076299907735420 | 12076299907901504 | 12076299908032223 | 12076299908035578 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 116 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 68480 | 0x7f54a6102900 | 0x7f539a435f40 | 406948 | 406948 | 65536 | 4194304 | 581524 | 74373760 | 12076299908090300 | 12076299908265662 | 12076299908527741 | 12076299908596621 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 118 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 69696 | 0x7f54a6102800 | 0x7f539a435f80 | 387321 | 387321 | 65536 | 2490368 | 330981 | 42359592 | 12076299908623451 | 12076299908804699 | 12076299909054138 | 12076299909124372 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 120 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 70912 | 0x7f54a6102700 | 0x7f539a435fc0 | 214035 | 214035 | 65536 | 2424832 | 354206 | 45414804 | 12076299909149408 | 12076299909335257 | 12076299909467096 | 12076299909470314 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 122 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 72384 | 0x7f54a6102600 | 0x7f539a436000 | 220241 | 220241 | 65536 | 3080192 | 450511 | 57638424 | 12076299909524826 | 12076299909690295 | 12076299909827574 | 12076299909830804 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 124 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 73600 | 0x7f54a6102500 | 0x7f539a436040 | 214363 | 214363 | 65536 | 2490368 | 355067 | 45513180 | 12076299909894413 | 12076299910060853 | 12076299910192532 | 12076299910196484 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 126 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 75840 | 0x7f54a6102400 | 0x7f539a436080 | 408577 | 408577 | 65536 | 4456448 | 579780 | 74345736 | 12076299910247970 | 12076299910427571 | 12076299910691410 | 12076299910758899 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 128 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 77056 | 0x7f54a6102300 | 0x7f539a4360c0 | 394324 | 394324 | 65536 | 2621440 | 343762 | 44075296 | 12076299910782082 | 12076299910970928 | 12076299911224687 | 12076299911292661 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 130 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 78272 | 0x7f54a6102a00 | 0x7f539a436100 | 213665 | 213665 | 65536 | 2555904 | 367477 | 47012136 | 12076299911317978 | 12076299911506286 | 12076299911638445 | 12076299911641600 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 132 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 80000 | 0x7f54a6102900 | 0x7f539a436140 | 231796 | 231796 | 65536 | 3276800 | 477202 | 60917452 | 12076299911693586 | 12076299911867244 | 12076299912011883 | 12076299912015815 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 134 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 81216 | 0x7f54a6102800 | 0x7f539a436180 | 211569 | 211569 | 65536 | 2621440 | 363595 | 46544632 | 12076299912081447 | 12076299912249162 | 12076299912379561 | 12076299912383218 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 136 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 83456 | 0x7f54a6102700 | 0x7f539a4361c0 | 411667 | 411667 | 65536 | 4718592 | 656067 | 84140872 | 12076299912435525 | 12076299912608040 | 12076299912874118 | 12076299912917100 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 138 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 84928 | 0x7f54a6102600 | 0x7f539a436200 | 391777 | 391777 | 65536 | 2752512 | 361371 | 46213224 | 12076299912940474 | 12076299913132997 | 12076299913385316 | 12076299913455200 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 140 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 86400 | 0x7f54a6102500 | 0x7f539a436240 | 219084 | 219084 | 65536 | 2686976 | 394766 | 50465020 | 12076299913480026 | 12076299913665154 | 12076299913800354 | 12076299913803758 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 142 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 88128 | 0x7f54a6102400 | 0x7f539a436280 | 241329 | 241329 | 65536 | 3473408 | 556381 | 71237200 | 12076299913855885 | 12076299914037472 | 12076299914188192 | 12076299914191569 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 144 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 89600 | 0x7f54a6102300 | 0x7f539a4362c0 | 212492 | 212492 | 65536 | 2752512 | 386737 | 49462240 | 12076299914270686 | 12076299914438430 | 12076299914568990 | 12076299914572587 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 146 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 92096 | 0x7f54a6102a00 | 0x7f539a436300 | 413625 | 413625 | 65536 | 4980736 | 659950 | 84737104 | 12076299914624844 | 12076299914798909 | 12076299915064507 | 12076299915115676 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 148 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 93568 | 0x7f54a6102900 | 0x7f539a436340 | 391372 | 391372 | 65536 | 2883584 | 385374 | 49326632 | 12076299915140793 | 12076299915326906 | 12076299915578904 | 12076299915627608 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 150 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 95040 | 0x7f54a6102800 | 0x7f539a436380 | 218273 | 218273 | 65536 | 2818048 | 419903 | 53706572 | 12076299915647925 | 12076299915837143 | 12076299915972022 | 12076299915975454 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 152 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 96768 | 0x7f54a6102700 | 0x7f539a4363c0 | 251587 | 251587 | 65536 | 3670016 | 530319 | 67833120 | 12076299916030316 | 12076299916209301 | 12076299916366740 | 12076299916370618 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 154 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 98240 | 0x7f54a6102600 | 0x7f539a436400 | 218801 | 218801 | 65536 | 2883584 | 443148 | 56649432 | 12076299916433185 | 12076299916599219 | 12076299916734578 | 12076299916737931 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 156 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 100736 | 0x7f54a6102500 | 0x7f539a436440 | 404363 | 404363 | 65536 | 5177344 | 685648 | 87529560 | 12076299916788315 | 12076299916963057 | 12076299917224656 | 12076299917275029 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 158 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 102208 | 0x7f54a6102400 | 0x7f539a436480 | 397073 | 397073 | 65536 | 3014656 | 398099 | 50926840 | 12076299917298503 | 12076299917487055 | 12076299917743373 | 12076299917791469 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 160 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 103680 | 0x7f54a6102300 | 0x7f539a4364c0 | 223547 | 223547 | 65536 | 2949120 | 499932 | 63983460 | 12076299917814452 | 12076299918004492 | 12076299918142411 | 12076299918145928 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 162 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 105664 | 0x7f54a6102a00 | 0x7f539a436500 | 264505 | 264505 | 65536 | 3866624 | 590898 | 75688444 | 12076299918198806 | 12076299918375530 | 12076299918542569 | 12076299918545951 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 164 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 107136 | 0x7f54a6102900 | 0x7f539a436540 | 219499 | 219499 | 65536 | 3014656 | 407783 | 52170012 | 12076299918610331 | 12076299918775208 | 12076299918910087 | 12076299918914416 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 166 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 109888 | 0x7f54a6102800 | 0x7f539a436580 | 408329 | 408329 | 65536 | 5439488 | 728725 | 93307600 | 12076299918965180 | 12076299919147526 | 12076299919409925 | 12076299919461152 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 168 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 111360 | 0x7f54a6102700 | 0x7f539a4365c0 | 394907 | 394907 | 65536 | 3145728 | 420648 | 53828316 | 12076299919484686 | 12076299919670243 | 12076299919924802 | 12076299919972953 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 170 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 112832 | 0x7f54a6102600 | 0x7f539a436600 | 216569 | 216569 | 65536 | 3080192 | 476862 | 60953660 | 12076299919995876 | 12076299920187361 | 12076299920321120 | 12076299920325108 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 172 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 114816 | 0x7f54a6102500 | 0x7f539a436640 | 277483 | 277483 | 65536 | 4063232 | 561121 | 71822404 | 12076299920371744 | 12076299920556159 | 12076299920730558 | 12076299920734308 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 174 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 116288 | 0x7f54a6102400 | 0x7f539a436680 | 212657 | 212657 | 65536 | 3145728 | 427720 | 54716052 | 12076299920799579 | 12076299920963677 | 12076299921095036 | 12076299921099006 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 176 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 119040 | 0x7f54a6102300 | 0x7f539a4366c0 | 400571 | 400571 | 65536 | 5701632 | 743935 | 94963868 | 12076299921150992 | 12076299921329115 | 12076299921588633 | 12076299921637066 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 178 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 120768 | 0x7f54a6102a00 | 0x7f539a436700 | 395201 | 395201 | 65536 | 3276800 | 447138 | 57230528 | 12076299921661822 | 12076299921846872 | 12076299922101911 | 12076299922150851 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 180 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 122496 | 0x7f54a6102900 | 0x7f539a436740 | 223844 | 223844 | 65536 | 3211264 | 482379 | 61662540 | 12076299922173773 | 12076299922362229 | 12076299922500629 | 12076299922504287 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 182 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 124736 | 0x7f54a6102800 | 0x7f539a436780 | 288777 | 288777 | 65536 | 4259840 | 607340 | 77619552 | 12076299922548660 | 12076299922731187 | 12076299922914547 | 12076299922917856 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 184 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 126464 | 0x7f54a6102700 | 0x7f539a4367c0 | 226412 | 226412 | 65536 | 3276800 | 535703 | 68596192 | 12076299922981244 | 12076299923153745 | 12076299923293745 | 12076299923297732 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 186 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 127936 | 0x7f54a6102600 | 0x7f539a436800 | 410545 | 410545 | 65536 | 7733248 | 974305 | 124912844 | 12076299923349478 | 12076299923546063 | 12076299923812782 | 12076299923859997 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 188 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 129664 | 0x7f54a6102500 | 0x7f539a436840 | 402724 | 402724 | 65536 | 3407872 | 454256 | 58389876 | 12076299923882859 | 12076299924073581 | 12076299924333739 | 12076299924382588 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 190 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 131392 | 0x7f54a6102400 | 0x7f539a436880 | 217577 | 217577 | 65536 | 3342336 | 456477 | 58455472 | 12076299924407815 | 12076299924597898 | 12076299924732297 | 12076299924736025 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 192 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 133632 | 0x7f54a6102300 | 0x7f539a4368c0 | 302051 | 302051 | 65536 | 4456448 | 640004 | 82269060 | 12076299924792089 | 12076299924963496 | 12076299925155015 | 12076299925203845 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 194 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 135360 | 0x7f54a6102a00 | 0x7f539a436900 | 215145 | 215145 | 65536 | 3538944 | 490420 | 62641808 | 12076299925240813 | 12076299925410854 | 12076299925543973 | 12076299925547663 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 196 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 136832 | 0x7f54a6102900 | 0x7f539a436940 | 437076 | 437076 | 65536 | 8978432 | 1131317 | 144600808 | 12076299925593228 | 12076299925771972 | 12076299926056770 | 12076299926103917 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 198 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 138560 | 0x7f54a6102800 | 0x7f539a436980 | 389345 | 389345 | 65536 | 3670016 | 479222 | 61424280 | 12076299926122672 | 12076299926315489 | 12076299926567488 | 12076299926614336 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 200 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 140288 | 0x7f54a6102700 | 0x7f539a4369c0 | 219715 | 219715 | 65536 | 3604480 | 543259 | 69579764 | 12076299926638932 | 12076299926830206 | 12076299926966046 | 12076299926969756 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 202 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 142784 | 0x7f54a6102600 | 0x7f539a436a00 | 330785 | 330785 | 65536 | 4849664 | 735877 | 94024956 | 12076299927026863 | 12076299927213404 | 12076299927424123 | 12076299927471599 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 204 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 144768 | 0x7f54a6102500 | 0x7f539a436a40 | 219067 | 219067 | 65536 | 3801088 | 601072 | 76954544 | 12076299927509309 | 12076299927675482 | 12076299927810841 | 12076299927814526 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 206 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 145728 | 0x7f54a6102400 | 0x7f539a436a80 | 470385 | 470385 | 65536 | 14548992 | 1832714 | 234663380 | 12076299927866513 | 12076299928051800 | 12076299928359478 | 12076299928408891 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 208 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 147712 | 0x7f54a6102300 | 0x7f539a436ac0 | 407483 | 407483 | 65536 | 3932160 | 522533 | 67088484 | 12076299928434649 | 12076299928618677 | 12076299928882196 | 12076299928929148 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 210 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 149696 | 0x7f54a6102a00 | 0x7f539a436b00 | 216841 | 216841 | 65536 | 3866624 | 602869 | 77157604 | 12076299928951980 | 12076299929145874 | 12076299929280274 | 12076299929284548 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 212 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 152192 | 0x7f54a6102900 | 0x7f539a436b40 | 356148 | 356148 | 65536 | 5242880 | 750550 | 96037116 | 12076299929336835 | 12076299929513392 | 12076299929741071 | 12076299929788054 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 214 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 154176 | 0x7f54a6102800 | 0x7f539a436b80 | 221153 | 221153 | 65536 | 4063232 | 581531 | 74441840 | 12076299929823279 | 12076299929994190 | 12076299930131789 | 12076299930135400 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 216 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 155648 | 0x7f54a6102700 | 0x7f539a436bc0 | 504355 | 504355 | 65536 | 10027008 | 1259275 | 161391076 | 12076299930188228 | 12076299930365228 | 12076299930695306 | 12076299930742458 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 218 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 157632 | 0x7f54a6102600 | 0x7f539a436c00 | 398585 | 398585 | 65536 | 4194304 | 600322 | 76837356 | 12076299930765611 | 12076299930949865 | 12076299931207944 | 12076299931255491 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 220 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 159616 | 0x7f54a6102500 | 0x7f539a436c40 | 224748 | 224748 | 65536 | 4128768 | 582931 | 74613476 | 12076299931280878 | 12076299931469170 | 12076299931608530 | 12076299931615480 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 222 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 162368 | 0x7f54a6102400 | 0x7f539a436c80 | 381473 | 381473 | 65536 | 5636096 | 774439 | 99074516 | 12076299931666515 | 12076299931843887 | 12076299932089006 | 12076299932138602 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 224 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 164608 | 0x7f54a6102300 | 0x7f539a436cc0 | 219852 | 219852 | 65536 | 4587520 | 636011 | 81425624 | 12076299932175792 | 12076299932348525 | 12076299932484204 | 12076299932487551 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 226 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 166336 | 0x7f54a6102a00 | 0x7f539a436d00 | 575009 | 575009 | 65536 | 11075584 | 1395290 | 178377424 | 12076299932539177 | 12076299932714923 | 12076299933092362 | 12076299933139863 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 228 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 168576 | 0x7f54a6102900 | 0x7f539a436d40 | 404540 | 404540 | 65536 | 4718592 | 639390 | 82178140 | 12076299933164709 | 12076299933360200 | 12076299933622279 | 12076299933668666 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 230 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 170816 | 0x7f54a6102800 | 0x7f539a436d80 | 232913 | 232913 | 65536 | 4653056 | 733715 | 94047532 | 12076299933691589 | 12076299933886118 | 12076299934031557 | 12076299934035287 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 232 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 174080 | 0x7f54a6102700 | 0x7f539a436dc0 | 438427 | 438427 | 65536 | 6422528 | 893536 | 115027880 | 12076299934088015 | 12076299934265956 | 12076299934546115 | 12076299934570151 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 234 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 176576 | 0x7f54a6102600 | 0x7f539a436e00 | 223985 | 223985 | 65536 | 5111808 | 810645 | 103823888 | 12076299934628580 | 12076299934794754 | 12076299934934433 | 12076299934937925 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 236 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 177792 | 0x7f54a6102500 | 0x7f539a436e40 | 647819 | 647819 | 65536 | 15007744 | 1882223 | 240987232 | 12076299934984261 | 12076299935169472 | 12076299935595390 | 12076299935645730 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 238 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 180288 | 0x7f54a6102400 | 0x7f539a436e80 | 395465 | 395465 | 65536 | 5242880 | 718781 | 92425140 | 12076299935670536 | 12076299935861149 | 12076299936117948 | 12076299936166809 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 240 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 182784 | 0x7f54a6102300 | 0x7f539a436ec0 | 231915 | 231915 | 65536 | 5177344 | 862288 | 110298624 | 12076299936191294 | 12076299936379226 | 12076299936521786 | 12076299936525275 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 242 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 186304 | 0x7f54a6102a00 | 0x7f539a436f00 | 531153 | 531153 | 65536 | 7208960 | 1062588 | 135960020 | 12076299936579065 | 12076299936753305 | 12076299937096983 | 12076299937146670 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 244 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 189312 | 0x7f54a6102900 | 0x7f539a436f40 | 244604 | 244604 | 65536 | 6160384 | 911662 | 116689268 | 12076299937181705 | 12076299937358422 | 12076299937510901 | 12076299937514073 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 246 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 190784 | 0x7f54a6102800 | 0x7f539a436f80 | 784073 | 784073 | 65536 | 17104896 | 2144722 | 274642756 | 12076299937565298 | 12076299937740660 | 12076299938258098 | 12076299938306686 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 248 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 193792 | 0x7f54a6102700 | 0x7f539a436fc0 | 459491 | 459491 | 65536 | 6291456 | 960581 | 122933792 | 12076299938335519 | 12076299938523857 | 12076299938824815 | 12076299938871986 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 250 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 196800 | 0x7f54a6102600 | 0x7f539a437000 | 248777 | 248777 | 65536 | 6225920 | 963195 | 123194468 | 12076299938888657 | 12076299939095694 | 12076299939252653 | 12076299939256160 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 252 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 201088 | 0x7f54a6102500 | 0x7f539a437040 | 592603 | 592603 | 65536 | 8781824 | 1248748 | 158885572 | 12076299939311473 | 12076299939490092 | 12076299939875530 | 12076299939922749 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 254 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 204608 | 0x7f54a6102400 | 0x7f539a437080 | 278337 | 278337 | 65536 | 7208960 | 1042106 | 133458592 | 12076299939958085 | 12076299940132809 | 12076299940309768 | 12076299940313405 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 256 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 206080 | 0x7f54a6102300 | 0x7f539a4370c0 | 924339 | 924339 | 65536 | 19202048 | 2411222 | 308188192 | 12076299940358298 | 12076299940542247 | 12076299941152964 | 12076299941201095 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 258 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 209600 | 0x7f54a6102a00 | 0x7f539a437100 | 504497 | 504497 | 65536 | 7340032 | 977946 | 125177312 | 12076299941224939 | 12076299941418083 | 12076299941749602 | 12076299941796631 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 260 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 213120 | 0x7f54a6102900 | 0x7f539a437140 | 282692 | 282692 | 65536 | 7274496 | 1062869 | 135987200 | 12076299941819424 | 12076299942010560 | 12076299942189760 | 12076299942193369 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 262 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 218176 | 0x7f54a6102800 | 0x7f539a437180 | 698657 | 698657 | 65536 | 10354688 | 1488537 | 190776492 | 12076299942245826 | 12076299942421598 | 12076299942878236 | 12076299942925399 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 264 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 222208 | 0x7f54a6102700 | 0x7f539a4371c0 | 312723 | 312723 | 65536 | 8257536 | 1184176 | 151611196 | 12076299942961436 | 12076299943135035 | 12076299943334394 | 12076299943383300 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 266 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 223936 | 0x7f54a6102600 | 0x7f539a437200 | 1066265 | 1066265 | 65536 | 21299200 | 2669401 | 341698144 | 12076299943407475 | 12076299943595033 | 12076299944299350 | 12076299944347582 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 268 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 227968 | 0x7f54a6102500 | 0x7f539a437240 | 606580 | 606580 | 65536 | 8388608 | 1172274 | 150354736 | 12076299944372919 | 12076299944560949 | 12076299944959987 | 12076299945015463 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 270 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 232000 | 0x7f54a6102400 | 0x7f539a437280 | 320545 | 320545 | 65536 | 8323072 | 1287436 | 164707516 | 12076299945045129 | 12076299945260145 | 12076299945464144 | 12076299945514651 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 272 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 237824 | 0x7f54a6102300 | 0x7f539a4372c0 | 803284 | 803284 | 65536 | 11927552 | 1690594 | 216700224 | 12076299945538165 | 12076299945723343 | 12076299946249901 | 12076299946298969 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 274 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 242368 | 0x7f54a6102a00 | 0x7f539a437300 | 350361 | 350361 | 65536 | 9306112 | 1410890 | 180543672 | 12076299946334164 | 12076299946504460 | 12076299946728939 | 12076299946776927 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 276 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 243584 | 0x7f54a6102900 | 0x7f539a437340 | 1207459 | 1207459 | 65536 | 29163520 | 3650494 | 467433600 | 12076299946800210 | 12076299946987497 | 12076299947787814 | 12076299947857215 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 278 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 248128 | 0x7f54a6102800 | 0x7f539a437380 | 635801 | 635801 | 65536 | 9437184 | 1240813 | 159316744 | 12076299947880518 | 12076299948066852 | 12076299948486850 | 12076299948555883 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 280 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 252672 | 0x7f54a6102700 | 0x7f539a4373c0 | 354308 | 354308 | 65536 | 9371648 | 1435958 | 183748864 | 12076299948580429 | 12076299948765249 | 12076299948992768 | 12076299949039592 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 282 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 259264 | 0x7f54a6102600 | 0x7f539a437400 | 910449 | 910449 | 65536 | 13500416 | 1900792 | 243030416 | 12076299949064489 | 12076299949250527 | 12076299949848604 | 12076299949915520 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 284 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 264832 | 0x7f54a6102500 | 0x7f539a437440 | 418508 | 418508 | 65536 | 11403264 | 1737440 | 222385492 | 12076299949952028 | 12076299950134363 | 12076299950403962 | 12076299950472906 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 286 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 266304 | 0x7f54a6102400 | 0x7f539a437480 | 1487497 | 1487497 | 65536 | 33357824 | 4175603 | 534728884 | 12076299950496259 | 12076299950682680 | 12076299951668276 | 12076299951735442 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 288 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 28 | 24 | 271872 | 0x7f54a6102300 | 0x7f539a4374c0 | 803932 | 803932 | 65536 | 11534336 | 1585432 | 203111956 | 12076299951753095 | 12076299951954514 | 12076299952486832 | 12076299952557250 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 290 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 277440 | 0x7f54a6102a00 | 0x7f539a437500 | 423657 | 423657 | 65536 | 11534336 | 1744628 | 223243148 | 12076299952580894 | 12076299952773871 | 12076299953047149 | 12076299953116068 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 292 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 12 | 24 | 279936 | 0x7f54a6102900 | 0x7f539a437540 | 1133852 | 1133852 | 65536 | 19267584 | 2424400 | 310155488 | 12076299953145423 | 12076299953332268 | 12076299954075145 | 12076299954143688 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 294 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 286528 | 0x7f54a6102800 | 0x7f539a437580 | 489825 | 489825 | 65536 | 13500416 | 2051702 | 262603160 | 12076299954186958 | 12076299954357063 | 12076299954674342 | 12076299954742280 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 296 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 288000 | 0x7f54a6102700 | 0x7f539a4375c0 | 1770043 | 1770043 | 65536 | 37552128 | 4700917 | 601623552 | 12076299954771234 | 12076299954958340 | 12076299956130175 | 12076299956200400 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 298 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 32 | 24 | 294592 | 0x7f54a6102600 | 0x7f539a437600 | 918673 | 918673 | 65536 | 13631488 | 1853505 | 237302996 | 12076299956233161 | 12076299956412894 | 12076299957022171 | 12076299957090504 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 300 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 301184 | 0x7f54a6102500 | 0x7f539a437640 | 492492 | 492492 | 65536 | 13631488 | 2101299 | 269030052 | 12076299957108227 | 12076299957312410 | 12076299957632248 | 12076299957700478 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 302 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 12 | 24 | 304960 | 0x7f54a6102400 | 0x7f539a437680 | 1336121 | 1336121 | 65536 | 21692416 | 2755337 | 352715068 | 12076299957729702 | 12076299957909687 | 12076299958788403 | 12076299958858109 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 304 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 24 | 24 | 313600 | 0x7f54a6102300 | 0x7f539a4376c0 | 629595 | 629595 | 65536 | 17694720 | 2657523 | 340168852 | 12076299958895098 | 12076299959061521 | 12076299959471600 | 12076299959540468 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 306 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 314816 | 0x7f54a6102a00 | 0x7f539a437700 | 2332353 | 2332353 | 65536 | 57475072 | 7193193 | 920743084 | 12076299959563090 | 12076299959755438 | 12076299961303271 | 12076299961372392 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 308 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 317568 | 0x7f54a6102900 | 0x7f539a437740 | 1202236 | 1202236 | 65536 | 19660800 | 2472188 | 316437508 | 12076299961406285 | 12076299961593830 | 12076299962388866 | 12076299962457359 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 310 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 12 | 24 | 320320 | 0x7f54a6102800 | 0x7f539a437780 | 640153 | 640153 | 65536 | 20381696 | 2572355 | 329398180 | 12076299962487775 | 12076299962673505 | 12076299963088863 | 12076299963156267 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 312 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 12 | 24 | 324096 | 0x7f54a6102700 | 0x7f539a4377c0 | 1757699 | 1757699 | 65536 | 28704768 | 3615591 | 462741080 | 12076299963183398 | 12076299963372381 | 12076299964531576 | 12076299964599109 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 314 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 12 | 24 | 328896 | 0x7f54a6102600 | 0x7f539a437800 | 1201873 | 1201873 | 65536 | 36634624 | 4670909 | 597570484 | 12076299964644974 | 12076299964814775 | 12076299965601491 | 12076299965672544 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 316 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 330112 | 0x7f54a6102500 | 0x7f539a437840 | 4584116 | 4584116 | 65536 | 105840640 | 13239672 | 1694957244 | 12076299965707038 | 12076299965893490 | 12076299968943876 | 12076299969024754 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 318 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 332864 | 0x7f54a6102400 | 0x7f539a437880 | 2323753 | 2323753 | 65536 | 38535168 | 4844852 | 619388704 | 12076299969050391 | 12076299969242114 | 12076299970786267 | 12076299970853623 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 320 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 12 | 24 | 335616 | 0x7f54a6102300 | 0x7f539a4378c0 | 1203387 | 1203387 | 65536 | 39124992 | 4926957 | 630479052 | 12076299970884630 | 12076299971076346 | 12076299971867542 | 12076299971937918 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 322 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 12 | 24 | 339392 | 0x7f54a6102a00 | 0x7f539a437900 | 3442505 | 3442505 | 65536 | 55771136 | 7005437 | 897087700 | 12076299971961672 | 12076299972158581 | 12076299974440650 | 12076299974508375 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 324 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 12 | 24 | 344192 | 0x7f54a6102900 | 0x7f539a437940 | 2323300 | 2323300 | 65536 | 72548352 | 9110641 | 1166105176 | 12076299974553378 | 12076299974721449 | 12076299976257602 | 12076299976325552 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 326 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 345408 | 0x7f54a6102800 | 0x7f539a437980 | 9086817 | 9086817 | 65536 | 210698240 | 26341194 | 3373172476 | 12076299976350268 | 12076299976542880 | 12076299982597252 | 12076299982669983 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 328 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 20 | 24 | 348160 | 0x7f54a6102700 | 0x7f539a4379c0 | 4573883 | 4573883 | 65536 | 76283904 | 9551789 | 1222432152 | 12076299982699107 | 12076299982887171 | 12076299985928917 | 12076299985985855 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 330 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 12 | 24 | 350912 | 0x7f54a6102600 | 0x7f539a437a00 | 2328849 | 2328849 | 65536 | 77398016 | 9707252 | 1242251888 | 12076299986021972 | 12076299986298995 | 12076299987838668 | 12076299987886678 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 332 | 919533 | 919538 | 4194304 | 256 | 0 | 0 | 12 | 24 | 0 | 0x7f54a6102500 | 0x7f539a437a40 | 6812940 | 6812940 | 65536 | 110821376 | 13888106 | 1777123712 | 12076299987917555 | 12076299988114347 | 12076299992641046 | 12076299992713007 |