48 KiB
48 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | GRBM_COUNT | GRBM_GUI_ACTIVE | CPC_ME1_BUSY_FOR_PACKET_DECODE | SQ_CYCLES | SQ_WAVES | SQ_WAVE_CYCLES | SQ_BUSY_CYCLES | SQ_LEVEL_WAVES | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 236725 | 236725 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7fc8d4204280 | 388118 | 388118 | 8813 | 3104952 | 524288 | 245379700 | 3015215 | 0 | 997822932 | 17834114824366 | 17833406340767 | 17834261594719 | 17834261709089 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 236725 | 236725 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7fc8d4223f80 | 34226 | 34226 | 30380 | 273816 | 512 | 1732870 | 162674 | 0 | 6944808 | 17834266862991 | 17834261594719 | 17834267004326 | 17834267009117 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7fc8d71bf380 | 0x7fc8d4223fc0 | 166068 | 166068 | 13553 | 1328552 | 65536 | 78338107 | 1221027 | 0 | 315083700 | 17834267052826 | 17834267004326 | 17834267413606 | 17834267416207 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7fc8d71bf200 | 0x7fc8d4224000 | 309075 | 309075 | 24040 | 2472608 | 65536 | 207974461 | 2361927 | 0 | 833627480 | 17834267463736 | 17834267413606 | 17834267844007 | 17834267846456 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7fc8d71bf080 | 0x7fc8d4224040 | 312717 | 312717 | 25835 | 2501744 | 65536 | 225690218 | 2387810 | 0 | 904488700 | 17834267887865 | 17834267844007 | 17834268268807 | 17834268271026 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7fc8d4b91f00 | 0x7fc8d4224080 | 165971 | 165971 | 14858 | 1327776 | 65536 | 88194064 | 1222047 | 0 | 354501948 | 17834268313195 | 17834268268807 | 17834268603048 | 17834268605407 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7fc8d4b91d80 | 0x7fc8d42240c0 | 165219 | 165219 | 14018 | 1321760 | 65536 | 79047699 | 1212215 | 0 | 317927864 | 17834268645846 | 17834268603048 | 17834268930728 | 17834268933069 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7fc8d4b91c00 | 0x7fc8d4224100 | 164375 | 164375 | 14488 | 1315008 | 65536 | 91462162 | 1207066 | 0 | 367580624 | 17834268987318 | 17834268930728 | 17834269259369 | 17834269261561 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7fc8d4b91a80 | 0x7fc8d4224140 | 309703 | 309703 | 24852 | 2477632 | 65536 | 219777215 | 2368747 | 0 | 880840144 | 17834269301450 | 17834269259369 | 17834269686569 | 17834269688940 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7fc8d4b91900 | 0x7fc8d4224180 | 310809 | 310809 | 22257 | 2486480 | 65536 | 225212276 | 2380921 | 0 | 902579640 | 17834269729219 | 17834269686569 | 17834270108970 | 17834270111340 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7fc8d4b91780 | 0x7fc8d42241c0 | 165404 | 165404 | 14552 | 1323240 | 65536 | 80450116 | 1211697 | 0 | 323537692 | 17834270152509 | 17834270108970 | 17834270450890 | 17834270453171 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7fc8d4b91600 | 0x7fc8d4224200 | 165585 | 165585 | 14733 | 1324688 | 65536 | 89465853 | 1214515 | 0 | 359591852 | 17834270494250 | 17834270450890 | 17834270782411 | 17834270784683 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7fc8d71bf480 | 0x7fc8d4224240 | 166366 | 166366 | 14862 | 1330936 | 65536 | 91499648 | 1220000 | 0 | 367728464 | 17834270836062 | 17834270782411 | 17834271116011 | 17834271118425 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7fc8d71bf300 | 0x7fc8d4224280 | 312319 | 312319 | 24507 | 2498560 | 65536 | 233250131 | 2390649 | 0 | 934730296 | 17834271160384 | 17834271116011 | 17834271555532 | 17834271557414 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7fc8d71bf180 | 0x7fc8d42242c0 | 308649 | 308649 | 21619 | 2469200 | 65536 | 224851158 | 2359776 | 0 | 901134076 | 17834271600213 | 17834271555532 | 17834271944652 | 17834271946314 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7fc8d71bf000 | 0x7fc8d4224300 | 163725 | 163725 | 14889 | 1309808 | 65536 | 91154035 | 1208364 | 0 | 366346432 | 17834271989503 | 17834271944652 | 17834272252333 | 17834272254047 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7fc8d4b91e80 | 0x7fc8d4224340 | 163463 | 163463 | 14910 | 1307712 | 65536 | 95401874 | 1206350 | 0 | 383341996 | 17834272296706 | 17834272252333 | 17834272551373 | 17834272553179 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7fc8d4b91d00 | 0x7fc8d4224380 | 165174 | 165174 | 15006 | 1321400 | 65536 | 93783281 | 1212963 | 0 | 376860444 | 17834272601598 | 17834272551373 | 17834272857294 | 17834272859102 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7fc8d4b91b80 | 0x7fc8d42243c0 | 308899 | 308899 | 24067 | 2471200 | 65536 | 231007192 | 2364827 | 0 | 925758852 | 17834272905440 | 17834272857294 | 17834273249934 | 17834273251682 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7fc8d4b91a00 | 0x7fc8d4224400 | 309717 | 309717 | 24064 | 2477744 | 65536 | 223804023 | 2368967 | 0 | 896947924 | 17834273293911 | 17834273249934 | 17834273638895 | 17834273640612 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7fc8d4b91880 | 0x7fc8d4224440 | 164390 | 164390 | 15085 | 1315128 | 65536 | 93431898 | 1207629 | 0 | 375461760 | 17834273682421 | 17834273638895 | 17834273938095 | 17834273939705 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7fc8d4b91700 | 0x7fc8d4224480 | 164938 | 164938 | 14955 | 1319512 | 65536 | 107825297 | 1214954 | 0 | 433026808 | 17834273982454 | 17834273938095 | 17834274250575 | 17834274252317 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7fc8d71bf580 | 0x7fc8d42244c0 | 163684 | 163684 | 15364 | 1309480 | 65536 | 98572989 | 1202351 | 0 | 396025084 | 17834274303036 | 17834274250575 | 17834274560336 | 17834274561989 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7fc8d71bf400 | 0x7fc8d4224500 | 309216 | 309216 | 24259 | 2473736 | 65536 | 229456145 | 2366399 | 0 | 919555808 | 17834274608288 | 17834274560336 | 17834274967056 | 17834274968889 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7fc8d71bf280 | 0x7fc8d4224540 | 306859 | 306859 | 22328 | 2454880 | 65536 | 211370468 | 2340855 | 0 | 847210304 | 17834275011958 | 17834274967056 | 17834275359377 | 17834275361219 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7fc8d71bf100 | 0x7fc8d4224580 | 162796 | 162796 | 14816 | 1302376 | 65536 | 90130881 | 1195582 | 0 | 362264460 | 17834275404238 | 17834275359377 | 17834275659857 | 17834275661632 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7fc8d4b91f80 | 0x7fc8d42245c0 | 164176 | 164176 | 15291 | 1313416 | 65536 | 94637530 | 1203733 | 0 | 380286336 | 17834275703781 | 17834275659857 | 17834275964978 | 17834275966724 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7fc8d4b91e00 | 0x7fc8d4224600 | 164486 | 164486 | 15106 | 1315896 | 65536 | 98263113 | 1206137 | 0 | 394774388 | 17834276016083 | 17834275964978 | 17834276271378 | 17834276273017 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7fc8d4b91c80 | 0x7fc8d4224640 | 308147 | 308147 | 24483 | 2465184 | 65536 | 225461106 | 2358920 | 0 | 903576612 | 17834276314886 | 17834276271378 | 17834276663219 | 17834276665107 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7fc8d4b91b00 | 0x7fc8d4224680 | 306784 | 306784 | 21822 | 2454280 | 65536 | 212758018 | 2344118 | 0 | 852761708 | 17834276707936 | 17834276663219 | 17834277052179 | 17834277053737 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7fc8d4b91980 | 0x7fc8d42246c0 | 164291 | 164291 | 15379 | 1314336 | 65536 | 89768986 | 1209049 | 0 | 360811080 | 17834277096186 | 17834277052179 | 17834277355220 | 17834277357100 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7fc8d4b91800 | 0x7fc8d4224700 | 166338 | 166338 | 16385 | 1330712 | 65536 | 95949531 | 1221575 | 0 | 385529096 | 17834277398619 | 17834277355220 | 17834277660660 | 17834277662272 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7fc8d4b91680 | 0x7fc8d4224740 | 162847 | 162847 | 15060 | 1302784 | 65536 | 97505447 | 1200686 | 0 | 391750292 | 17834277710811 | 17834277660660 | 17834277967700 | 17834277969325 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7fc8d71bf500 | 0x7fc8d4224780 | 306864 | 306864 | 24043 | 2454920 | 65536 | 228596035 | 2350247 | 0 | 916117520 | 17834278011794 | 17834277967700 | 17834278362581 | 17834278364495 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7fc8d71bf380 | 0x7fc8d42247c0 | 307280 | 307280 | 22874 | 2458248 | 65536 | 219189165 | 2355632 | 0 | 878486864 | 17834278407854 | 17834278362581 | 17834278758901 | 17834278760595 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7fc8d71bf200 | 0x7fc8d4224800 | 163646 | 163646 | 15305 | 1309176 | 65536 | 92738259 | 1205867 | 0 | 372683892 | 17834278802324 | 17834278758901 | 17834279065622 | 17834279067307 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7fc8d71bf080 | 0x7fc8d4224840 | 162812 | 162812 | 15305 | 1302504 | 65536 | 91513072 | 1197944 | 0 | 367781628 | 17834279109276 | 17834279065622 | 17834279368342 | 17834279369940 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7fc8d4b91f00 | 0x7fc8d4224880 | 163697 | 163697 | 14743 | 1309584 | 65536 | 97528475 | 1204580 | 0 | 391844768 | 17834279418069 | 17834279368342 | 17834279676023 | 17834279677612 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7fc8d4b91d80 | 0x7fc8d42248c0 | 306817 | 306817 | 23855 | 2454544 | 65536 | 224074796 | 2348571 | 0 | 898027912 | 17834279723881 | 17834279676023 | 17834280077463 | 17834280079182 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7fc8d4b91c00 | 0x7fc8d4224900 | 303088 | 303088 | 21848 | 2424712 | 65536 | 215098226 | 2320002 | 0 | 862124472 | 17834280121761 | 17834280077463 | 17834280466424 | 17834280468003 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7fc8d4b91a80 | 0x7fc8d4224940 | 162715 | 162715 | 14617 | 1301728 | 65536 | 100141673 | 1199730 | 0 | 402297404 | 17834280509402 | 17834280466424 | 17834280770264 | 17834280771805 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7fc8d4b91900 | 0x7fc8d4224980 | 163608 | 163608 | 15486 | 1308872 | 65536 | 91950043 | 1202769 | 0 | 369547032 | 17834280813514 | 17834280770264 | 17834281073305 | 17834281075087 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7fc8d4b91780 | 0x7fc8d42249c0 | 162297 | 162297 | 14425 | 1298384 | 65536 | 94382812 | 1195314 | 0 | 379256192 | 17834281124096 | 17834281073305 | 17834281384345 | 17834281386110 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7fc8d4b91600 | 0x7fc8d4224a00 | 306664 | 306664 | 24786 | 2453320 | 65536 | 225485821 | 2347896 | 0 | 903674356 | 17834281432619 | 17834281384345 | 17834281788666 | 17834281790470 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7fc8d71bf480 | 0x7fc8d4224a40 | 304669 | 304669 | 22899 | 2437360 | 65536 | 214318449 | 2330625 | 0 | 859002420 | 17834281832979 | 17834281788666 | 17834282182906 | 17834282184770 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7fc8d71bf300 | 0x7fc8d4224a80 | 164032 | 164032 | 14631 | 1312264 | 65536 | 88858198 | 1205412 | 0 | 357162416 | 17834282227459 | 17834282182906 | 17834282489146 | 17834282490792 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7fc8d71bf180 | 0x7fc8d4224ac0 | 163201 | 163201 | 15807 | 1305616 | 65536 | 96721866 | 1200217 | 0 | 388622312 | 17834282533281 | 17834282489146 | 17834282793627 | 17834282795345 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7fc8d71bf000 | 0x7fc8d4224b00 | 161463 | 161463 | 14952 | 1291712 | 65536 | 88740842 | 1187214 | 0 | 356698560 | 17834282844754 | 17834282793627 | 17834283100827 | 17834283102377 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7fc8d4b91e80 | 0x7fc8d4224b40 | 303745 | 303745 | 22710 | 2429968 | 65536 | 201836625 | 2316360 | 0 | 809078756 | 17834283144876 | 17834283100827 | 17834283496508 | 17834283498217 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7fc8d4b91d00 | 0x7fc8d4224b80 | 301047 | 301047 | 21601 | 2408384 | 65536 | 210437020 | 2303682 | 0 | 843478572 | 17834283539956 | 17834283496508 | 17834283892508 | 17834283894117 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7fc8d4b91b80 | 0x7fc8d4224bc0 | 162428 | 162428 | 14903 | 1299432 | 65536 | 88474318 | 1194758 | 0 | 355627208 | 17834283936316 | 17834283892508 | 17834284193629 | 17834284195250 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7fc8d4b91a00 | 0x7fc8d4224c00 | 163629 | 163629 | 16950 | 1309040 | 65536 | 101217691 | 1198725 | 0 | 406601800 | 17834284237269 | 17834284193629 | 17834284495869 | 17834284497512 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7fc8d4b91880 | 0x7fc8d4224c40 | 163391 | 163391 | 14597 | 1307136 | 65536 | 91714320 | 1200360 | 0 | 368585112 | 17834284546191 | 17834284495869 | 17834284805790 | 17834284807455 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7fc8d4b91700 | 0x7fc8d4224c80 | 300221 | 300221 | 21845 | 2401776 | 65536 | 212739892 | 2297136 | 0 | 852693288 | 17834284848824 | 17834284805790 | 17834285192510 | 17834285194135 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7fc8d71bf580 | 0x7fc8d4224cc0 | 301545 | 301545 | 20283 | 2412368 | 65536 | 205629479 | 2301410 | 0 | 824246612 | 17834285238724 | 17834285192510 | 17834285579871 | 17834285581566 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7fc8d71bf400 | 0x7fc8d4224d00 | 163132 | 163132 | 15667 | 1305064 | 65536 | 95210655 | 1200481 | 0 | 382572852 | 17834285623274 | 17834285579871 | 17834285881151 | 17834285882808 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7fc8d71bf280 | 0x7fc8d4224d40 | 169065 | 169065 | 16375 | 1352528 | 65536 | 97879669 | 1245323 | 0 | 393262852 | 17834285924347 | 17834285881151 | 17834286199391 | 17834286201270 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7fc8d71bf100 | 0x7fc8d4224d80 | 162702 | 162702 | 15058 | 1301624 | 65536 | 92605328 | 1194089 | 0 | 372151888 | 17834286252129 | 17834286199391 | 17834286509952 | 17834286511732 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7fc8d4b91f80 | 0x7fc8d4224dc0 | 302903 | 302903 | 22609 | 2423232 | 65536 | 215042701 | 2319421 | 0 | 861904624 | 17834286559221 | 17834286509952 | 17834286905152 | 17834286906793 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7fc8d4b91e00 | 0x7fc8d4224e00 | 299934 | 299934 | 20991 | 2399480 | 65536 | 211568934 | 2288440 | 0 | 848010412 | 17834286949312 | 17834286905152 | 17834287299553 | 17834287301333 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7fc8d4b91c80 | 0x7fc8d4224e40 | 164917 | 164917 | 15176 | 1319344 | 65536 | 92895653 | 1215543 | 0 | 373328368 | 17834287342372 | 17834287299553 | 17834287601473 | 17834287603155 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7fc8d4b91b00 | 0x7fc8d4224e80 | 177796 | 177796 | 16578 | 1422376 | 65536 | 104994509 | 1313234 | 0 | 421714412 | 17834287645334 | 17834287601473 | 17834287915234 | 17834287916868 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7fc8d4b91980 | 0x7fc8d4224ec0 | 160811 | 160811 | 14705 | 1286496 | 65536 | 89629786 | 1181277 | 0 | 360258064 | 17834287965816 | 17834287915234 | 17834288223074 | 17834288224820 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7fc8d4b91800 | 0x7fc8d4224f00 | 302087 | 302087 | 23294 | 2416704 | 65536 | 219851616 | 2309099 | 0 | 881138856 | 17834288266549 | 17834288223074 | 17834288616835 | 17834288618460 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7fc8d4b91680 | 0x7fc8d4224f40 | 303611 | 303611 | 23005 | 2428896 | 65536 | 222137973 | 2319977 | 0 | 890282592 | 17834288661129 | 17834288616835 | 17834289007715 | 17834289009390 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7fc8d71bf500 | 0x7fc8d4224f80 | 163161 | 163161 | 15630 | 1305296 | 65536 | 91235959 | 1194973 | 0 | 366677940 | 17834289050369 | 17834289007715 | 17834289310436 | 17834289312333 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7fc8d71bf380 | 0x7fc8d4224fc0 | 183219 | 183219 | 17101 | 1465760 | 65536 | 109826885 | 1356619 | 0 | 441057852 | 17834289355122 | 17834289310436 | 17834289625796 | 17834289627395 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7fc8d71bf200 | 0x7fc8d4225000 | 162997 | 162997 | 15184 | 1303984 | 65536 | 88666144 | 1192526 | 0 | 356405896 | 17834289690813 | 17834289625796 | 17834289938917 | 17834289940647 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7fc8d71bf080 | 0x7fc8d4225040 | 301969 | 301969 | 22124 | 2415760 | 65536 | 214738349 | 2310781 | 0 | 860686468 | 17834289987216 | 17834289938917 | 17834290365157 | 17834290367057 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7fc8d4b91f00 | 0x7fc8d4225080 | 302753 | 302753 | 23164 | 2422032 | 65536 | 210241017 | 2311664 | 0 | 842698468 | 17834290408876 | 17834290365157 | 17834290767398 | 17834290769027 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7fc8d4b91d80 | 0x7fc8d42250c0 | 162581 | 162581 | 15730 | 1300656 | 65536 | 93338046 | 1195432 | 0 | 375088052 | 17834290811296 | 17834290767398 | 17834291075238 | 17834291077019 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7fc8d4b91c00 | 0x7fc8d4225100 | 192516 | 192516 | 18259 | 1540136 | 65536 | 115988784 | 1429576 | 0 | 465701400 | 17834291118798 | 17834291075238 | 17834291400198 | 17834291402111 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7fc8d4b91a80 | 0x7fc8d4225140 | 162889 | 162889 | 15404 | 1303120 | 65536 | 96009514 | 1198118 | 0 | 385765176 | 17834291450040 | 17834291400198 | 17834291712679 | 17834291714363 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7fc8d4b91900 | 0x7fc8d4225180 | 303894 | 303894 | 22975 | 2431160 | 65536 | 220298015 | 2321393 | 0 | 882931436 | 17834291756322 | 17834291712679 | 17834292106279 | 17834292108014 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7fc8d4b91780 | 0x7fc8d42251c0 | 299823 | 299823 | 22016 | 2398592 | 65536 | 213726362 | 2293812 | 0 | 856641476 | 17834292152253 | 17834292106279 | 17834292497480 | 17834292499214 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7fc8d4b91600 | 0x7fc8d4225200 | 162456 | 162456 | 15936 | 1299656 | 65536 | 96275564 | 1197182 | 0 | 386834488 | 17834292541063 | 17834292497480 | 17834292804840 | 17834292806386 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7fc8d71bf480 | 0x7fc8d4225240 | 203471 | 203471 | 18200 | 1627776 | 65536 | 117796929 | 1513037 | 0 | 472938496 | 17834292847715 | 17834292804840 | 17834293142121 | 17834293143698 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7fc8d71bf300 | 0x7fc8d4225280 | 162292 | 162292 | 15476 | 1298344 | 65536 | 93981779 | 1192840 | 0 | 377663004 | 17834293192997 | 17834293142121 | 17834293452041 | 17834293453861 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7fc8d71bf180 | 0x7fc8d42252c0 | 301740 | 301740 | 23035 | 2413928 | 65536 | 223216311 | 2308970 | 0 | 894601568 | 17834293501559 | 17834293452041 | 17834293849802 | 17834293851431 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7fc8d71bf000 | 0x7fc8d4225300 | 299586 | 299586 | 21971 | 2396696 | 65536 | 212866702 | 2295181 | 0 | 853196760 | 17834293895900 | 17834293849802 | 17834294243242 | 17834294245081 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7fc8d4b91e80 | 0x7fc8d4225340 | 162618 | 162618 | 15249 | 1300952 | 65536 | 98466108 | 1197652 | 0 | 395598028 | 17834294286870 | 17834294243242 | 17834294553963 | 17834294555623 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7fc8d4b91d00 | 0x7fc8d4225380 | 211130 | 211130 | 19059 | 1689048 | 65536 | 139997082 | 1578277 | 0 | 561732788 | 17834294597952 | 17834294553963 | 17834294888843 | 17834294890575 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7fc8d4b91b80 | 0x7fc8d42253c0 | 162454 | 162454 | 15664 | 1299640 | 65536 | 95675469 | 1195184 | 0 | 384430776 | 17834294938784 | 17834294888843 | 17834295197484 | 17834295199077 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7fc8d4b91a00 | 0x7fc8d4225400 | 298352 | 298352 | 22850 | 2386824 | 65536 | 218183439 | 2281773 | 0 | 874465752 | 17834295239986 | 17834295197484 | 17834295591724 | 17834295593397 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7fc8d4b91880 | 0x7fc8d4225440 | 299448 | 299448 | 22428 | 2395592 | 65536 | 208003050 | 2290833 | 0 | 833743560 | 17834295635696 | 17834295591724 | 17834295985005 | 17834295986638 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7fc8d4b91700 | 0x7fc8d4225480 | 161836 | 161836 | 15933 | 1294696 | 65536 | 98449694 | 1189411 | 0 | 395538516 | 17834296029047 | 17834295985005 | 17834296289485 | 17834296291350 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7fc8d71bf580 | 0x7fc8d42254c0 | 220777 | 220777 | 19935 | 1766224 | 65536 | 126795673 | 1647432 | 0 | 508938936 | 17834296332469 | 17834296289485 | 17834296633806 | 17834296635512 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7fc8d71bf400 | 0x7fc8d4225500 | 161888 | 161888 | 15580 | 1295112 | 65536 | 89962750 | 1188814 | 0 | 361583932 | 17834296685250 | 17834296633806 | 17834296943246 | 17834296945044 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7fc8d71bf280 | 0x7fc8d4225540 | 297291 | 297291 | 21409 | 2378336 | 65536 | 206695233 | 2272110 | 0 | 828513140 | 17834296991243 | 17834296943246 | 17834297338286 | 17834297340024 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7fc8d71bf100 | 0x7fc8d4225580 | 301879 | 301879 | 23718 | 2415040 | 65536 | 215905745 | 2301239 | 0 | 865353032 | 17834297383633 | 17834297338286 | 17834297732367 | 17834297734054 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7fc8d4b91f80 | 0x7fc8d42255c0 | 164601 | 164601 | 16231 | 1316816 | 65536 | 99833361 | 1209593 | 0 | 401091668 | 17834297775473 | 17834297732367 | 17834298041807 | 17834298043577 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7fc8d4b91e00 | 0x7fc8d4225600 | 229723 | 229723 | 19773 | 1837792 | 65536 | 149136492 | 1730381 | 0 | 598297608 | 17834298092205 | 17834298041807 | 17834298404048 | 17834298405698 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7fc8d4b91c80 | 0x7fc8d4225640 | 161402 | 161402 | 15123 | 1291224 | 65536 | 90921050 | 1187708 | 0 | 365422976 | 17834298454706 | 17834298404048 | 17834298712048 | 17834298713750 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7fc8d4b91b00 | 0x7fc8d4225680 | 298204 | 298204 | 20792 | 2385640 | 65536 | 197986138 | 2276652 | 0 | 793685384 | 17834298760439 | 17834298712048 | 17834299105809 | 17834299107450 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7fc8d4b91980 | 0x7fc8d42256c0 | 300595 | 300595 | 22494 | 2404768 | 65536 | 215379737 | 2301175 | 0 | 863254268 | 17834299150079 | 17834299105809 | 17834299496689 | 17834299498340 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7fc8d4b91800 | 0x7fc8d4225700 | 164958 | 164958 | 16370 | 1319672 | 65536 | 101616331 | 1214016 | 0 | 408212144 | 17834299539319 | 17834299496689 | 17834299801810 | 17834299803813 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7fc8d4b91680 | 0x7fc8d4225740 | 240645 | 240645 | 20516 | 1925168 | 65536 | 157732556 | 1813466 | 0 | 632674640 | 17834299844102 | 17834299801810 | 17834300163570 | 17834300165174 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7fc8d71bf500 | 0x7fc8d4225780 | 162126 | 162126 | 15768 | 1297016 | 65536 | 98187098 | 1194453 | 0 | 394504012 | 17834300214413 | 17834300163570 | 17834300475571 | 17834300477146 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7fc8d71bf380 | 0x7fc8d42257c0 | 302955 | 302955 | 20938 | 2423648 | 65536 | 205734897 | 2308541 | 0 | 824672836 | 17834300523855 | 17834300475571 | 17834300872531 | 17834300874236 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7fc8d71bf200 | 0x7fc8d4225800 | 298432 | 298432 | 20729 | 2387464 | 65536 | 202637622 | 2282225 | 0 | 812285600 | 17834300916045 | 17834300872531 | 17834301262772 | 17834301264587 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7fc8d71bf080 | 0x7fc8d4225840 | 171091 | 171091 | 16030 | 1368736 | 65536 | 100852134 | 1263541 | 0 | 405154688 | 17834301305746 | 17834301262772 | 17834301573972 | 17834301575609 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7fc8d4b91f00 | 0x7fc8d4225880 | 259655 | 259655 | 21249 | 2077248 | 65536 | 166745550 | 1964412 | 0 | 668732852 | 17834301617628 | 17834301573972 | 17834301938933 | 17834301940650 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7fc8d4b91d80 | 0x7fc8d42258c0 | 161815 | 161815 | 15866 | 1294528 | 65536 | 95893855 | 1188755 | 0 | 385320516 | 17834301990029 | 17834301938933 | 17834302259413 | 17834302260992 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7fc8d4b91c00 | 0x7fc8d4225900 | 296539 | 296539 | 20914 | 2372320 | 65536 | 202649671 | 2263614 | 0 | 812338056 | 17834302302771 | 17834302259413 | 17834302655254 | 17834302657002 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7fc8d4b91a80 | 0x7fc8d4225940 | 297031 | 297031 | 21172 | 2376256 | 65536 | 205901482 | 2265136 | 0 | 825344388 | 17834302698781 | 17834302655254 | 17834303044374 | 17834303046012 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7fc8d4b91900 | 0x7fc8d4225980 | 178771 | 178771 | 16738 | 1430176 | 65536 | 106947525 | 1324370 | 0 | 429537856 | 17834303087531 | 17834303044374 | 17834303357495 | 17834303359055 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7fc8d4b91780 | 0x7fc8d42259c0 | 280909 | 280909 | 23093 | 2247280 | 65536 | 190802329 | 2129530 | 0 | 764957064 | 17834303400584 | 17834303357495 | 17834303734775 | 17834303736465 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7fc8d4b91600 | 0x7fc8d4225a00 | 163019 | 163019 | 16590 | 1304160 | 65536 | 102331826 | 1195152 | 0 | 411073356 | 17834303785814 | 17834303734775 | 17834304045176 | 17834304046747 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7fc8d71bf480 | 0x7fc8d4225a40 | 296769 | 296769 | 21322 | 2374160 | 65536 | 203778534 | 2261266 | 0 | 816877520 | 17834304088806 | 17834304045176 | 17834304437496 | 17834304439028 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7fc8d71bf300 | 0x7fc8d4225a80 | 296072 | 296072 | 20953 | 2368584 | 65536 | 206833922 | 2259877 | 0 | 829074876 | 17834304479807 | 17834304437496 | 17834304828857 | 17834304830788 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7fc8d71bf180 | 0x7fc8d4225ac0 | 186912 | 186912 | 17450 | 1495304 | 65536 | 103138691 | 1380354 | 0 | 414306260 | 17834304870297 | 17834304828857 | 17834305160377 | 17834305162140 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7fc8d71bf000 | 0x7fc8d4225b00 | 300476 | 300476 | 23558 | 2403816 | 65536 | 195767935 | 2289652 | 0 | 784828060 | 17834305202979 | 17834305160377 | 17834305553338 | 17834305555040 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7fc8d4b91e80 | 0x7fc8d4225b40 | 171069 | 171069 | 16766 | 1368560 | 65536 | 101300694 | 1266522 | 0 | 406947060 | 17834305604099 | 17834305553338 | 17834305872538 | 17834305874242 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7fc8d4b91d00 | 0x7fc8d4225b80 | 299366 | 299366 | 19246 | 2394936 | 65536 | 164222368 | 2269854 | 0 | 658639616 | 17834305915891 | 17834305872538 | 17834306266619 | 17834306268682 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7fc8d4b91b80 | 0x7fc8d4225bc0 | 297382 | 297382 | 20708 | 2379064 | 65536 | 191601847 | 2264334 | 0 | 768152064 | 17834306309591 | 17834306266619 | 17834306661499 | 17834306663382 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7fc8d4b91a00 | 0x7fc8d4225c00 | 207412 | 207412 | 19074 | 1659304 | 65536 | 123377617 | 1541710 | 0 | 495275328 | 17834306703341 | 17834306661499 | 17834306993019 | 17834306994584 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7fc8d4b91880 | 0x7fc8d4225c40 | 341044 | 341044 | 25539 | 2728360 | 65536 | 230738852 | 2613176 | 0 | 924716048 | 17834307035523 | 17834306993019 | 17834307411260 | 17834307459113 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7fc8d4b91700 | 0x7fc8d4225c80 | 184919 | 184919 | 18033 | 1479360 | 65536 | 115675289 | 1368223 | 0 | 464448212 | 17834307478252 | 17834307411260 | 17834307767581 | 17834307769255 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7fc8d71bf580 | 0x7fc8d4225cc0 | 298024 | 298024 | 21863 | 2384200 | 65536 | 158606979 | 2238111 | 0 | 636177212 | 17834307811134 | 17834307767581 | 17834308161181 | 17834308162815 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7fc8d71bf400 | 0x7fc8d4225d00 | 297180 | 297180 | 20530 | 2377448 | 65536 | 184505727 | 2259504 | 0 | 739772484 | 17834308205604 | 17834308161181 | 17834308556062 | 17834308557885 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7fc8d71bf280 | 0x7fc8d4225d40 | 224815 | 224815 | 19630 | 1798528 | 65536 | 145776401 | 1689205 | 0 | 584851028 | 17834308598954 | 17834308556062 | 17834308900702 | 17834308902377 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7fc8d71bf100 | 0x7fc8d4225d80 | 381869 | 381869 | 27926 | 3054960 | 65536 | 257070858 | 2936653 | 0 | 1030042636 | 17834308943066 | 17834308900702 | 17834309347263 | 17834309366235 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7fc8d4b91f80 | 0x7fc8d4225dc0 | 212815 | 212815 | 19513 | 1702528 | 65536 | 122464861 | 1583033 | 0 | 491617708 | 17834309397585 | 17834309347263 | 17834309686303 | 17834309687957 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7fc8d4b91e00 | 0x7fc8d4225e00 | 310102 | 310102 | 24097 | 2480824 | 65536 | 185464783 | 2345934 | 0 | 743628116 | 17834309728316 | 17834309686303 | 17834310090304 | 17834310096947 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7fc8d4b91c80 | 0x7fc8d4225e40 | 311821 | 311821 | 20978 | 2494576 | 65536 | 179673646 | 2366407 | 0 | 720457404 | 17834310132456 | 17834310090304 | 17834310509824 | 17834310531006 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7fc8d4b91b00 | 0x7fc8d4225e80 | 266016 | 266016 | 21765 | 2128136 | 65536 | 177645979 | 2018546 | 0 | 712343952 | 17834310551946 | 17834310509824 | 17834310879745 | 17834310881678 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7fc8d4b91980 | 0x7fc8d4225ec0 | 462230 | 462230 | 31445 | 3697848 | 65536 | 327814997 | 3582185 | 0 | 1313021200 | 17834310921557 | 17834310879745 | 17834311373345 | 17834311392615 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7fc8d4b91800 | 0x7fc8d4225f00 | 243299 | 243299 | 20537 | 1946400 | 65536 | 168632596 | 1836482 | 0 | 676289424 | 17834311423864 | 17834311373345 | 17834311732706 | 17834311734556 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7fc8d4b91680 | 0x7fc8d4225f40 | 334675 | 334675 | 23818 | 2677408 | 65536 | 199877609 | 2554723 | 0 | 801277260 | 17834311774095 | 17834311732706 | 17834312160866 | 17834312179645 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7fc8d71bf500 | 0x7fc8d4225f80 | 333944 | 333944 | 23247 | 2671560 | 65536 | 207389401 | 2543268 | 0 | 831339332 | 17834312203145 | 17834312160866 | 17834312584067 | 17834312601845 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7fc8d71bf380 | 0x7fc8d4225fc0 | 307785 | 307785 | 23645 | 2462288 | 65536 | 204659723 | 2351204 | 0 | 820405932 | 17834312625324 | 17834312584067 | 17834312985508 | 17834312987395 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7fc8d71bf200 | 0x7fc8d4226000 | 543831 | 543831 | 36446 | 4350656 | 65536 | 400108703 | 4228041 | 0 | 1602203616 | 17834313028704 | 17834312985508 | 17834313528868 | 17834313545371 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7fc8d71bf080 | 0x7fc8d4226040 | 272076 | 272076 | 22079 | 2176616 | 65536 | 195969289 | 2069235 | 0 | 785630088 | 17834313580611 | 17834313528868 | 17834313907589 | 17834313909332 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7fc8d4b91f00 | 0x7fc8d4226080 | 366676 | 366676 | 27448 | 2933416 | 65536 | 245183051 | 2817157 | 0 | 982512760 | 17834313950611 | 17834313907589 | 17834314357029 | 17834314375181 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7fc8d4b91d80 | 0x7fc8d42260c0 | 364698 | 364698 | 28121 | 2917592 | 65536 | 255642502 | 2806900 | 0 | 1024333444 | 17834314399810 | 17834314357029 | 17834314802630 | 17834314845409 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7fc8d4b91c00 | 0x7fc8d4226100 | 347899 | 347899 | 25794 | 2783200 | 65536 | 242487603 | 2672104 | 0 | 971720320 | 17834314855839 | 17834314802630 | 17834315245191 | 17834315287608 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7fc8d4b91a80 | 0x7fc8d4226140 | 625481 | 625481 | 40686 | 5003856 | 65536 | 460031137 | 4879068 | 0 | 1841894612 | 17834315298628 | 17834315245191 | 17834315876071 | 17834315918383 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7fc8d4b91900 | 0x7fc8d4226180 | 302927 | 302927 | 23596 | 2423424 | 65536 | 213261601 | 2312174 | 0 | 854813768 | 17834315937612 | 17834315876071 | 17834316297832 | 17834316299403 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7fc8d4b91780 | 0x7fc8d42261c0 | 399075 | 399075 | 27608 | 3192608 | 65536 | 264195773 | 3080075 | 0 | 1058569392 | 17834316340782 | 17834316297832 | 17834316759753 | 17834316801851 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7fc8d4b91600 | 0x7fc8d4226200 | 392130 | 392130 | 27681 | 3137048 | 65536 | 289347031 | 3022706 | 0 | 1159165792 | 17834316812020 | 17834316759753 | 17834317239753 | 17834317281259 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7fc8d71bf480 | 0x7fc8d4226240 | 387952 | 387952 | 27807 | 3103624 | 65536 | 280753329 | 2989110 | 0 | 1124778064 | 17834317291418 | 17834317239753 | 17834317709354 | 17834317727518 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7fc8d71bf300 | 0x7fc8d4226280 | 719930 | 719930 | 44876 | 5759448 | 65536 | 543357386 | 5636111 | 0 | 2175169880 | 17834317752167 | 17834317709354 | 17834318374795 | 17834318418700 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7fc8d71bf180 | 0x7fc8d42262c0 | 364824 | 364824 | 27411 | 2918600 | 65536 | 263017562 | 2801039 | 0 | 1053835448 | 17834318438150 | 17834318374795 | 17834318836235 | 17834318879929 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7fc8d71bf000 | 0x7fc8d4226300 | 471292 | 471292 | 32403 | 3770344 | 65536 | 351197243 | 3653322 | 0 | 1406578836 | 17834318891029 | 17834318836235 | 17834319369036 | 17834319411026 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7fc8d4b91e80 | 0x7fc8d4226340 | 474138 | 474138 | 32968 | 3793112 | 65536 | 349572599 | 3680200 | 0 | 1400078536 | 17834319421405 | 17834319369036 | 17834319910157 | 17834319951892 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7fc8d4b91d00 | 0x7fc8d4226380 | 483314 | 483314 | 33001 | 3866520 | 65536 | 352783080 | 3753336 | 0 | 1412873680 | 17834319962552 | 17834319910157 | 17834320437198 | 17834320479809 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7fc8d4b91b80 | 0x7fc8d42263c0 | 880138 | 880138 | 52986 | 7041112 | 65536 | 675410808 | 6929733 | 0 | 2703384488 | 17834320490389 | 17834320437198 | 17834321229839 | 17834321272819 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7fc8d4b91a00 | 0x7fc8d4226400 | 425881 | 425881 | 29669 | 3407056 | 65536 | 318126163 | 3299396 | 0 | 1274275000 | 17834321292269 | 17834321229839 | 17834321724559 | 17834321742908 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7fc8d4b91880 | 0x7fc8d4226440 | 552000 | 552000 | 35408 | 4416008 | 65536 | 405168085 | 4305890 | 0 | 1622465864 | 17834321767237 | 17834321724559 | 17834322289360 | 17834322335643 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7fc8d4b91700 | 0x7fc8d4226480 | 551581 | 551581 | 36057 | 4412656 | 65536 | 409721582 | 4298465 | 0 | 1640670012 | 17834322347203 | 17834322289360 | 17834322879601 | 17834322924048 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7fc8d71bf580 | 0x7fc8d42264c0 | 563270 | 563270 | 36733 | 4506168 | 65536 | 422198219 | 4392694 | 0 | 1690538260 | 17834322935358 | 17834322879601 | 17834323460242 | 17834323501854 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7fc8d71bf400 | 0x7fc8d4226500 | 1041630 | 1041630 | 61508 | 8333048 | 65536 | 797586758 | 8218915 | 0 | 3192089132 | 17834323512054 | 17834323460072 | 17834324354792 | 17834324401882 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7fc8d71bf280 | 0x7fc8d4226540 | 721638 | 721638 | 44565 | 5773112 | 65536 | 538243078 | 5659185 | 0 | 2154714336 | 17834324420811 | 17834324354792 | 17834325038312 | 17834325080545 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7fc8d71bf100 | 0x7fc8d4226580 | 723659 | 723659 | 45227 | 5789280 | 65536 | 541683722 | 5671557 | 0 | 2168477180 | 17834325091305 | 17834325038312 | 17834325732233 | 17834325775538 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7fc8d4b91f80 | 0x7fc8d42265c0 | 724066 | 724066 | 45236 | 5792536 | 65536 | 554432325 | 5665808 | 0 | 2219470204 | 17834325786137 | 17834325732233 | 17834326425354 | 17834326470040 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7fc8d4b91e00 | 0x7fc8d4226600 | 727528 | 727528 | 45271 | 5820232 | 65536 | 542132432 | 5700957 | 0 | 2170273016 | 17834326481840 | 17834326425354 | 17834327121354 | 17834327165433 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7fc8d4b91c80 | 0x7fc8d4226640 | 1368716 | 1368716 | 77974 | 10949736 | 65536 | 1066748922 | 10813154 | 0 | 4268737600 | 17834327175473 | 17834327121354 | 17834328226315 | 17834328269906 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7fc8d4b91b00 | 0x7fc8d4226680 | 1369824 | 1369824 | 77831 | 10958600 | 65536 | 1076782474 | 10843115 | 0 | 4308871668 | 17834328288855 | 17834328226315 | 17834329311116 | 17834329374338 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7fc8d4b91980 | 0x7fc8d42266c0 | 1375124 | 1375124 | 78065 | 11001000 | 65536 | 1071881202 | 10865494 | 0 | 4289266868 | 17834329385588 | 17834329311116 | 17834330454158 | 17834330521830 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7fc8d4b91800 | 0x7fc8d4226700 | 1371238 | 1371238 | 77436 | 10969912 | 65536 | 1077779295 | 10853697 | 0 | 4312857984 | 17834330533269 | 17834330454158 | 17834331595599 | 17834331662981 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7fc8d4b91680 | 0x7fc8d4226740 | 1376130 | 1376130 | 77713 | 11009048 | 65536 | 1084688254 | 10886966 | 0 | 4340495408 | 17834331673821 | 17834331595599 | 17834332731920 | 17834332799413 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7fc8d71bf500 | 0x7fc8d4226780 | 2662336 | 2662336 | 142424 | 21298696 | 65536 | 2131580032 | 21184514 | 0 | 8528061380 | 17834332810773 | 17834332731920 | 17834334704242 | 17834334776354 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7fc8d71bf380 | 0x7fc8d42267c0 | 2670852 | 2670852 | 143342 | 21366824 | 65536 | 2131999864 | 21233521 | 0 | 8529740752 | 17834334795274 | 17834334704242 | 17834336653524 | 17834336720826 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7fc8d71bf200 | 0x7fc8d4226800 | 2670556 | 2670556 | 142721 | 21364456 | 65536 | 2122324716 | 21238623 | 0 | 8491039852 | 17834336731875 | 17834336653524 | 17834338654006 | 17834338725046 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7fc8d71bf080 | 0x7fc8d4226840 | 2669612 | 2669612 | 143666 | 21356904 | 65536 | 2113520736 | 21229473 | 0 | 8455823144 | 17834338736746 | 17834338654006 | 17834340663928 | 17834340732916 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7fc8d4b91f00 | 0x7fc8d4226880 | 2674293 | 2674293 | 143290 | 21394352 | 65536 | 2122181246 | 21263814 | 0 | 8490468052 | 17834340744566 | 17834340663928 | 17834342616730 | 17834342688017 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 236725 | 236725 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7fc8d4b91d80 | 0x7fc8d42268c0 | 5256862 | 5256862 | 273842 | 42054904 | 65536 | 4229210368 | 41928959 | 0 | 16918583340 | 17834342699137 | 17834342616730 | 17834346261054 | 17834346333537 |