41 KiB
41 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | SQ_INSTS_SMEM | SQ_INST_LEVEL_SMEM | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 229165 | 229165 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7fed8e404280 | 3670016 | 3210192 | 359394552 | 17703062218323 | 17697497051832 | 17703209908589 | 17703210020339 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 229165 | 229165 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7fed8e423f80 | 512 | 102828 | 11537184 | 17703215180549 | 17703209908589 | 17703215310683 | 17703215315516 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7fed91369380 | 0x7fed8e423fc0 | 65536 | 615618 | 68994040 | 17703215349825 | 17703215310683 | 17703215686844 | 17703215689607 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7fed91369200 | 0x7fed8e424000 | 65536 | 648906 | 72722096 | 17703215725596 | 17703215686844 | 17703216088126 | 17703216090817 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7fed91369080 | 0x7fed8e424040 | 65536 | 644350 | 72223192 | 17703216122186 | 17703216088126 | 17703216480927 | 17703216483097 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7fed8ed09f00 | 0x7fed8e424080 | 65536 | 684224 | 76626936 | 17703216515176 | 17703216480927 | 17703216784128 | 17703216786459 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7fed8ed09d80 | 0x7fed8e4240c0 | 65536 | 608090 | 68097952 | 17703216817389 | 17703216784128 | 17703217086528 | 17703217088672 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7fed8ed09c00 | 0x7fed8e424100 | 131072 | 640238 | 71627944 | 17703217131511 | 17703217086528 | 17703217385569 | 17703217387694 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7fed8ed09a80 | 0x7fed8e424140 | 131072 | 681956 | 76343048 | 17703217418683 | 17703217385569 | 17703217776610 | 17703217778944 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7fed8ed09900 | 0x7fed8e424180 | 65536 | 644478 | 72231080 | 17703217809274 | 17703217776610 | 17703218164451 | 17703218167365 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7fed8ed09780 | 0x7fed8e4241c0 | 131072 | 682384 | 76442072 | 17703218199494 | 17703218164451 | 17703218495652 | 17703218497996 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7fed8ed09600 | 0x7fed8e424200 | 131072 | 684462 | 76591912 | 17703218530046 | 17703218495652 | 17703218802053 | 17703218804309 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7fed91369480 | 0x7fed8e424240 | 131072 | 686448 | 76781752 | 17703218843698 | 17703218802053 | 17703219104614 | 17703219106861 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7fed91369300 | 0x7fed8e424280 | 131072 | 682246 | 76323040 | 17703219138310 | 17703219104614 | 17703219486375 | 17703219488121 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7fed91369180 | 0x7fed8e4242c0 | 65536 | 645194 | 72177304 | 17703219520191 | 17703219486375 | 17703219848136 | 17703219849772 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7fed91369000 | 0x7fed8e424300 | 131072 | 678602 | 75972824 | 17703219881472 | 17703219848136 | 17703220123977 | 17703220125575 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7fed8ed09e80 | 0x7fed8e424340 | 131072 | 692914 | 77536808 | 17703220156675 | 17703220123977 | 17703220403498 | 17703220405178 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7fed8ed09d00 | 0x7fed8e424380 | 131072 | 669116 | 74921848 | 17703220443767 | 17703220403498 | 17703220687659 | 17703220689311 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7fed8ed09b80 | 0x7fed8e4243c0 | 131072 | 680954 | 76335792 | 17703220721710 | 17703220687659 | 17703221052460 | 17703221054112 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7fed8ed09a00 | 0x7fed8e424400 | 65536 | 606372 | 67867592 | 17703221085331 | 17703221052460 | 17703221423661 | 17703221425333 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7fed8ed09880 | 0x7fed8e424440 | 131072 | 683568 | 76397128 | 17703221456152 | 17703221423661 | 17703221700621 | 17703221702196 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7fed8ed09700 | 0x7fed8e424480 | 131072 | 688164 | 77076080 | 17703221732895 | 17703221700621 | 17703221977102 | 17703221978789 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7fed91369580 | 0x7fed8e4244c0 | 131072 | 659726 | 74016992 | 17703222016328 | 17703221977102 | 17703222268303 | 17703222270181 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7fed91369400 | 0x7fed8e424500 | 131072 | 675586 | 75641064 | 17703222303171 | 17703222268303 | 17703222636304 | 17703222637902 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7fed91369280 | 0x7fed8e424540 | 65536 | 649090 | 72766256 | 17703222669141 | 17703222636304 | 17703223000945 | 17703223002693 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7fed91369100 | 0x7fed8e424580 | 131072 | 649394 | 72732128 | 17703223034602 | 17703223000945 | 17703223276466 | 17703223278136 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7fed8ed09f80 | 0x7fed8e4245c0 | 131072 | 642024 | 71812808 | 17703223309655 | 17703223276466 | 17703223550867 | 17703223552529 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7fed8ed09e00 | 0x7fed8e424600 | 131072 | 670666 | 75144160 | 17703223591668 | 17703223550867 | 17703223826707 | 17703223828262 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7fed8ed09c80 | 0x7fed8e424640 | 131072 | 640668 | 71715088 | 17703223859751 | 17703223826707 | 17703224191348 | 17703224193033 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7fed8ed09b00 | 0x7fed8e424680 | 65536 | 634210 | 71028128 | 17703224223532 | 17703224191348 | 17703224559510 | 17703224561194 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7fed8ed09980 | 0x7fed8e4246c0 | 131072 | 680932 | 76428432 | 17703224591873 | 17703224559510 | 17703224838070 | 17703224839657 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7fed8ed09800 | 0x7fed8e424700 | 131072 | 687064 | 76958048 | 17703224870636 | 17703224838070 | 17703225116631 | 17703225118480 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7fed8ed09680 | 0x7fed8e424740 | 131072 | 682132 | 76370640 | 17703225156079 | 17703225116631 | 17703225395352 | 17703225397093 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7fed91369500 | 0x7fed8e424780 | 131072 | 673762 | 75525592 | 17703225427772 | 17703225395352 | 17703225768473 | 17703225770083 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7fed91369380 | 0x7fed8e4247c0 | 65536 | 650886 | 72829080 | 17703225801963 | 17703225768473 | 17703226130554 | 17703226132394 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7fed91369200 | 0x7fed8e424800 | 131072 | 675970 | 75676024 | 17703226165033 | 17703226130554 | 17703226412315 | 17703226414037 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7fed91369080 | 0x7fed8e424840 | 131072 | 668162 | 74784432 | 17703226445826 | 17703226412315 | 17703226698556 | 17703226700250 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7fed8ed09f00 | 0x7fed8e424880 | 131072 | 684166 | 76622864 | 17703226738989 | 17703226698556 | 17703226982076 | 17703226983803 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7fed8ed09d80 | 0x7fed8e4248c0 | 131072 | 675928 | 75752200 | 17703227014182 | 17703226982076 | 17703227351997 | 17703227353624 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7fed8ed09c00 | 0x7fed8e424900 | 65536 | 600026 | 67223968 | 17703227385293 | 17703227351997 | 17703227717918 | 17703227719505 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7fed8ed09a80 | 0x7fed8e424940 | 131072 | 687060 | 76971112 | 17703227750234 | 17703227717918 | 17703227994399 | 17703227996108 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7fed8ed09900 | 0x7fed8e424980 | 131072 | 668826 | 74864128 | 17703228026747 | 17703227994399 | 17703228272320 | 17703228274091 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7fed8ed09780 | 0x7fed8e4249c0 | 131072 | 679994 | 76310464 | 17703228312040 | 17703228272320 | 17703228558081 | 17703228559783 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7fed8ed09600 | 0x7fed8e424a00 | 131072 | 680318 | 76111008 | 17703228590533 | 17703228558081 | 17703228923522 | 17703228925164 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7fed91369480 | 0x7fed8e424a40 | 65536 | 642558 | 71858392 | 17703228957464 | 17703228923522 | 17703229287843 | 17703229289535 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7fed91369300 | 0x7fed8e424a80 | 131072 | 642488 | 71862760 | 17703229320144 | 17703229287843 | 17703229572964 | 17703229574658 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7fed91369180 | 0x7fed8e424ac0 | 131072 | 650690 | 72790248 | 17703229606257 | 17703229572964 | 17703229853284 | 17703229855011 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7fed91369000 | 0x7fed8e424b00 | 131072 | 641228 | 71834688 | 17703229893120 | 17703229853284 | 17703230137765 | 17703230139714 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7fed8ed09e80 | 0x7fed8e424b40 | 131072 | 690034 | 77205296 | 17703230170893 | 17703230137765 | 17703230506566 | 17703230508265 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7fed8ed09d00 | 0x7fed8e424b80 | 65536 | 646340 | 72542032 | 17703230539544 | 17703230506566 | 17703230872647 | 17703230874405 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7fed8ed09b80 | 0x7fed8e424bc0 | 131072 | 685162 | 76747592 | 17703230904755 | 17703230872647 | 17703231152968 | 17703231154608 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7fed8ed09a00 | 0x7fed8e424c00 | 131072 | 668458 | 74782264 | 17703231186108 | 17703231152968 | 17703231432969 | 17703231434691 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7fed8ed09880 | 0x7fed8e424c40 | 131072 | 682918 | 76432920 | 17703231472710 | 17703231432969 | 17703231717130 | 17703231718874 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7fed8ed09700 | 0x7fed8e424c80 | 131072 | 670380 | 75045944 | 17703231749433 | 17703231717130 | 17703232082091 | 17703232083805 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7fed91369580 | 0x7fed8e424cc0 | 65536 | 647386 | 72487592 | 17703232114784 | 17703232082091 | 17703232448012 | 17703232449616 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7fed91369400 | 0x7fed8e424d00 | 131072 | 682806 | 76492608 | 17703232480835 | 17703232448012 | 17703232723533 | 17703232725249 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7fed91369280 | 0x7fed8e424d40 | 131072 | 679598 | 76065704 | 17703232758308 | 17703232723533 | 17703233008813 | 17703233010462 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7fed91369100 | 0x7fed8e424d80 | 131072 | 681286 | 76352600 | 17703233049831 | 17703233008813 | 17703233285134 | 17703233286875 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7fed8ed09f80 | 0x7fed8e424dc0 | 131072 | 657086 | 73629160 | 17703233318494 | 17703233285134 | 17703233646735 | 17703233648466 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7fed8ed09e00 | 0x7fed8e424e00 | 65536 | 610560 | 68362896 | 17703233680635 | 17703233646735 | 17703234014096 | 17703234015846 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7fed8ed09c80 | 0x7fed8e424e40 | 131072 | 678086 | 75968608 | 17703234046756 | 17703234014096 | 17703234302097 | 17703234303729 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7fed8ed09b00 | 0x7fed8e424e80 | 131072 | 689532 | 77260584 | 17703234335408 | 17703234302097 | 17703234588498 | 17703234590182 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7fed8ed09980 | 0x7fed8e424ec0 | 131072 | 637780 | 71364560 | 17703234628371 | 17703234588498 | 17703234870579 | 17703234872305 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7fed8ed09800 | 0x7fed8e424f00 | 131072 | 673838 | 75426760 | 17703234903154 | 17703234870579 | 17703235235380 | 17703235237076 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7fed8ed09680 | 0x7fed8e424f40 | 65536 | 642276 | 71988744 | 17703235268125 | 17703235235380 | 17703235599381 | 17703235600996 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7fed91369500 | 0x7fed8e424f80 | 131072 | 651186 | 72884896 | 17703235631976 | 17703235599381 | 17703235885301 | 17703235886939 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7fed91369380 | 0x7fed8e424fc0 | 131072 | 645134 | 72263696 | 17703235917618 | 17703235885301 | 17703236179542 | 17703236181202 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7fed91369200 | 0x7fed8e425000 | 131072 | 681540 | 76267672 | 17703236219431 | 17703236179542 | 17703236460343 | 17703236462105 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7fed91369080 | 0x7fed8e425040 | 131072 | 704122 | 78991592 | 17703236492974 | 17703236460343 | 17703236822424 | 17703236824066 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7fed8ed09f00 | 0x7fed8e425080 | 65536 | 645734 | 72350248 | 17703236855405 | 17703236822424 | 17703237186585 | 17703237188366 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7fed8ed09d80 | 0x7fed8e4250c0 | 131072 | 674888 | 75555096 | 17703237219826 | 17703237186585 | 17703237468666 | 17703237470289 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7fed8ed09c00 | 0x7fed8e425100 | 131072 | 681264 | 76291120 | 17703237500969 | 17703237468666 | 17703237766747 | 17703237768382 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7fed8ed09a80 | 0x7fed8e425140 | 131072 | 668322 | 74820320 | 17703237818421 | 17703237766747 | 17703238046588 | 17703238048215 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7fed8ed09900 | 0x7fed8e425180 | 131072 | 670590 | 75062376 | 17703238087584 | 17703238046588 | 17703238429469 | 17703238431355 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7fed8ed09780 | 0x7fed8e4251c0 | 65536 | 643988 | 72134760 | 17703238462394 | 17703238429469 | 17703238798910 | 17703238800636 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7fed8ed09600 | 0x7fed8e425200 | 131072 | 676308 | 75771056 | 17703238831625 | 17703238798910 | 17703239076030 | 17703239077739 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7fed91369480 | 0x7fed8e425240 | 131072 | 684146 | 76623304 | 17703239108858 | 17703239076030 | 17703239379711 | 17703239381372 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7fed91369300 | 0x7fed8e425280 | 131072 | 680786 | 76197288 | 17703239419931 | 17703239379711 | 17703239663552 | 17703239665244 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7fed91369180 | 0x7fed8e4252c0 | 131072 | 675160 | 75709912 | 17703239696854 | 17703239663552 | 17703240027713 | 17703240029415 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7fed91369000 | 0x7fed8e425300 | 65536 | 652386 | 72934368 | 17703240061055 | 17703240027713 | 17703240389154 | 17703240390856 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7fed8ed09e80 | 0x7fed8e425340 | 131072 | 680210 | 76172984 | 17703240422235 | 17703240389154 | 17703240667715 | 17703240669459 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7fed8ed09d00 | 0x7fed8e425380 | 131072 | 675058 | 75641776 | 17703240700339 | 17703240667715 | 17703240974916 | 17703240976532 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7fed8ed09b80 | 0x7fed8e4253c0 | 131072 | 679408 | 76213976 | 17703241014561 | 17703240974916 | 17703241257957 | 17703241259755 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7fed8ed09a00 | 0x7fed8e425400 | 131072 | 689920 | 77220200 | 17703241292104 | 17703241257957 | 17703241624038 | 17703241625795 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7fed8ed09880 | 0x7fed8e425440 | 65536 | 633302 | 70994016 | 17703241656585 | 17703241624038 | 17703241986119 | 17703241987756 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7fed8ed09700 | 0x7fed8e425480 | 131072 | 650620 | 72795520 | 17703242018656 | 17703241986119 | 17703242271239 | 17703242273259 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7fed91369580 | 0x7fed8e4254c0 | 131072 | 637582 | 71352944 | 17703242304828 | 17703242271239 | 17703242589640 | 17703242591311 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7fed91369400 | 0x7fed8e425500 | 131072 | 654352 | 73307608 | 17703242630650 | 17703242589640 | 17703242868361 | 17703242870124 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7fed91369280 | 0x7fed8e425540 | 131072 | 682316 | 76289128 | 17703242901103 | 17703242868361 | 17703243239082 | 17703243240785 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7fed91369100 | 0x7fed8e425580 | 65536 | 635588 | 71257504 | 17703243272424 | 17703243239082 | 17703243604043 | 17703243605696 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7fed8ed09f80 | 0x7fed8e4255c0 | 131072 | 685798 | 76836648 | 17703243637245 | 17703243604043 | 17703243883884 | 17703243885489 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7fed8ed09e00 | 0x7fed8e425600 | 131072 | 682358 | 76453728 | 17703243916608 | 17703243883884 | 17703244203885 | 17703244205680 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7fed8ed09c80 | 0x7fed8e425640 | 131072 | 677970 | 76119264 | 17703244243390 | 17703244203885 | 17703244488686 | 17703244490343 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7fed8ed09b00 | 0x7fed8e425680 | 131072 | 676664 | 75875296 | 17703244521683 | 17703244488686 | 17703244861167 | 17703244862854 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7fed8ed09980 | 0x7fed8e4256c0 | 65536 | 640526 | 71758152 | 17703244894033 | 17703244861167 | 17703245226288 | 17703245228005 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7fed8ed09800 | 0x7fed8e425700 | 131072 | 680300 | 76107712 | 17703245258244 | 17703245226288 | 17703245508529 | 17703245510148 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7fed8ed09680 | 0x7fed8e425740 | 131072 | 689112 | 77141032 | 17703245541007 | 17703245508529 | 17703245834930 | 17703245836609 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7fed91369500 | 0x7fed8e425780 | 131072 | 663540 | 74563632 | 17703245874858 | 17703245834930 | 17703246113010 | 17703246114862 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7fed91369380 | 0x7fed8e4257c0 | 131072 | 692164 | 77535048 | 17703246146462 | 17703246113010 | 17703246483731 | 17703246485413 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7fed91369200 | 0x7fed8e425800 | 65536 | 645422 | 72272416 | 17703246516722 | 17703246483731 | 17703246846452 | 17703246848274 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7fed91369080 | 0x7fed8e425840 | 131072 | 647668 | 72487632 | 17703246878963 | 17703246846452 | 17703247131253 | 17703247132827 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7fed8ed09f00 | 0x7fed8e425880 | 131072 | 649744 | 72877728 | 17703247164366 | 17703247131253 | 17703247473014 | 17703247474738 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7fed8ed09d80 | 0x7fed8e4258c0 | 131072 | 1008904 | 113111432 | 17703247513207 | 17703247473014 | 17703247758935 | 17703247760551 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7fed8ed09c00 | 0x7fed8e425900 | 131072 | 643090 | 72076680 | 17703247791140 | 17703247758935 | 17703248122456 | 17703248124192 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7fed8ed09a80 | 0x7fed8e425940 | 65536 | 637770 | 71494776 | 17703248155451 | 17703248122456 | 17703248499897 | 17703248501522 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7fed8ed09900 | 0x7fed8e425980 | 131072 | 680622 | 76186808 | 17703248531732 | 17703248499897 | 17703248788378 | 17703248790115 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7fed8ed09780 | 0x7fed8e4259c0 | 131072 | 684288 | 76733440 | 17703248821324 | 17703248788378 | 17703249141819 | 17703249143546 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7fed8ed09600 | 0x7fed8e425a00 | 131072 | 1002888 | 112284696 | 17703249181805 | 17703249141819 | 17703249429660 | 17703249431319 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7fed91369480 | 0x7fed8e425a40 | 131072 | 668424 | 74857072 | 17703249462338 | 17703249429660 | 17703249796221 | 17703249797840 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7fed91369300 | 0x7fed8e425a80 | 65536 | 638094 | 71453344 | 17703249829259 | 17703249796221 | 17703250161982 | 17703250163890 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7fed91369180 | 0x7fed8e425ac0 | 131072 | 641984 | 71893376 | 17703250196020 | 17703250161982 | 17703250465183 | 17703250466793 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7fed91369000 | 0x7fed8e425b00 | 131072 | 642166 | 71948488 | 17703250497432 | 17703250465183 | 17703250835584 | 17703250837184 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7fed8ed09e80 | 0x7fed8e425b40 | 131072 | 959880 | 107410376 | 17703250875663 | 17703250835584 | 17703251130944 | 17703251132706 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7fed8ed09d00 | 0x7fed8e425b80 | 131072 | 681896 | 76277072 | 17703251163275 | 17703251130944 | 17703251501506 | 17703251503197 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7fed8ed09b80 | 0x7fed8e425bc0 | 65536 | 638812 | 71520384 | 17703251534066 | 17703251501506 | 17703251870467 | 17703251872318 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7fed8ed09a00 | 0x7fed8e425c00 | 131072 | 641712 | 71815680 | 17703251903417 | 17703251870467 | 17703252175587 | 17703252177310 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7fed8ed09880 | 0x7fed8e425c40 | 131072 | 676516 | 75832968 | 17703252209529 | 17703252175587 | 17703252569509 | 17703252592320 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7fed8ed09700 | 0x7fed8e425c80 | 131072 | 1006360 | 112807040 | 17703252611679 | 17703252569509 | 17703252876069 | 17703252877653 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7fed91369580 | 0x7fed8e425cc0 | 131072 | 643570 | 72086296 | 17703252907722 | 17703252876069 | 17703253245670 | 17703253247283 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7fed91369400 | 0x7fed8e425d00 | 65536 | 643972 | 72116576 | 17703253278763 | 17703253245670 | 17703253620232 | 17703253621814 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7fed91369280 | 0x7fed8e425d40 | 131072 | 642340 | 72028752 | 17703253652513 | 17703253620232 | 17703253946312 | 17703253947876 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7fed91369100 | 0x7fed8e425d80 | 131072 | 646224 | 72367848 | 17703253978835 | 17703253946312 | 17703254370794 | 17703254394155 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7fed8ed09f80 | 0x7fed8e425dc0 | 131072 | 969952 | 108637208 | 17703254414144 | 17703254370794 | 17703254697995 | 17703254699647 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7fed8ed09e00 | 0x7fed8e425e00 | 131072 | 672558 | 75339488 | 17703254730746 | 17703254697995 | 17703255077356 | 17703255080157 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7fed8ed09c80 | 0x7fed8e425e40 | 65536 | 644726 | 72271984 | 17703255110687 | 17703255077356 | 17703255462957 | 17703255483817 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7fed8ed09b00 | 0x7fed8e425e80 | 131072 | 646670 | 72376528 | 17703255495207 | 17703255462957 | 17703255817358 | 17703255819059 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7fed8ed09980 | 0x7fed8e425ec0 | 131072 | 641174 | 71874256 | 17703255849628 | 17703255817358 | 17703256286319 | 17703256306386 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7fed8ed09800 | 0x7fed8e425f00 | 131072 | 1012202 | 113524136 | 17703256326696 | 17703256286319 | 17703256629680 | 17703256631418 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7fed8ed09680 | 0x7fed8e425f40 | 131072 | 972560 | 108631832 | 17703256662128 | 17703256629680 | 17703257024561 | 17703257042038 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7fed91369500 | 0x7fed8e425f80 | 65536 | 632942 | 70899888 | 17703257056638 | 17703257024561 | 17703257426482 | 17703257443808 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7fed91369380 | 0x7fed8e425fc0 | 131072 | 652108 | 73058312 | 17703257458787 | 17703257426482 | 17703257804723 | 17703257806559 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7fed91369200 | 0x7fed8e426000 | 131072 | 644604 | 71980872 | 17703257837078 | 17703257804723 | 17703258327445 | 17703258345555 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7fed91369080 | 0x7fed8e426040 | 131072 | 1001328 | 112031784 | 17703258368715 | 17703258327445 | 17703258688726 | 17703258690536 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7fed8ed09f00 | 0x7fed8e426080 | 131072 | 1008242 | 112991312 | 17703258721056 | 17703258688726 | 17703259105687 | 17703259123136 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7fed8ed09d80 | 0x7fed8e4260c0 | 65536 | 636718 | 71193600 | 17703259139975 | 17703259105687 | 17703259525848 | 17703259542835 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7fed8ed09c00 | 0x7fed8e426100 | 131072 | 650582 | 72837608 | 17703259557765 | 17703259525848 | 17703259927769 | 17703259945015 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7fed8ed09a80 | 0x7fed8e426140 | 131072 | 643808 | 72014424 | 17703259960364 | 17703259927769 | 17703260506011 | 17703260523480 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7fed8ed09900 | 0x7fed8e426180 | 131072 | 1011462 | 113252312 | 17703260545860 | 17703260506011 | 17703260880092 | 17703260881751 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7fed8ed09780 | 0x7fed8e4261c0 | 131072 | 967332 | 108379304 | 17703260912711 | 17703260880092 | 17703261321693 | 17703261339180 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7fed8ed09600 | 0x7fed8e426200 | 65536 | 645724 | 72311224 | 17703261354919 | 17703261321693 | 17703261759934 | 17703261776939 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7fed91369480 | 0x7fed8e426240 | 131072 | 646338 | 72346416 | 17703261793008 | 17703261759934 | 17703262186176 | 17703262205228 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7fed91369300 | 0x7fed8e426280 | 131072 | 1020366 | 114192200 | 17703262220998 | 17703262186176 | 17703262834338 | 17703262851592 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7fed91369180 | 0x7fed8e4262c0 | 131072 | 998278 | 111870152 | 17703262874731 | 17703262834338 | 17703263253379 | 17703263270331 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7fed91369000 | 0x7fed8e426300 | 131072 | 966728 | 108202696 | 17703263286801 | 17703263253379 | 17703263741540 | 17703263758509 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7fed8ed09e80 | 0x7fed8e426340 | 65536 | 637992 | 71499768 | 17703263773879 | 17703263741540 | 17703264228101 | 17703264244747 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7fed8ed09d00 | 0x7fed8e426380 | 131072 | 971744 | 108719232 | 17703264260367 | 17703264228101 | 17703264713383 | 17703264730505 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7fed8ed09b80 | 0x7fed8e4263c0 | 131072 | 1021874 | 114647576 | 17703264745554 | 17703264713383 | 17703265458025 | 17703265475906 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7fed8ed09a00 | 0x7fed8e426400 | 131072 | 1032400 | 115574912 | 17703265497986 | 17703265458025 | 17703265916106 | 17703265937445 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7fed8ed09880 | 0x7fed8e426440 | 131072 | 1015756 | 113808416 | 17703265948224 | 17703265916106 | 17703266469228 | 17703266486871 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7fed8ed09700 | 0x7fed8e426480 | 65536 | 645040 | 72304888 | 17703266502070 | 17703266469228 | 17703267007629 | 17703267023617 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7fed91369580 | 0x7fed8e4264c0 | 131072 | 1004040 | 112478528 | 17703267039637 | 17703267007629 | 17703267546191 | 17703267561994 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7fed91369400 | 0x7fed8e426500 | 131072 | 998690 | 111876488 | 17703267579113 | 17703267546191 | 17703268394833 | 17703268411482 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7fed91369280 | 0x7fed8e426540 | 131072 | 1007132 | 112664944 | 17703268435352 | 17703268394833 | 17703269028915 | 17703269044516 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7fed91369100 | 0x7fed8e426580 | 131072 | 1001066 | 111993944 | 17703269061786 | 17703269028915 | 17703269681557 | 17703269697250 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7fed8ed09f80 | 0x7fed8e4265c0 | 65536 | 635816 | 71338440 | 17703269715020 | 17703269681557 | 17703270325879 | 17703270345054 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7fed8ed09e00 | 0x7fed8e426600 | 131072 | 1006120 | 112296928 | 17703270358873 | 17703270325879 | 17703270983480 | 17703271002737 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7fed8ed09c80 | 0x7fed8e426640 | 131072 | 1078742 | 120796496 | 17703271015817 | 17703270983480 | 17703272067004 | 17703272085050 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7fed8ed09b00 | 0x7fed8e426680 | 131072 | 1002408 | 112318776 | 17703272107659 | 17703272066871 | 17703273123673 | 17703273145913 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7fed8ed09980 | 0x7fed8e4266c0 | 131072 | 1007858 | 112911824 | 17703273156883 | 17703273123673 | 17703274216315 | 17703274258785 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7fed8ed09800 | 0x7fed8e426700 | 65536 | 641774 | 71844000 | 17703274270625 | 17703274216315 | 17703275328638 | 17703275393027 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7fed8ed09680 | 0x7fed8e426740 | 131072 | 996178 | 111902792 | 17703275404217 | 17703275328638 | 17703276442401 | 17703276482910 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7fed91369500 | 0x7fed8e426780 | 131072 | 1003104 | 112245392 | 17703276494649 | 17703276442401 | 17703278370246 | 17703278415841 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7fed91369380 | 0x7fed8e4267c0 | 131072 | 1001512 | 112282816 | 17703278435151 | 17703278370246 | 17703280274731 | 17703280319153 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7fed91369200 | 0x7fed8e426800 | 131072 | 1002310 | 112467848 | 17703280330753 | 17703280274731 | 17703282226096 | 17703282294603 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7fed91369080 | 0x7fed8e426840 | 65536 | 640844 | 71784192 | 17703282306123 | 17703282226096 | 17703284199861 | 17703284268924 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7fed8ed09f00 | 0x7fed8e426880 | 131072 | 1030734 | 115555040 | 17703284279724 | 17703284199861 | 17703286141466 | 17703286212105 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 229165 | 229165 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7fed8ed09d80 | 0x7fed8e4268c0 | 131072 | 1020118 | 114373520 | 17703286224035 | 17703286141466 | 17703289763555 | 17703289837694 |