44 KiB
44 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | GRBM_COUNT | GRBM_GUI_ACTIVE | SQ_WAVES | SQ_IFETCH | SQ_IFETCH_LEVEL | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 236503 | 236503 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7fe83c204280 | 385832 | 385832 | 524288 | 4718592 | 682094 | 76386864 | 17833173257611 | 17832460487290 | 17833324063793 | 17833324177862 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 236503 | 236503 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7fe83c223f80 | 34124 | 34124 | 512 | 8192 | 5540 | 624020 | 17833329373303 | 17833324063793 | 17833329503317 | 17833329508120 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7fe83f16b380 | 0x7fe83c223fc0 | 166451 | 166451 | 65536 | 917504 | 140662 | 15737800 | 17833329547519 | 17833329503317 | 17833329887317 | 17833329890091 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7fe83f16b200 | 0x7fe83c224000 | 320813 | 320813 | 65536 | 1114112 | 167869 | 18973284 | 17833329928940 | 17833329887317 | 17833330326517 | 17833330329380 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7fe83f16b080 | 0x7fe83c224040 | 323006 | 323006 | 65536 | 917504 | 146978 | 16539568 | 17833330364489 | 17833330326517 | 17833330747798 | 17833330753919 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7fe83cb0bf00 | 0x7fe83c224080 | 168550 | 168550 | 65536 | 1048576 | 159174 | 17856292 | 17833330784798 | 17833330747798 | 17833331068118 | 17833331070481 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7fe83cb0bd80 | 0x7fe83c2240c0 | 168572 | 168572 | 65536 | 983040 | 148090 | 16569436 | 17833331104930 | 17833331068118 | 17833331386678 | 17833331389103 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7fe83cb0bc00 | 0x7fe83c224100 | 167664 | 167664 | 65536 | 1114112 | 162610 | 18224860 | 17833331435702 | 17833331386678 | 17833331703318 | 17833331705705 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7fe83cb0ba80 | 0x7fe83c224140 | 320079 | 320079 | 65536 | 1310720 | 202232 | 22647988 | 17833331740015 | 17833331703318 | 17833332108599 | 17833332110925 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7fe83cb0b900 | 0x7fe83c224180 | 316809 | 316809 | 65536 | 1179648 | 176290 | 19855416 | 17833332143565 | 17833332108599 | 17833332528439 | 17833332530935 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7fe83cb0b780 | 0x7fe83c2241c0 | 168281 | 168281 | 65536 | 1245184 | 188620 | 21166232 | 17833332564054 | 17833332528439 | 17833332839959 | 17833332842307 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7fe83cb0b600 | 0x7fe83c224200 | 169494 | 169494 | 65536 | 1245184 | 202520 | 22612512 | 17833332876086 | 17833332839959 | 17833333154039 | 17833333156369 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7fe83f16b480 | 0x7fe83c224240 | 171299 | 171299 | 65536 | 1245184 | 200754 | 22467976 | 17833333198828 | 17833333154039 | 17833333471320 | 17833333473552 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7fe83f16b300 | 0x7fe83c224280 | 320776 | 320776 | 65536 | 1441792 | 216093 | 24168728 | 17833333508101 | 17833333471320 | 17833333874840 | 17833333881351 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7fe83f16b180 | 0x7fe83c2242c0 | 316393 | 316393 | 65536 | 1310720 | 197617 | 22204988 | 17833333911551 | 17833333874840 | 17833334286360 | 17833334289041 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7fe83f16b000 | 0x7fe83c224300 | 169264 | 169264 | 65536 | 1376256 | 205151 | 23034404 | 17833334324160 | 17833334286360 | 17833334608441 | 17833334610943 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7fe83cb0be80 | 0x7fe83c224340 | 168263 | 168263 | 65536 | 1441792 | 221753 | 24858852 | 17833334644352 | 17833334608441 | 17833334922841 | 17833334925195 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7fe83cb0bd00 | 0x7fe83c224380 | 167492 | 167492 | 65536 | 1310720 | 195746 | 21931324 | 17833334967074 | 17833334922841 | 17833335246361 | 17833335248667 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7fe83cb0bb80 | 0x7fe83c2243c0 | 316291 | 316291 | 65536 | 1572864 | 232311 | 26113788 | 17833335285227 | 17833335246361 | 17833335624441 | 17833335626348 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7fe83cb0ba00 | 0x7fe83c224400 | 312673 | 312673 | 65536 | 1441792 | 209241 | 23385064 | 17833335661197 | 17833335624441 | 17833335999642 | 17833336001459 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7fe83cb0b880 | 0x7fe83c224440 | 166555 | 166555 | 65536 | 1507328 | 224652 | 25196208 | 17833336035928 | 17833335999642 | 17833336288122 | 17833336290022 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7fe83cb0b700 | 0x7fe83c224480 | 168033 | 168033 | 65536 | 1638400 | 243000 | 27172084 | 17833336324411 | 17833336288122 | 17833336577882 | 17833336579724 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7fe83f16b580 | 0x7fe83c2244c0 | 169325 | 169325 | 65536 | 1441792 | 215804 | 24164768 | 17833336621253 | 17833336577882 | 17833336865242 | 17833336867167 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7fe83f16b400 | 0x7fe83c224500 | 317983 | 317983 | 65536 | 1703936 | 251876 | 28216384 | 17833336903336 | 17833336865242 | 17833337239963 | 17833337241868 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7fe83f16b280 | 0x7fe83c224540 | 316071 | 316071 | 65536 | 1572864 | 233891 | 26185384 | 17833337276507 | 17833337239963 | 17833337615003 | 17833337616889 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7fe83f16b100 | 0x7fe83c224580 | 167827 | 167827 | 65536 | 1638400 | 243052 | 27250156 | 17833337650858 | 17833337615003 | 17833337911803 | 17833337913661 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7fe83cb0bf80 | 0x7fe83c2245c0 | 167561 | 167561 | 65536 | 1835008 | 270019 | 30313992 | 17833337948630 | 17833337911803 | 17833338216123 | 17833338218214 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7fe83cb0be00 | 0x7fe83c224600 | 166155 | 166155 | 65536 | 1507328 | 223562 | 25065536 | 17833338260273 | 17833338216123 | 17833338505724 | 17833338507656 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7fe83cb0bc80 | 0x7fe83c224640 | 313708 | 313708 | 65536 | 1835008 | 272596 | 30454488 | 17833338544396 | 17833338505724 | 17833338882684 | 17833338884677 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7fe83cb0bb00 | 0x7fe83c224680 | 313561 | 313561 | 65536 | 1703936 | 248219 | 27816044 | 17833338919186 | 17833338882684 | 17833339257084 | 17833339259098 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7fe83cb0b980 | 0x7fe83c2246c0 | 168531 | 168531 | 65536 | 1769472 | 264701 | 29659096 | 17833339293197 | 17833339257084 | 17833339545244 | 17833339547101 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7fe83cb0b800 | 0x7fe83c224700 | 168533 | 168533 | 65536 | 2031616 | 303743 | 34041364 | 17833339581850 | 17833339545244 | 17833339833885 | 17833339835803 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7fe83cb0b680 | 0x7fe83c224740 | 168721 | 168721 | 65536 | 1638400 | 243880 | 27433232 | 17833339877512 | 17833339833885 | 17833340126845 | 17833340128726 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7fe83f16b500 | 0x7fe83c224780 | 311801 | 311801 | 65536 | 1966080 | 288908 | 32275144 | 17833340163205 | 17833340126845 | 17833340509405 | 17833340511177 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7fe83f16b380 | 0x7fe83c2247c0 | 314592 | 314592 | 65536 | 1835008 | 272159 | 30484976 | 17833340546636 | 17833340509405 | 17833340889245 | 17833340891087 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7fe83f16b200 | 0x7fe83c224800 | 168011 | 168011 | 65536 | 1900544 | 281499 | 31452584 | 17833340925936 | 17833340889245 | 17833341181406 | 17833341183040 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7fe83f16b080 | 0x7fe83c224840 | 168636 | 168636 | 65536 | 2228224 | 328196 | 36754620 | 17833341218079 | 17833341181406 | 17833341472606 | 17833341474483 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7fe83cb0bf00 | 0x7fe83c224880 | 169134 | 169134 | 65536 | 1703936 | 257950 | 28833172 | 17833341515762 | 17833341472606 | 17833341761886 | 17833341763986 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7fe83cb0bd80 | 0x7fe83c2248c0 | 311600 | 311600 | 65536 | 2097152 | 311380 | 34862612 | 17833341798245 | 17833341761886 | 17833342137566 | 17833342139966 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7fe83cb0bc00 | 0x7fe83c224900 | 311542 | 311542 | 65536 | 1966080 | 284002 | 31844304 | 17833342176125 | 17833342137566 | 17833342523327 | 17833342525247 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7fe83cb0ba80 | 0x7fe83c224940 | 168342 | 168342 | 65536 | 2031616 | 302765 | 33940188 | 17833342559536 | 17833342523327 | 17833342815647 | 17833342817649 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7fe83cb0b900 | 0x7fe83c224980 | 169165 | 169165 | 65536 | 2424832 | 362267 | 40550672 | 17833342852049 | 17833342815647 | 17833343114047 | 17833343115852 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7fe83cb0b780 | 0x7fe83c2249c0 | 168186 | 168186 | 65536 | 1835008 | 272130 | 30424784 | 17833343157201 | 17833343114047 | 17833343405727 | 17833343407425 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7fe83cb0b600 | 0x7fe83c224a00 | 312770 | 312770 | 65536 | 2228224 | 327050 | 36634776 | 17833343441984 | 17833343405727 | 17833343780928 | 17833343782835 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7fe83f16b480 | 0x7fe83c224a40 | 306056 | 306056 | 65536 | 2097152 | 309123 | 34672752 | 17833343818545 | 17833343780928 | 17833344158688 | 17833344160556 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7fe83f16b300 | 0x7fe83c224a80 | 167548 | 167548 | 65536 | 2162688 | 317410 | 35619068 | 17833344195655 | 17833344158688 | 17833344447968 | 17833344449669 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7fe83f16b180 | 0x7fe83c224ac0 | 169504 | 169504 | 65536 | 2621440 | 384926 | 43161376 | 17833344484848 | 17833344447968 | 17833344739968 | 17833344741802 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7fe83f16b000 | 0x7fe83c224b00 | 165512 | 165512 | 65536 | 1966080 | 291635 | 32744156 | 17833344783641 | 17833344739968 | 17833345032609 | 17833345034574 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7fe83cb0be80 | 0x7fe83c224b40 | 307635 | 307635 | 65536 | 2359296 | 355072 | 39814608 | 17833345076833 | 17833345032609 | 17833345407329 | 17833345409095 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7fe83cb0bd00 | 0x7fe83c224b80 | 306044 | 306044 | 65536 | 2228224 | 328227 | 36844320 | 17833345443604 | 17833345407329 | 17833345783969 | 17833345785826 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7fe83cb0bb80 | 0x7fe83c224bc0 | 168845 | 168845 | 65536 | 2293760 | 348654 | 38971364 | 17833345820455 | 17833345783969 | 17833346075329 | 17833346083318 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7fe83cb0ba00 | 0x7fe83c224c00 | 169498 | 169498 | 65536 | 2752512 | 404228 | 45354672 | 17833346112458 | 17833346075329 | 17833346373410 | 17833346375231 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7fe83cb0b880 | 0x7fe83c224c40 | 169071 | 169071 | 65536 | 2031616 | 303042 | 33913500 | 17833346416440 | 17833346373410 | 17833346667010 | 17833346668874 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7fe83cb0b700 | 0x7fe83c224c80 | 307122 | 307122 | 65536 | 2490368 | 369401 | 41428256 | 17833346706213 | 17833346667010 | 17833347040930 | 17833347042884 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7fe83f16b580 | 0x7fe83c224cc0 | 308959 | 308959 | 65536 | 2359296 | 365280 | 40887324 | 17833347076864 | 17833347040930 | 17833347420450 | 17833347422375 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7fe83f16b400 | 0x7fe83c224d00 | 169956 | 169956 | 65536 | 2424832 | 381780 | 42729400 | 17833347457904 | 17833347420450 | 17833347711011 | 17833347712878 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7fe83f16b280 | 0x7fe83c224d40 | 173407 | 173407 | 65536 | 2949120 | 441931 | 49481420 | 17833347747547 | 17833347711011 | 17833348005091 | 17833348006880 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7fe83f16b100 | 0x7fe83c224d80 | 166344 | 166344 | 65536 | 2162688 | 321975 | 36072248 | 17833348048719 | 17833348005091 | 17833348302691 | 17833348304553 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7fe83cb0bf80 | 0x7fe83c224dc0 | 305814 | 305814 | 65536 | 2621440 | 389080 | 43384336 | 17833348339332 | 17833348302691 | 17833348678051 | 17833348680044 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7fe83cb0be00 | 0x7fe83c224e00 | 304155 | 304155 | 65536 | 2490368 | 364521 | 40814816 | 17833348715763 | 17833348678051 | 17833349050532 | 17833349052354 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7fe83cb0bc80 | 0x7fe83c224e40 | 170016 | 170016 | 65536 | 2555904 | 381139 | 42794068 | 17833349087144 | 17833349050532 | 17833349345252 | 17833349346957 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7fe83cb0bb00 | 0x7fe83c224e80 | 177017 | 177017 | 65536 | 3145728 | 470883 | 52684580 | 17833349382036 | 17833349345252 | 17833349643652 | 17833349645520 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7fe83cb0b980 | 0x7fe83c224ec0 | 166578 | 166578 | 65536 | 2228224 | 327804 | 36764916 | 17833349687679 | 17833349643652 | 17833349935492 | 17833349937203 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7fe83cb0b800 | 0x7fe83c224f00 | 302457 | 302457 | 65536 | 2752512 | 406147 | 45544456 | 17833349973952 | 17833349935492 | 17833350316773 | 17833350318913 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7fe83cb0b680 | 0x7fe83c224f40 | 304510 | 304510 | 65536 | 2621440 | 386423 | 43272968 | 17833350354692 | 17833350316773 | 17833350692933 | 17833350694984 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7fe83f16b500 | 0x7fe83c224f80 | 167339 | 167339 | 65536 | 2686976 | 399117 | 44684512 | 17833350728583 | 17833350692933 | 17833350982053 | 17833350984027 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7fe83f16b380 | 0x7fe83c224fc0 | 183614 | 183614 | 65536 | 3342336 | 496613 | 55633136 | 17833351018986 | 17833350982053 | 17833351282533 | 17833351284429 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7fe83f16b200 | 0x7fe83c225000 | 167166 | 167166 | 65536 | 2359296 | 350153 | 39373624 | 17833351338838 | 17833351282533 | 17833351576774 | 17833351578622 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7fe83f16b080 | 0x7fe83c225040 | 303630 | 303630 | 65536 | 2883584 | 435848 | 48734928 | 17833351615461 | 17833351576774 | 17833351958214 | 17833351960042 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7fe83cb0bf00 | 0x7fe83c225080 | 303100 | 303100 | 65536 | 2686976 | 399594 | 44765504 | 17833351995661 | 17833351958214 | 17833352333094 | 17833352335093 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7fe83cb0bd80 | 0x7fe83c2250c0 | 170425 | 170425 | 65536 | 2818048 | 421112 | 47160840 | 17833352369572 | 17833352333094 | 17833352623174 | 17833352625026 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7fe83cb0bc00 | 0x7fe83c225100 | 192467 | 192467 | 65536 | 3538944 | 538081 | 60204324 | 17833352659005 | 17833352623174 | 17833352927655 | 17833352929528 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7fe83cb0ba80 | 0x7fe83c225140 | 169322 | 169322 | 65536 | 2424832 | 359577 | 40321568 | 17833352971487 | 17833352927655 | 17833353224455 | 17833353226431 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7fe83cb0b900 | 0x7fe83c225180 | 308086 | 308086 | 65536 | 3014656 | 453709 | 50727012 | 17833353260050 | 17833353224455 | 17833353611495 | 17833353613361 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7fe83cb0b780 | 0x7fe83c2251c0 | 303114 | 303114 | 65536 | 2818048 | 414457 | 46395432 | 17833353647860 | 17833353611495 | 17833353985735 | 17833353987472 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7fe83cb0b600 | 0x7fe83c225200 | 168204 | 168204 | 65536 | 2949120 | 439817 | 49244168 | 17833354022171 | 17833353985735 | 17833354291816 | 17833354293764 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7fe83f16b480 | 0x7fe83c225240 | 201871 | 201871 | 65536 | 3735552 | 560870 | 62806964 | 17833354328653 | 17833354291816 | 17833354605416 | 17833354607396 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7fe83f16b300 | 0x7fe83c225280 | 166916 | 166916 | 65536 | 2555904 | 395655 | 44391096 | 17833354649265 | 17833354605416 | 17833354895656 | 17833354897599 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7fe83f16b180 | 0x7fe83c2252c0 | 304577 | 304577 | 65536 | 3145728 | 466630 | 52282620 | 17833354933938 | 17833354895656 | 17833355272616 | 17833355274500 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7fe83f16b000 | 0x7fe83c225300 | 301618 | 301618 | 65536 | 2949120 | 438044 | 48999416 | 17833355310369 | 17833355272616 | 17833355645897 | 17833355647791 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7fe83cb0be80 | 0x7fe83c225340 | 168835 | 168835 | 65536 | 3080192 | 459338 | 51414080 | 17833355681500 | 17833355645897 | 17833355934057 | 17833355936003 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7fe83cb0bd00 | 0x7fe83c225380 | 211422 | 211422 | 65536 | 3932160 | 584962 | 65429388 | 17833355970523 | 17833355934057 | 17833356256617 | 17833356258445 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7fe83cb0bb80 | 0x7fe83c2253c0 | 167511 | 167511 | 65536 | 2621440 | 388846 | 43578000 | 17833356300124 | 17833356256617 | 17833356552617 | 17833356554738 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7fe83cb0ba00 | 0x7fe83c225400 | 304783 | 304783 | 65536 | 3276800 | 487250 | 54676880 | 17833356589057 | 17833356552617 | 17833356926858 | 17833356928709 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7fe83cb0b880 | 0x7fe83c225440 | 304031 | 304031 | 65536 | 3080192 | 465994 | 52152364 | 17833356962958 | 17833356926858 | 17833357302858 | 17833357304939 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7fe83cb0b700 | 0x7fe83c225480 | 168847 | 168847 | 65536 | 3211264 | 472919 | 52929148 | 17833357338709 | 17833357302858 | 17833357593578 | 17833357595522 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7fe83f16b580 | 0x7fe83c2254c0 | 218845 | 218845 | 65536 | 4128768 | 609203 | 68267656 | 17833357630121 | 17833357593578 | 17833357919978 | 17833357921834 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7fe83f16b400 | 0x7fe83c225500 | 167201 | 167201 | 65536 | 2752512 | 408007 | 45704904 | 17833357964573 | 17833357919978 | 17833358219659 | 17833358221797 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7fe83f16b280 | 0x7fe83c225540 | 300053 | 300053 | 65536 | 3407872 | 509053 | 56999112 | 17833358258066 | 17833358219659 | 17833358597099 | 17833358598907 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7fe83f16b100 | 0x7fe83c225580 | 300200 | 300200 | 65536 | 3211264 | 474244 | 53131240 | 17833358633596 | 17833358597099 | 17833358972619 | 17833358974498 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7fe83cb0bf80 | 0x7fe83c2255c0 | 168788 | 168788 | 65536 | 3276800 | 492858 | 55205864 | 17833359009827 | 17833358972619 | 17833359262379 | 17833359264261 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7fe83cb0be00 | 0x7fe83c225600 | 232164 | 232164 | 65536 | 4325376 | 648749 | 72658560 | 17833359298580 | 17833359262379 | 17833359594060 | 17833359595993 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7fe83cb0bc80 | 0x7fe83c225640 | 169376 | 169376 | 65536 | 2818048 | 429623 | 48129556 | 17833359638381 | 17833359594060 | 17833359888300 | 17833359890205 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7fe83cb0bb00 | 0x7fe83c225680 | 300713 | 300713 | 65536 | 3538944 | 524423 | 58732196 | 17833359923974 | 17833359888300 | 17833360260140 | 17833360262016 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7fe83cb0b980 | 0x7fe83c2256c0 | 302008 | 302008 | 65536 | 3407872 | 502770 | 56356060 | 17833360296845 | 17833360260140 | 17833360630540 | 17833360632417 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7fe83cb0b800 | 0x7fe83c225700 | 167077 | 167077 | 65536 | 3407872 | 513280 | 57448736 | 17833360666996 | 17833360630540 | 17833360919021 | 17833360920880 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7fe83cb0b680 | 0x7fe83c225740 | 240548 | 240548 | 65536 | 4521984 | 677850 | 76029392 | 17833360955349 | 17833360919021 | 17833361257421 | 17833361259191 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7fe83f16b500 | 0x7fe83c225780 | 169238 | 169238 | 65536 | 3014656 | 460312 | 51595968 | 17833361301430 | 17833361257421 | 17833361555981 | 17833361557714 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7fe83f16b380 | 0x7fe83c2257c0 | 303321 | 303321 | 65536 | 3801088 | 565090 | 63265024 | 17833361592213 | 17833361555981 | 17833361935341 | 17833361937344 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7fe83f16b200 | 0x7fe83c225800 | 304169 | 304169 | 65536 | 3670016 | 555213 | 62175088 | 17833361972664 | 17833361935341 | 17833362320622 | 17833362322655 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7fe83f16b080 | 0x7fe83c225840 | 173257 | 173257 | 65536 | 3670016 | 558045 | 62469356 | 17833362358914 | 17833362320622 | 17833362617102 | 17833362619097 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7fe83cb0bf00 | 0x7fe83c225880 | 258461 | 258461 | 65536 | 4915200 | 746817 | 83594780 | 17833362654677 | 17833362617102 | 17833362965582 | 17833362967549 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7fe83cb0bd80 | 0x7fe83c2258c0 | 170911 | 170911 | 65536 | 3145728 | 467869 | 52410260 | 17833363011138 | 17833362965582 | 17833363263343 | 17833363265301 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7fe83cb0bc00 | 0x7fe83c225900 | 301919 | 301919 | 65536 | 4063232 | 617922 | 69219988 | 17833363300421 | 17833363263343 | 17833363636943 | 17833363638762 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7fe83cb0ba80 | 0x7fe83c225940 | 301829 | 301829 | 65536 | 3932160 | 597857 | 66953784 | 17833363674591 | 17833363636943 | 17833364009263 | 17833364011223 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7fe83cb0b900 | 0x7fe83c225980 | 177968 | 177968 | 65536 | 3932160 | 596056 | 66734084 | 17833364045152 | 17833364009263 | 17833364312623 | 17833364314605 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7fe83cb0b780 | 0x7fe83c2259c0 | 278430 | 278430 | 65536 | 5308416 | 795390 | 89144032 | 17833364348674 | 17833364312623 | 17833364671344 | 17833364673196 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7fe83cb0b600 | 0x7fe83c225a00 | 168158 | 168158 | 65536 | 3342336 | 496115 | 55511576 | 17833364715915 | 17833364671344 | 17833364967984 | 17833364969829 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7fe83f16b480 | 0x7fe83c225a40 | 302112 | 302112 | 65536 | 4325376 | 679360 | 75998736 | 17833365004128 | 17833364967984 | 17833365343184 | 17833365345140 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7fe83f16b300 | 0x7fe83c225a80 | 300038 | 300038 | 65536 | 4194304 | 640040 | 71578624 | 17833365380529 | 17833365343184 | 17833365718064 | 17833365719900 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7fe83f16b180 | 0x7fe83c225ac0 | 187296 | 187296 | 65536 | 4194304 | 633708 | 70979648 | 17833365753980 | 17833365718064 | 17833366021105 | 17833366023093 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7fe83f16b000 | 0x7fe83c225b00 | 300034 | 300034 | 65536 | 5701632 | 866651 | 97056844 | 17833366058802 | 17833366021105 | 17833366401905 | 17833366403933 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7fe83cb0be80 | 0x7fe83c225b40 | 171812 | 171812 | 65536 | 3735552 | 559895 | 62694600 | 17833366446302 | 17833366401905 | 17833366700305 | 17833366702346 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7fe83cb0bd00 | 0x7fe83c225b80 | 303329 | 303329 | 65536 | 4849664 | 764136 | 85670204 | 17833366739525 | 17833366700305 | 17833367079665 | 17833367081477 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7fe83cb0bb80 | 0x7fe83c225bc0 | 304282 | 304282 | 65536 | 4718592 | 738083 | 82726232 | 17833367115496 | 17833367079665 | 17833367467186 | 17833367469197 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7fe83cb0ba00 | 0x7fe83c225c00 | 206411 | 206411 | 65536 | 4718592 | 716943 | 80228732 | 17833367503216 | 17833367467186 | 17833367783666 | 17833367785549 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7fe83cb0b880 | 0x7fe83c225c40 | 340023 | 340023 | 65536 | 6488064 | 983106 | 110076864 | 17833367819648 | 17833367783666 | 17833368182866 | 17833368209779 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7fe83cb0b700 | 0x7fe83c225c80 | 184379 | 184379 | 65536 | 4128768 | 621586 | 69574528 | 17833368228628 | 17833368182866 | 17833368500787 | 17833368502701 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7fe83f16b580 | 0x7fe83c225cc0 | 303703 | 303703 | 65536 | 5373952 | 859064 | 96251956 | 17833368539740 | 17833368500787 | 17833368880307 | 17833368882192 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7fe83f16b400 | 0x7fe83c225d00 | 306151 | 306151 | 65536 | 5242880 | 848046 | 94899672 | 17833368917151 | 17833368880307 | 17833369260947 | 17833369265292 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7fe83f16b280 | 0x7fe83c225d40 | 226653 | 226653 | 65536 | 5242880 | 782651 | 87709652 | 17833369297242 | 17833369260947 | 17833369588627 | 17833369590554 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7fe83f16b100 | 0x7fe83c225d80 | 380709 | 380709 | 65536 | 7274496 | 1096835 | 122880504 | 17833369624613 | 17833369588627 | 17833370019028 | 17833370038103 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7fe83cb0bf80 | 0x7fe83c225dc0 | 211326 | 211326 | 65536 | 4915200 | 734226 | 82202996 | 17833370063632 | 17833370019028 | 17833370349428 | 17833370351515 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7fe83cb0be00 | 0x7fe83c225e00 | 308027 | 308027 | 65536 | 6422528 | 990606 | 110945628 | 17833370385265 | 17833370349428 | 17833370734868 | 17833370784165 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7fe83cb0bc80 | 0x7fe83c225e40 | 311334 | 311334 | 65536 | 6291456 | 1015562 | 113688560 | 17833370794694 | 17833370734868 | 17833371160949 | 17833371207294 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7fe83cb0bb00 | 0x7fe83c225e80 | 266391 | 266391 | 65536 | 6291456 | 959541 | 107455604 | 17833371218164 | 17833371160949 | 17833371546549 | 17833371548436 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7fe83cb0b980 | 0x7fe83c225ec0 | 461600 | 461600 | 65536 | 8847360 | 1334366 | 149533012 | 17833371582655 | 17833371546549 | 17833372022069 | 17833372068323 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7fe83cb0b800 | 0x7fe83c225f00 | 245533 | 245533 | 65536 | 5701632 | 872385 | 97746628 | 17833372087512 | 17833372022069 | 17833372399350 | 17833372401214 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7fe83cb0b680 | 0x7fe83c225f40 | 333240 | 333240 | 65536 | 7471104 | 1190293 | 133416856 | 17833372438303 | 17833372399350 | 17833372805430 | 17833372827754 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7fe83f16b500 | 0x7fe83c225f80 | 331906 | 331906 | 65536 | 7340032 | 1156506 | 129439136 | 17833372840983 | 17833372805430 | 17833373216470 | 17833373237694 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7fe83f16b380 | 0x7fe83c225fc0 | 306784 | 306784 | 65536 | 7340032 | 1122895 | 125758168 | 17833373253713 | 17833373216470 | 17833373602070 | 17833373604035 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7fe83f16b200 | 0x7fe83c226000 | 542870 | 542870 | 65536 | 10420224 | 1572795 | 176191112 | 17833373638674 | 17833373602070 | 17833374129111 | 17833374151011 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7fe83f16b080 | 0x7fe83c226040 | 273524 | 273524 | 65536 | 6488064 | 1001580 | 112199020 | 17833374174310 | 17833374129111 | 17833374501751 | 17833374503742 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7fe83cb0bf00 | 0x7fe83c226080 | 367402 | 367402 | 65536 | 8519680 | 1353274 | 151506452 | 17833374538861 | 17833374501751 | 17833374928631 | 17833374946841 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7fe83cb0bd80 | 0x7fe83c2260c0 | 365216 | 365216 | 65536 | 8388608 | 1304526 | 146097372 | 17833374965361 | 17833374928631 | 17833375353272 | 17833375371071 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7fe83cb0bc00 | 0x7fe83c226100 | 347450 | 347450 | 65536 | 8388608 | 1301080 | 145747168 | 17833375389370 | 17833375353272 | 17833375759832 | 17833375776981 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7fe83cb0ba80 | 0x7fe83c226140 | 623883 | 623883 | 65536 | 11993088 | 1821460 | 204012224 | 17833375795600 | 17833375759832 | 17833376342393 | 17833376359956 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7fe83cb0b900 | 0x7fe83c226180 | 301927 | 301927 | 65536 | 7274496 | 1129391 | 126520252 | 17833376386155 | 17833376342393 | 17833376726873 | 17833376728867 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7fe83cb0b780 | 0x7fe83c2261c0 | 397112 | 397112 | 65536 | 9568256 | 1519909 | 170238480 | 17833376763316 | 17833376726873 | 17833377172793 | 17833377191405 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7fe83cb0b600 | 0x7fe83c226200 | 390579 | 390579 | 65536 | 9437184 | 1516148 | 169854668 | 17833377210205 | 17833377172793 | 17833377619354 | 17833377636884 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7fe83f16b480 | 0x7fe83c226240 | 388246 | 388246 | 65536 | 9437184 | 1469651 | 164646916 | 17833377656044 | 17833377619354 | 17833378054714 | 17833378073234 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7fe83f16b300 | 0x7fe83c226280 | 719031 | 719031 | 65536 | 16056320 | 2305568 | 258136480 | 17833378093213 | 17833378054714 | 17833378709754 | 17833378756117 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7fe83f16b180 | 0x7fe83c2262c0 | 364708 | 364708 | 65536 | 8847360 | 1370645 | 153515112 | 17833378775936 | 17833378709754 | 17833379159035 | 17833379204805 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7fe83f16b000 | 0x7fe83c226300 | 469173 | 469173 | 65536 | 11665408 | 1832647 | 205290624 | 17833379216425 | 17833379159035 | 17833379686075 | 17833379731762 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7fe83cb0be80 | 0x7fe83c226340 | 472147 | 472147 | 65536 | 11468800 | 1836446 | 205663764 | 17833379742592 | 17833379686075 | 17833380206876 | 17833380252019 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7fe83cb0bd00 | 0x7fe83c226380 | 483319 | 483319 | 65536 | 14090240 | 2020745 | 226286316 | 17833380262739 | 17833380206876 | 17833380730396 | 17833380775826 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7fe83cb0bb80 | 0x7fe83c2263c0 | 880693 | 880693 | 65536 | 19202048 | 2756489 | 308858668 | 17833380786746 | 17833380730396 | 17833381509117 | 17833381554727 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7fe83cb0ba00 | 0x7fe83c226400 | 426823 | 426823 | 65536 | 10420224 | 1609659 | 180348376 | 17833381573027 | 17833381509117 | 17833381995517 | 17833382013656 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7fe83cb0b880 | 0x7fe83c226440 | 550151 | 550151 | 65536 | 13762560 | 2210664 | 247726852 | 17833382032035 | 17833381995517 | 17833382551997 | 17833382597981 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7fe83cb0b700 | 0x7fe83c226480 | 551517 | 551517 | 65536 | 13565952 | 2140716 | 239728764 | 17833382609251 | 17833382551997 | 17833383127358 | 17833383172737 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7fe83f16b580 | 0x7fe83c2264c0 | 564777 | 564777 | 65536 | 15466496 | 2228456 | 249593016 | 17833383183477 | 17833383127358 | 17833383699518 | 17833383744933 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7fe83f16b400 | 0x7fe83c226500 | 1044359 | 1044359 | 65536 | 22347776 | 3211299 | 359707520 | 17833383755813 | 17833383699518 | 17833384583359 | 17833384626841 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7fe83f16b280 | 0x7fe83c226540 | 722945 | 722945 | 65536 | 20250624 | 2923813 | 327459048 | 17833384644931 | 17833384583359 | 17833385251039 | 17833385295565 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7fe83f16b100 | 0x7fe83c226580 | 725769 | 725769 | 65536 | 20447232 | 2935642 | 328720784 | 17833385306544 | 17833385251039 | 17833385941920 | 17833385960188 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7fe83cb0bf80 | 0x7fe83c2265c0 | 721755 | 721755 | 65536 | 19595264 | 2818351 | 315615332 | 17833385979718 | 17833385941920 | 17833386603840 | 17833386650201 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7fe83cb0be00 | 0x7fe83c226600 | 727949 | 727949 | 65536 | 20381696 | 2928148 | 327905732 | 17833386661111 | 17833386603784 | 17833387281864 | 17833387333494 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7fe83cb0bc80 | 0x7fe83c226640 | 1366307 | 1366307 | 65536 | 31522816 | 4509238 | 505473072 | 17833387344264 | 17833387281864 | 17833388391624 | 17833388436797 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7fe83cb0bb00 | 0x7fe83c226680 | 1373247 | 1373247 | 65536 | 38993920 | 5583960 | 625679232 | 17833388456356 | 17833388391624 | 17833389481225 | 17833389547849 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7fe83cb0b980 | 0x7fe83c2266c0 | 1373929 | 1373929 | 65536 | 39124992 | 5615805 | 628883484 | 17833389559129 | 17833389481225 | 17833390631786 | 17833390703550 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7fe83cb0b800 | 0x7fe83c226700 | 1372851 | 1372851 | 65536 | 38469632 | 5509601 | 617057236 | 17833390715150 | 17833390631786 | 17833391778986 | 17833391848222 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7fe83cb0b680 | 0x7fe83c226740 | 1375132 | 1375132 | 65536 | 39059456 | 5596845 | 626840900 | 17833391858982 | 17833391778986 | 17833392899307 | 17833392966684 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7fe83f16b500 | 0x7fe83c226780 | 2664386 | 2664386 | 65536 | 60489728 | 8652521 | 969163852 | 17833392977874 | 17833392899307 | 17833394866828 | 17833394944075 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7fe83f16b380 | 0x7fe83c2267c0 | 2669534 | 2669534 | 65536 | 77266944 | 11073873 | 1240553420 | 17833394963545 | 17833394866828 | 17833396808270 | 17833396876617 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7fe83f16b200 | 0x7fe83c226800 | 2672170 | 2672170 | 65536 | 77398016 | 11071825 | 1240072748 | 17833396887957 | 17833396808270 | 17833398795791 | 17833398869628 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7fe83f16b080 | 0x7fe83c226840 | 2668592 | 2668592 | 65536 | 76218368 | 10904144 | 1221576836 | 17833398880977 | 17833398795791 | 17833400781712 | 17833400848588 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7fe83cb0bf00 | 0x7fe83c226880 | 2672754 | 2672754 | 65536 | 77332480 | 11067421 | 1239281240 | 17833400859718 | 17833400781712 | 17833402716274 | 17833402787070 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 236503 | 236503 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7fe83cb0bd80 | 0x7fe83c2268c0 | 5255776 | 5255776 | 65536 | 120258560 | 17187452 | 1925701988 | 17833402798580 | 17833402716274 | 17833406340436 | 17833406412550 |