44 KiB
44 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | GRBM_COUNT | GRBM_GUI_ACTIVE | SQ_WAVES | SQ_IFETCH | SQ_IFETCH_LEVEL | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 229387 | 229387 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7f6c7d404280 | 382955 | 382955 | 524288 | 4718592 | 681277 | 76305216 | 17703999491386 | 17703289764389 | 17704150035092 | 17704150122942 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 229387 | 229387 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7f6c7d423f80 | 33183 | 33183 | 512 | 8192 | 5968 | 677612 | 17704155264803 | 17704150035092 | 17704155402300 | 17704155407109 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7f6c80453380 | 0x7f6c7d423fc0 | 167502 | 167502 | 65536 | 917504 | 152335 | 17093232 | 17704155444078 | 17704155402300 | 17704155777981 | 17704155780500 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7f6c80453200 | 0x7f6c7d424000 | 321931 | 321931 | 65536 | 1114112 | 168959 | 18993004 | 17704155819119 | 17704155777981 | 17704156194942 | 17704156200929 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7f6c80453080 | 0x7f6c7d424040 | 319786 | 319786 | 65536 | 917504 | 139211 | 15543636 | 17704156231619 | 17704156194942 | 17704156602942 | 17704156605089 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7f6c7dcfbf00 | 0x7f6c7d424080 | 169384 | 169384 | 65536 | 1048576 | 158832 | 17783112 | 17704156640868 | 17704156602942 | 17704156913503 | 17704156915581 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7f6c7dcfbd80 | 0x7f6c7d4240c0 | 167664 | 167664 | 65536 | 983040 | 147357 | 16543664 | 17704156951100 | 17704156913503 | 17704157223583 | 17704157225814 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7f6c7dcfbc00 | 0x7f6c7d424100 | 166916 | 166916 | 65536 | 1114112 | 163667 | 18227732 | 17704157272902 | 17704157223583 | 17704157533184 | 17704157535236 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7f6c7dcfba80 | 0x7f6c7d424140 | 322022 | 322022 | 65536 | 1310720 | 203306 | 22691004 | 17704157569545 | 17704157533184 | 17704157934944 | 17704157939206 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7f6c7dcfb900 | 0x7f6c7d424180 | 317500 | 317500 | 65536 | 1179648 | 178451 | 19917816 | 17704157970965 | 17704157934944 | 17704158367905 | 17704158370365 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7f6c7dcfb780 | 0x7f6c7d4241c0 | 167822 | 167822 | 65536 | 1245184 | 189632 | 21233444 | 17704158405324 | 17704158367905 | 17704158689026 | 17704158691247 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7f6c7dcfb600 | 0x7f6c7d424200 | 166236 | 166236 | 65536 | 1245184 | 189850 | 21326848 | 17704158726446 | 17704158689026 | 17704158997026 | 17704158999119 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7f6c80453480 | 0x7f6c7d424240 | 166940 | 166940 | 65536 | 1245184 | 186251 | 20900792 | 17704159041998 | 17704158997026 | 17704159305507 | 17704159307011 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7f6c80453300 | 0x7f6c7d424280 | 321594 | 321594 | 65536 | 1441792 | 244344 | 27392076 | 17704159343310 | 17704159305507 | 17704159677987 | 17704159680632 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7f6c80453180 | 0x7f6c7d4242c0 | 315997 | 315997 | 65536 | 1310720 | 198936 | 22228636 | 17704159714071 | 17704159677987 | 17704160051108 | 17704160052532 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7f6c80453000 | 0x7f6c7d424300 | 168106 | 168106 | 65536 | 1376256 | 205879 | 23051544 | 17704160088091 | 17704160051108 | 17704160333348 | 17704160334955 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7f6c7dcfbe80 | 0x7f6c7d424340 | 169267 | 169267 | 65536 | 1441792 | 215468 | 24142504 | 17704160368864 | 17704160333348 | 17704160614789 | 17704160616378 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7f6c7dcfbd00 | 0x7f6c7d424380 | 166862 | 166862 | 65536 | 1310720 | 195656 | 21922376 | 17704160657857 | 17704160614789 | 17704160909829 | 17704160911371 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7f6c7dcfbb80 | 0x7f6c7d4243c0 | 317973 | 317973 | 65536 | 1572864 | 234285 | 26278436 | 17704160947060 | 17704160909829 | 17704161283590 | 17704161285191 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7f6c7dcfba00 | 0x7f6c7d424400 | 313256 | 313256 | 65536 | 1441792 | 207795 | 23263808 | 17704161319870 | 17704161283590 | 17704161652711 | 17704161654352 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7f6c7dcfb880 | 0x7f6c7d424440 | 169307 | 169307 | 65536 | 1507328 | 224378 | 25143440 | 17704161688581 | 17704161652711 | 17704161935111 | 17704161936645 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7f6c7dcfb700 | 0x7f6c7d424480 | 170722 | 170722 | 65536 | 1638400 | 242995 | 27281908 | 17704161971204 | 17704161935111 | 17704162231112 | 17704162232817 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7f6c80453580 | 0x7f6c7d4244c0 | 166926 | 166926 | 65536 | 1441792 | 217768 | 24282728 | 17704162274986 | 17704162231112 | 17704162520232 | 17704162521880 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7f6c80453400 | 0x7f6c7d424500 | 319654 | 319654 | 65536 | 1703936 | 252087 | 28239492 | 17704162557259 | 17704162520232 | 17704162894793 | 17704162898091 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7f6c80453280 | 0x7f6c7d424540 | 315191 | 315191 | 65536 | 1572864 | 233635 | 26087768 | 17704162931530 | 17704162894793 | 17704163266953 | 17704163268712 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7f6c80453100 | 0x7f6c7d424580 | 166135 | 166135 | 65536 | 1638400 | 248509 | 27802340 | 17704163303761 | 17704163266953 | 17704163551594 | 17704163553094 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7f6c7dcfbf80 | 0x7f6c7d4245c0 | 168919 | 168919 | 65536 | 1835008 | 270228 | 30248560 | 17704163588154 | 17704163551594 | 17704163833674 | 17704163835367 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7f6c7dcfbe00 | 0x7f6c7d424600 | 166818 | 166818 | 65536 | 1507328 | 226144 | 25298708 | 17704163876276 | 17704163833674 | 17704164120875 | 17704164122490 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7f6c7dcfbc80 | 0x7f6c7d424640 | 313307 | 313307 | 65536 | 1835008 | 273060 | 30490616 | 17704164157989 | 17704164120875 | 17704164493515 | 17704164495091 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7f6c7dcfbb00 | 0x7f6c7d424680 | 311646 | 311646 | 65536 | 1703936 | 248760 | 27772388 | 17704164528920 | 17704164493515 | 17704164862476 | 17704164864162 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7f6c7dcfb980 | 0x7f6c7d4246c0 | 169070 | 169070 | 65536 | 1769472 | 264799 | 29715516 | 17704164899431 | 17704164862476 | 17704165145516 | 17704165147125 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7f6c7dcfb800 | 0x7f6c7d424700 | 169812 | 169812 | 65536 | 2031616 | 303038 | 33948556 | 17704165182614 | 17704165145516 | 17704165430157 | 17704165431727 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7f6c7dcfb680 | 0x7f6c7d424740 | 169734 | 169734 | 65536 | 1638400 | 247300 | 27571712 | 17704165473646 | 17704165430157 | 17704165714637 | 17704165716200 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7f6c80453500 | 0x7f6c7d424780 | 312594 | 312594 | 65536 | 1966080 | 287935 | 32330112 | 17704165750630 | 17704165714637 | 17704166088878 | 17704166090591 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7f6c80453380 | 0x7f6c7d4247c0 | 311568 | 311568 | 65536 | 1835008 | 272288 | 30526020 | 17704166126110 | 17704166088878 | 17704166466319 | 17704166468062 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7f6c80453200 | 0x7f6c7d424800 | 166830 | 166830 | 65536 | 1900544 | 280895 | 31488136 | 17704166502801 | 17704166466319 | 17704166751919 | 17704166753534 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7f6c80453080 | 0x7f6c7d424840 | 168660 | 168660 | 65536 | 2228224 | 327623 | 36767524 | 17704166788573 | 17704166751919 | 17704167046000 | 17704167047547 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7f6c7dcfbf00 | 0x7f6c7d424880 | 169480 | 169480 | 65536 | 1703936 | 255814 | 28567784 | 17704167090266 | 17704167046000 | 17704167329200 | 17704167330780 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7f6c7dcfbd80 | 0x7f6c7d4248c0 | 310824 | 310824 | 65536 | 2097152 | 310808 | 34841344 | 17704167366739 | 17704167329200 | 17704167698161 | 17704167699640 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7f6c7dcfbc00 | 0x7f6c7d424900 | 309821 | 309821 | 65536 | 1966080 | 282942 | 31711288 | 17704167734410 | 17704167698161 | 17704168067441 | 17704168069071 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7f6c7dcfba80 | 0x7f6c7d424940 | 166646 | 166646 | 65536 | 2031616 | 302875 | 33953936 | 17704168103680 | 17704168067441 | 17704168351122 | 17704168352674 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7f6c7dcfb900 | 0x7f6c7d424980 | 169915 | 169915 | 65536 | 2424832 | 364068 | 40806484 | 17704168387423 | 17704168351122 | 17704168641202 | 17704168642657 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7f6c7dcfb780 | 0x7f6c7d4249c0 | 166020 | 166020 | 65536 | 1835008 | 282877 | 31667064 | 17704168683636 | 17704168641202 | 17704168930163 | 17704168931739 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7f6c7dcfb600 | 0x7f6c7d424a00 | 306661 | 306661 | 65536 | 2228224 | 328767 | 36724868 | 17704168966889 | 17704168930163 | 17704169301363 | 17704169302890 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7f6c80453480 | 0x7f6c7d424a40 | 304645 | 304645 | 65536 | 2097152 | 308947 | 34642688 | 17704169337869 | 17704169301363 | 17704169670484 | 17704169671881 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7f6c80453300 | 0x7f6c7d424a80 | 168251 | 168251 | 65536 | 2162688 | 319265 | 35691792 | 17704169706960 | 17704169670484 | 17704169956564 | 17704169958104 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7f6c80453180 | 0x7f6c7d424ac0 | 167746 | 167746 | 65536 | 2621440 | 406289 | 45504056 | 17704169992933 | 17704169956564 | 17704170249205 | 17704170251006 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7f6c80453000 | 0x7f6c7d424b00 | 166236 | 166236 | 65536 | 1966080 | 296329 | 33230512 | 17704170293235 | 17704170249205 | 17704170539445 | 17704170541049 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7f6c7dcfbe80 | 0x7f6c7d424b40 | 307321 | 307321 | 65536 | 2359296 | 352569 | 39484244 | 17704170576378 | 17704170539445 | 17704170907926 | 17704170909620 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7f6c7dcfbd00 | 0x7f6c7d424b80 | 304571 | 304571 | 65536 | 2228224 | 332634 | 37309124 | 17704170945119 | 17704170907926 | 17704171278967 | 17704171280530 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7f6c7dcfbb80 | 0x7f6c7d424bc0 | 169167 | 169167 | 65536 | 2293760 | 344091 | 38427532 | 17704171314759 | 17704171278967 | 17704171565527 | 17704171567143 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7f6c7dcfba00 | 0x7f6c7d424c00 | 169515 | 169515 | 65536 | 2752512 | 419782 | 47017872 | 17704171601222 | 17704171565527 | 17704171853687 | 17704171855086 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7f6c7dcfb880 | 0x7f6c7d424c40 | 168560 | 168560 | 65536 | 2031616 | 305455 | 34203368 | 17704171896545 | 17704171853687 | 17704172145208 | 17704172146799 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7f6c7dcfb700 | 0x7f6c7d424c80 | 305008 | 305008 | 65536 | 2490368 | 366195 | 40955016 | 17704172181818 | 17704172145208 | 17704172513689 | 17704172515219 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7f6c80453580 | 0x7f6c7d424cc0 | 305017 | 305017 | 65536 | 2359296 | 352260 | 39467964 | 17704172550388 | 17704172513689 | 17704172882329 | 17704172883810 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7f6c80453400 | 0x7f6c7d424d00 | 168850 | 168850 | 65536 | 2424832 | 368934 | 41229788 | 17704172919289 | 17704172882329 | 17704173165370 | 17704173166923 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7f6c80453280 | 0x7f6c7d424d40 | 171892 | 171892 | 65536 | 2949120 | 436967 | 48854712 | 17704173201462 | 17704173165370 | 17704173459450 | 17704173461095 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7f6c80453100 | 0x7f6c7d424d80 | 167754 | 167754 | 65536 | 2162688 | 322680 | 36173836 | 17704173503994 | 17704173459450 | 17704173748251 | 17704173749958 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7f6c7dcfbf80 | 0x7f6c7d424dc0 | 305880 | 305880 | 65536 | 2621440 | 387123 | 43391064 | 17704173785507 | 17704173748251 | 17704174117371 | 17704174119179 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7f6c7dcfbe00 | 0x7f6c7d424e00 | 303228 | 303228 | 65536 | 2490368 | 362497 | 40535292 | 17704174154778 | 17704174117371 | 17704174490012 | 17704174491490 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7f6c7dcfbc80 | 0x7f6c7d424e40 | 169642 | 169642 | 65536 | 2555904 | 379446 | 42484480 | 17704174525519 | 17704174490012 | 17704174777692 | 17704174779292 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7f6c7dcfbb00 | 0x7f6c7d424e80 | 176172 | 176172 | 65536 | 3145728 | 481896 | 53972432 | 17704174813882 | 17704174777692 | 17704175067773 | 17704175069345 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7f6c7dcfb980 | 0x7f6c7d424ec0 | 166678 | 166678 | 65536 | 2228224 | 326607 | 36711996 | 17704175111054 | 17704175067773 | 17704175356093 | 17704175357678 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7f6c7dcfb800 | 0x7f6c7d424f00 | 304181 | 304181 | 65536 | 2752512 | 406696 | 45458344 | 17704175392347 | 17704175356093 | 17704175727294 | 17704175728849 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7f6c7dcfb680 | 0x7f6c7d424f40 | 305152 | 305152 | 65536 | 2621440 | 387695 | 43464796 | 17704175762908 | 17704175727294 | 17704176098334 | 17704176099939 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7f6c80453500 | 0x7f6c7d424f80 | 168018 | 168018 | 65536 | 2686976 | 399160 | 44685680 | 17704176134368 | 17704176098334 | 17704176389855 | 17704176391472 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7f6c80453380 | 0x7f6c7d424fc0 | 181176 | 181176 | 65536 | 3342336 | 501317 | 56060580 | 17704176426461 | 17704176389855 | 17704176687935 | 17704176689405 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7f6c80453200 | 0x7f6c7d425000 | 167740 | 167740 | 65536 | 2359296 | 350615 | 39328332 | 17704176741973 | 17704176687935 | 17704176976736 | 17704176978527 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7f6c80453080 | 0x7f6c7d425040 | 302124 | 302124 | 65536 | 2883584 | 433830 | 48563020 | 17704177013466 | 17704176976736 | 17704177346177 | 17704177347738 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7f6c7dcfbf00 | 0x7f6c7d425080 | 299830 | 299830 | 65536 | 2686976 | 399693 | 44783316 | 17704177382207 | 17704177346177 | 17704177715617 | 17704177717249 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7f6c7dcfbd80 | 0x7f6c7d4250c0 | 168092 | 168092 | 65536 | 2818048 | 430303 | 48194572 | 17704177751738 | 17704177715617 | 17704178002978 | 17704178004712 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7f6c7dcfbc00 | 0x7f6c7d425100 | 192728 | 192728 | 65536 | 3538944 | 529984 | 59365900 | 17704178039201 | 17704178002978 | 17704178310818 | 17704178312654 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7f6c7dcfba80 | 0x7f6c7d425140 | 165674 | 165674 | 65536 | 2424832 | 362751 | 40601584 | 17704178354033 | 17704178310818 | 17704178603779 | 17704178605257 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7f6c7dcfb900 | 0x7f6c7d425180 | 307376 | 307376 | 65536 | 3014656 | 449675 | 50323204 | 17704178639926 | 17704178603779 | 17704178983459 | 17704178985057 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7f6c7dcfb780 | 0x7f6c7d4251c0 | 304466 | 304466 | 65536 | 2818048 | 431525 | 48287348 | 17704179020446 | 17704178983459 | 17704179356100 | 17704179357688 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7f6c7dcfb600 | 0x7f6c7d425200 | 168328 | 168328 | 65536 | 2949120 | 436666 | 48806608 | 17704179391767 | 17704179356100 | 17704179640900 | 17704179642610 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7f6c80453480 | 0x7f6c7d425240 | 200892 | 200892 | 65536 | 3735552 | 553500 | 61965708 | 17704179677450 | 17704179640900 | 17704179947461 | 17704179949133 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7f6c80453300 | 0x7f6c7d425280 | 168500 | 168500 | 65536 | 2555904 | 387538 | 43436088 | 17704179990562 | 17704179947461 | 17704180240261 | 17704180241795 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7f6c80453180 | 0x7f6c7d4252c0 | 306215 | 306215 | 65536 | 3145728 | 471334 | 52790384 | 17704180277864 | 17704180240261 | 17704180616902 | 17704180618606 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7f6c80453000 | 0x7f6c7d425300 | 302798 | 302798 | 65536 | 2949120 | 445943 | 49931896 | 17704180653395 | 17704180616902 | 17704180986343 | 17704180987917 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7f6c7dcfbe80 | 0x7f6c7d425340 | 168096 | 168096 | 65536 | 3080192 | 454786 | 50938888 | 17704181021666 | 17704180986343 | 17704181272263 | 17704181273999 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7f6c7dcfbd00 | 0x7f6c7d425380 | 209942 | 209942 | 65536 | 3932160 | 592130 | 66353396 | 17704181308309 | 17704181272263 | 17704181589384 | 17704181591021 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7f6c7dcfbb80 | 0x7f6c7d4253c0 | 166984 | 166984 | 65536 | 2621440 | 401803 | 44935552 | 17704181631940 | 17704181589384 | 17704181878824 | 17704181880404 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7f6c7dcfba00 | 0x7f6c7d425400 | 305356 | 305356 | 65536 | 3276800 | 488873 | 54731676 | 17704181915113 | 17704181878824 | 17704182249545 | 17704182251185 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7f6c7dcfb880 | 0x7f6c7d425440 | 302306 | 302306 | 65536 | 3080192 | 452995 | 50725176 | 17704182286034 | 17704182249545 | 17704182621545 | 17704182623305 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7f6c7dcfb700 | 0x7f6c7d425480 | 166960 | 166960 | 65536 | 3211264 | 469980 | 52659848 | 17704182657675 | 17704182621545 | 17704182905866 | 17704182907498 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7f6c80453580 | 0x7f6c7d4254c0 | 219510 | 219510 | 65536 | 4128768 | 613915 | 68774508 | 17704182941997 | 17704182905866 | 17704183223946 | 17704183225560 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7f6c80453400 | 0x7f6c7d425500 | 165036 | 165036 | 65536 | 2752512 | 418275 | 46836784 | 17704183267209 | 17704183223946 | 17704183513227 | 17704183514723 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7f6c80453280 | 0x7f6c7d425540 | 301720 | 301720 | 65536 | 3407872 | 508536 | 56888776 | 17704183550622 | 17704183513227 | 17704183880907 | 17704183882364 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7f6c80453100 | 0x7f6c7d425580 | 303460 | 303460 | 65536 | 3211264 | 480222 | 53865036 | 17704183917403 | 17704183880907 | 17704184257068 | 17704184258914 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7f6c7dcfbf80 | 0x7f6c7d4255c0 | 168986 | 168986 | 65536 | 3276800 | 518151 | 58160460 | 17704184293643 | 17704184257068 | 17704184543468 | 17704184545157 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7f6c7dcfbe00 | 0x7f6c7d425600 | 229139 | 229139 | 65536 | 4325376 | 645364 | 72308656 | 17704184579166 | 17704184543468 | 17704184867469 | 17704184869069 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7f6c7dcfbc80 | 0x7f6c7d425640 | 167758 | 167758 | 65536 | 2818048 | 417690 | 46803356 | 17704184910228 | 17704184867469 | 17704185157069 | 17704185158922 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7f6c7dcfbb00 | 0x7f6c7d425680 | 299459 | 299459 | 65536 | 3538944 | 524698 | 58820728 | 17704185193731 | 17704185157069 | 17704185523470 | 17704185525002 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7f6c7dcfb980 | 0x7f6c7d4256c0 | 306024 | 306024 | 65536 | 3407872 | 522287 | 58376396 | 17704185559322 | 17704185523470 | 17704185894991 | 17704185896703 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7f6c7dcfb800 | 0x7f6c7d425700 | 170315 | 170315 | 65536 | 3407872 | 556716 | 62351916 | 17704185930172 | 17704185894991 | 17704186182671 | 17704186184386 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7f6c7dcfb680 | 0x7f6c7d425740 | 238109 | 238109 | 65536 | 4521984 | 691065 | 77314756 | 17704186220505 | 17704186182671 | 17704186518192 | 17704186519777 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7f6c80453500 | 0x7f6c7d425780 | 169173 | 169173 | 65536 | 3014656 | 458787 | 51391772 | 17704186561396 | 17704186518192 | 17704186806192 | 17704186807800 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7f6c80453380 | 0x7f6c7d4257c0 | 302454 | 302454 | 65536 | 3801088 | 579074 | 64938744 | 17704186842419 | 17704186806192 | 17704187183953 | 17704187185711 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7f6c80453200 | 0x7f6c7d425800 | 300815 | 300815 | 65536 | 3670016 | 550214 | 61492068 | 17704187220330 | 17704187183953 | 17704187553073 | 17704187554562 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7f6c80453080 | 0x7f6c7d425840 | 172025 | 172025 | 65536 | 3670016 | 549019 | 61461248 | 17704187589121 | 17704187553073 | 17704187841394 | 17704187843004 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7f6c7dcfbf00 | 0x7f6c7d425880 | 259721 | 259721 | 65536 | 4915200 | 757092 | 84746412 | 17704187878063 | 17704187841394 | 17704188185394 | 17704188186986 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7f6c7dcfbd80 | 0x7f6c7d4258c0 | 168995 | 168995 | 65536 | 3145728 | 466523 | 52212692 | 17704188229435 | 17704188185394 | 17704188480755 | 17704188482378 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7f6c7dcfbc00 | 0x7f6c7d425900 | 298839 | 298839 | 65536 | 4063232 | 621606 | 69601032 | 17704188517047 | 17704188480755 | 17704188853236 | 17704188854909 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7f6c7dcfba80 | 0x7f6c7d425940 | 301633 | 301633 | 65536 | 3932160 | 593512 | 66430688 | 17704188889558 | 17704188853236 | 17704189224436 | 17704189226250 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7f6c7dcfb900 | 0x7f6c7d425980 | 178277 | 178277 | 65536 | 3932160 | 588443 | 65935496 | 17704189259979 | 17704189224436 | 17704189523637 | 17704189525242 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7f6c7dcfb780 | 0x7f6c7d4259c0 | 280199 | 280199 | 65536 | 5308416 | 792307 | 88715344 | 17704189560231 | 17704189523637 | 17704189882677 | 17704189884173 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7f6c7dcfb600 | 0x7f6c7d425a00 | 168553 | 168553 | 65536 | 3342336 | 500804 | 56093968 | 17704189927142 | 17704189882677 | 17704190178518 | 17704190180416 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7f6c80453480 | 0x7f6c7d425a40 | 300002 | 300002 | 65536 | 4325376 | 675469 | 75752580 | 17704190215475 | 17704190178518 | 17704190556438 | 17704190558086 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7f6c80453300 | 0x7f6c7d425a80 | 301273 | 301273 | 65536 | 4194304 | 640919 | 71863264 | 17704190593275 | 17704190556438 | 17704190929559 | 17704190931057 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7f6c80453180 | 0x7f6c7d425ac0 | 186280 | 186280 | 65536 | 4194304 | 633297 | 70937904 | 17704190965796 | 17704190929559 | 17704191229720 | 17704191231369 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7f6c80453000 | 0x7f6c7d425b00 | 300325 | 300325 | 65536 | 5701632 | 850477 | 95281112 | 17704191266508 | 17704191229720 | 17704191598360 | 17704191600070 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7f6c7dcfbe80 | 0x7f6c7d425b40 | 172934 | 172934 | 65536 | 3735552 | 562548 | 63081084 | 17704191641659 | 17704191598360 | 17704191888921 | 17704191890453 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7f6c7dcfbd00 | 0x7f6c7d425b80 | 302047 | 302047 | 65536 | 4849664 | 743572 | 83294680 | 17704191925262 | 17704191888921 | 17704192262361 | 17704192263853 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7f6c7dcfbb80 | 0x7f6c7d425bc0 | 304244 | 304244 | 65536 | 4718592 | 731748 | 81955996 | 17704192298133 | 17704192262361 | 17704192643002 | 17704192644554 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7f6c7dcfba00 | 0x7f6c7d425c00 | 206135 | 206135 | 65536 | 4718592 | 722436 | 80934076 | 17704192678263 | 17704192643002 | 17704192953882 | 17704192955516 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7f6c7dcfb880 | 0x7f6c7d425c40 | 340416 | 340416 | 65536 | 6488064 | 972403 | 108929700 | 17704192989545 | 17704192953882 | 17704193346843 | 17704193366746 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7f6c7dcfb700 | 0x7f6c7d425c80 | 183933 | 183933 | 65536 | 4128768 | 617542 | 69236980 | 17704193390635 | 17704193346843 | 17704193648924 | 17704193650718 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7f6c80453580 | 0x7f6c7d425cc0 | 303720 | 303720 | 65536 | 5373952 | 831013 | 93075408 | 17704193685338 | 17704193648924 | 17704194029404 | 17704194030939 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7f6c80453400 | 0x7f6c7d425d00 | 301763 | 301763 | 65536 | 5242880 | 834680 | 93529352 | 17704194066168 | 17704194029404 | 17704194417405 | 17704194419099 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7f6c80453280 | 0x7f6c7d425d40 | 226000 | 226000 | 65536 | 5242880 | 783753 | 87803004 | 17704194453958 | 17704194417405 | 17704194742045 | 17704194743731 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7f6c80453100 | 0x7f6c7d425d80 | 381672 | 381672 | 65536 | 7274496 | 1102848 | 123473236 | 17704194778700 | 17704194742045 | 17704195167166 | 17704195188440 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7f6c7dcfbf80 | 0x7f6c7d425dc0 | 211164 | 211164 | 65536 | 4915200 | 736133 | 82422488 | 17704195210879 | 17704195167166 | 17704195487967 | 17704195489702 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7f6c7dcfbe00 | 0x7f6c7d425e00 | 306329 | 306329 | 65536 | 6422528 | 1006174 | 112663736 | 17704195523561 | 17704195487967 | 17704195865887 | 17704195886792 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7f6c7dcfbc80 | 0x7f6c7d425e40 | 311818 | 311818 | 65536 | 6291456 | 1017071 | 113963012 | 17704195901812 | 17704195865887 | 17704196251008 | 17704196271422 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7f6c7dcfbb00 | 0x7f6c7d425e80 | 265845 | 265845 | 65536 | 6291456 | 956078 | 106910056 | 17704196286122 | 17704196251008 | 17704196601728 | 17704196603384 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7f6c7dcfb980 | 0x7f6c7d425ec0 | 461636 | 461636 | 65536 | 8847360 | 1335882 | 149643144 | 17704196637363 | 17704196601728 | 17704197072929 | 17704197090572 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7f6c7dcfb800 | 0x7f6c7d425f00 | 242417 | 242417 | 65536 | 5701632 | 865558 | 97070268 | 17704197116371 | 17704197072929 | 17704197411810 | 17704197413534 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7f6c7dcfb680 | 0x7f6c7d425f40 | 335820 | 335820 | 65536 | 7471104 | 1196898 | 134020200 | 17704197447613 | 17704197411810 | 17704197813410 | 17704197831443 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7f6c80453500 | 0x7f6c7d425f80 | 331829 | 331829 | 65536 | 7340032 | 1176522 | 131743572 | 17704197849603 | 17704197813410 | 17704198215651 | 17704198234023 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7f6c80453380 | 0x7f6c7d425fc0 | 306688 | 306688 | 65536 | 7340032 | 1123154 | 125770792 | 17704198252353 | 17704198215651 | 17704198595972 | 17704198597674 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7f6c80453200 | 0x7f6c7d426000 | 542348 | 542348 | 65536 | 10420224 | 1588521 | 177877532 | 17704198631953 | 17704198595972 | 17704199118213 | 17704199135741 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7f6c80453080 | 0x7f6c7d426040 | 272767 | 272767 | 65536 | 6488064 | 999128 | 111905856 | 17704199162340 | 17704199118213 | 17704199479013 | 17704199480502 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7f6c7dcfbf00 | 0x7f6c7d426080 | 364792 | 364792 | 65536 | 8519680 | 1349671 | 151174388 | 17704199515811 | 17704199479013 | 17704199894854 | 17704199913311 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7f6c7dcfbd80 | 0x7f6c7d4260c0 | 364843 | 364843 | 65536 | 8388608 | 1320151 | 147880736 | 17704199932191 | 17704199894854 | 17704200315815 | 17704200333221 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7f6c7dcfbc00 | 0x7f6c7d426100 | 348454 | 348454 | 65536 | 8388608 | 1299781 | 145533968 | 17704200352600 | 17704200315815 | 17704200716775 | 17704200735411 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7f6c7dcfba80 | 0x7f6c7d426140 | 625393 | 625393 | 65536 | 11993088 | 1819930 | 203817112 | 17704200753070 | 17704200716775 | 17704201292296 | 17704201309556 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7f6c7dcfb900 | 0x7f6c7d426180 | 303836 | 303836 | 65536 | 7274496 | 1127943 | 126332228 | 17704201336255 | 17704201292296 | 17704201673577 | 17704201675237 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7f6c7dcfb780 | 0x7f6c7d4261c0 | 396271 | 396271 | 65536 | 9568256 | 1520445 | 170314324 | 17704201708936 | 17704201673577 | 17704202112298 | 17704202129896 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7f6c7dcfb600 | 0x7f6c7d426200 | 390629 | 390629 | 65536 | 9437184 | 1514911 | 169741156 | 17704202150725 | 17704202112298 | 17704202554218 | 17704202572194 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7f6c80453480 | 0x7f6c7d426240 | 388489 | 388489 | 65536 | 9437184 | 1477661 | 165596200 | 17704202590044 | 17704202554218 | 17704202981739 | 17704202999584 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7f6c80453300 | 0x7f6c7d426280 | 719911 | 719911 | 65536 | 16056320 | 2303651 | 257991612 | 17704203018193 | 17704202981739 | 17704203622860 | 17704203640818 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7f6c80453180 | 0x7f6c7d4262c0 | 363315 | 363315 | 65536 | 8847360 | 1372036 | 153628960 | 17704203667237 | 17704203622860 | 17704204042861 | 17704204059437 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7f6c80453000 | 0x7f6c7d426300 | 468935 | 468935 | 65536 | 11665408 | 1827708 | 204568404 | 17704204079127 | 17704204042861 | 17704204535502 | 17704204553735 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7f6c7dcfbe80 | 0x7f6c7d426340 | 470477 | 470477 | 65536 | 11468800 | 1808106 | 202548488 | 17704204571664 | 17704204535502 | 17704205023822 | 17704205042582 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7f6c7dcfbd00 | 0x7f6c7d426380 | 483540 | 483540 | 65536 | 14090240 | 2021979 | 226372164 | 17704205059392 | 17704205023822 | 17704205516143 | 17704205534070 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7f6c7dcfbb80 | 0x7f6c7d4263c0 | 879252 | 879252 | 65536 | 19202048 | 2758128 | 308795244 | 17704205552589 | 17704205516143 | 17704206261904 | 17704206280681 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7f6c7dcfba00 | 0x7f6c7d426400 | 427638 | 427638 | 65536 | 10420224 | 1593972 | 178497680 | 17704206306760 | 17704206261904 | 17704206725425 | 17704206769799 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7f6c7dcfb880 | 0x7f6c7d426440 | 548689 | 548689 | 65536 | 13762560 | 2199715 | 246293920 | 17704206780649 | 17704206725425 | 17704207296626 | 17704207340744 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7f6c7dcfb700 | 0x7f6c7d426480 | 550682 | 550682 | 65536 | 13565952 | 2138111 | 239336248 | 17704207351754 | 17704207296626 | 17704207864947 | 17704207909520 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7f6c80453580 | 0x7f6c7d4264c0 | 563359 | 563359 | 65536 | 15466496 | 2232725 | 250066464 | 17704207920280 | 17704207864947 | 17704208432468 | 17704208476886 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7f6c80453400 | 0x7f6c7d426500 | 1041654 | 1041654 | 65536 | 22347776 | 3212046 | 359821336 | 17704208487146 | 17704208432468 | 17704209307989 | 17704209352904 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7f6c80453280 | 0x7f6c7d426540 | 720055 | 720055 | 65536 | 20250624 | 2907213 | 325648160 | 17704209372783 | 17704209307989 | 17704209971511 | 17704210016437 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7f6c80453100 | 0x7f6c7d426580 | 722738 | 722738 | 65536 | 20447232 | 2940129 | 329197616 | 17704210027507 | 17704209971511 | 17704210679672 | 17704210699210 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7f6c7dcfbf80 | 0x7f6c7d4265c0 | 721833 | 721833 | 65536 | 19595264 | 2824863 | 316435572 | 17704210715960 | 17704210679672 | 17704211334713 | 17704211352754 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7f6c7dcfbe00 | 0x7f6c7d426600 | 726275 | 726275 | 65536 | 20381696 | 2934425 | 328691172 | 17704211370413 | 17704211334713 | 17704211977114 | 17704211997108 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7f6c7dcfbc80 | 0x7f6c7d426640 | 1365971 | 1365971 | 65536 | 31522816 | 4513966 | 505673184 | 17704212013457 | 17704211977149 | 17704213034110 | 17704213083370 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7f6c7dcfbb00 | 0x7f6c7d426680 | 1370661 | 1370661 | 65536 | 38993920 | 5588263 | 625770684 | 17704213102340 | 17704213034110 | 17704214126111 | 17704214153534 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7f6c7dcfb980 | 0x7f6c7d4266c0 | 1372709 | 1372709 | 65536 | 39124992 | 5605493 | 627872544 | 17704214165143 | 17704214126111 | 17704215237153 | 17704215303345 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7f6c7dcfb800 | 0x7f6c7d426700 | 1370309 | 1370309 | 65536 | 38469632 | 5509750 | 617037956 | 17704215314814 | 17704215237153 | 17704216371235 | 17704216414197 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7f6c7dcfb680 | 0x7f6c7d426740 | 1376183 | 1376183 | 65536 | 39059456 | 5598144 | 627004592 | 17704216425886 | 17704216371235 | 17704217462437 | 17704217503639 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7f6c80453500 | 0x7f6c7d426780 | 2662517 | 2662517 | 65536 | 60489728 | 8653646 | 969020212 | 17704217514989 | 17704217462437 | 17704219402280 | 17704219455750 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7f6c80453380 | 0x7f6c7d4267c0 | 2669105 | 2669105 | 65536 | 77266944 | 11060372 | 1238524332 | 17704219475740 | 17704219402280 | 17704221317164 | 17704221357712 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7f6c80453200 | 0x7f6c7d426800 | 2669052 | 2669052 | 65536 | 77398016 | 11071730 | 1240048880 | 17704221369542 | 17704221317164 | 17704223268527 | 17704223314293 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7f6c80453080 | 0x7f6c7d426840 | 2670134 | 2670134 | 65536 | 76218368 | 10904022 | 1221319080 | 17704223326273 | 17704223268527 | 17704225220690 | 17704225261974 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7f6c7dcfbf00 | 0x7f6c7d426880 | 2672739 | 2672739 | 65536 | 77332480 | 11064825 | 1239334608 | 17704225273134 | 17704225220690 | 17704227124854 | 17704227194456 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 229387 | 229387 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7f6c7dcfbd80 | 0x7f6c7d4268c0 | 5257738 | 5257738 | 65536 | 120258560 | 17189281 | 1925701096 | 17704227207336 | 17704227124854 | 17704230750140 | 17704230818275 |