43 KiB
43 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | SQ_INSTS_VMEM | SQ_INST_LEVEL_VMEM | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBuffer.kd | 0 | 0 | 0 | 921153 | 921158 | 33554432 | 256 | 0 | 0 | 8 | 32 | 6464 | 0x0 | 0x7fbf7ac04180 | 1048576 | 11001658 | 1408052856 | 12076324607361092 | 12076324851578856 | 12076324851903654 | 12076324852039846 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 921153 | 921158 | 32768 | 256 | 0 | 0 | 24 | 24 | 12480 | 0x0 | 0x7fbf7ac35100 | 4096 | 113289 | 14479660 | 12076324866554932 | 12076324866851777 | 12076324866858017 | 12076324866863235 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 4 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 12928 | 0x7fc0aab91900 | 0x7fbf7ac35140 | 524288 | 12401318 | 1587311276 | 12076324866927514 | 12076324867148415 | 12076324867279615 | 12076324867283767 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 6 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 36 | 24 | 13632 | 0x7fc0aab91800 | 0x7fbf7ac35180 | 524288 | 13924068 | 1782351476 | 12076324867354438 | 12076324867525693 | 12076324867773532 | 12076324867842695 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 8 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 14080 | 0x7fc0aab91700 | 0x7fbf7ac351c0 | 524288 | 14366779 | 1838880984 | 12076324867872430 | 12076324868062971 | 12076324868314809 | 12076324868383570 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 10 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14528 | 0x7fc0aab91600 | 0x7fbf7ac35200 | 524288 | 11167660 | 1429516928 | 12076324868408617 | 12076324868594968 | 12076324868731607 | 12076324868735214 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 12 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14976 | 0x7fc0aab91500 | 0x7fbf7ac35240 | 524288 | 12212582 | 1563143728 | 12076324868785387 | 12076324868956246 | 12076324869088885 | 12076324869092698 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 14 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 15424 | 0x7fc0aab91400 | 0x7fbf7ac35280 | 524288 | 12734855 | 1630074280 | 12076324869171385 | 12076324869342644 | 12076324869472563 | 12076324869476321 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 16 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16128 | 0x7fc0aab91300 | 0x7fbf7ac352c0 | 524288 | 13905355 | 1779832888 | 12076324869526575 | 12076324869705202 | 12076324869958961 | 12076324870005104 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 18 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16832 | 0x7fc0aab91a00 | 0x7fbf7ac35300 | 524288 | 13638895 | 1745720368 | 12076324870031794 | 12076324870211280 | 12076324870466638 | 12076324870507167 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 20 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 17536 | 0x7fc0aab91900 | 0x7fbf7ac35340 | 524288 | 11953865 | 1530028984 | 12076324870530250 | 12076324870718637 | 12076324870851916 | 12076324870855575 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 22 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18240 | 0x7fc0aab91800 | 0x7fbf7ac35380 | 524288 | 11019037 | 1410452988 | 12076324870903554 | 12076324871079435 | 12076324871216235 | 12076324871220112 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 24 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18944 | 0x7fc0aab91700 | 0x7fbf7ac353c0 | 524288 | 12347166 | 1580393688 | 12076324871281817 | 12076324871445993 | 12076324871577833 | 12076324871581554 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 26 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 19904 | 0x7fc0aab91600 | 0x7fbf7ac35400 | 524288 | 14251323 | 1824182664 | 12076324871624504 | 12076324871801512 | 12076324872056070 | 12076324872124513 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 28 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 20608 | 0x7fc0aab91500 | 0x7fbf7ac35440 | 524288 | 14134381 | 1809184948 | 12076324872148016 | 12076324872336869 | 12076324872590788 | 12076324872657093 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 30 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 21312 | 0x7fc0aab91400 | 0x7fbf7ac35480 | 524288 | 12003708 | 1536401320 | 12076324872680987 | 12076324872859106 | 12076324872992066 | 12076324872995692 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 32 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22016 | 0x7fc0aab91300 | 0x7fbf7ac354c0 | 524288 | 12761839 | 1633550800 | 12076324873044783 | 12076324873215584 | 12076324873345824 | 12076324873349419 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 34 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22720 | 0x7fc0aab91a00 | 0x7fbf7ac35500 | 524288 | 12355665 | 1581510772 | 12076324873408950 | 12076324873572063 | 12076324873703742 | 12076324873707294 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 36 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 23680 | 0x7fc0aab91900 | 0x7fbf7ac35540 | 524288 | 13960437 | 1786860424 | 12076324873758660 | 12076324873919901 | 12076324874172059 | 12076324874214918 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 38 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 24384 | 0x7fc0aab91800 | 0x7fbf7ac35580 | 524288 | 14296440 | 1829925976 | 12076324874237069 | 12076324874424378 | 12076324874672537 | 12076324874713925 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 40 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25088 | 0x7fc0aab91700 | 0x7fbf7ac355c0 | 524288 | 11419318 | 1461579156 | 12076324874735505 | 12076324874917976 | 12076324875052855 | 12076324875056792 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 42 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25792 | 0x7fc0aab91600 | 0x7fbf7ac35600 | 524288 | 12716538 | 1627629044 | 12076324875107927 | 12076324875278934 | 12076324875409173 | 12076324875413004 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 44 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 26496 | 0x7fc0aab91500 | 0x7fbf7ac35640 | 524288 | 12786121 | 1636755892 | 12076324875472425 | 12076324875634612 | 12076324875764851 | 12076324875768585 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 46 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 27712 | 0x7fc0aab91400 | 0x7fbf7ac35680 | 524288 | 13985714 | 1790158532 | 12076324875816554 | 12076324875982770 | 12076324876235249 | 12076324876303439 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 48 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 28416 | 0x7fc0aab91300 | 0x7fbf7ac356c0 | 524288 | 13560902 | 1735756300 | 12076324876330079 | 12076324876507248 | 12076324876758446 | 12076324876825439 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 50 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 29120 | 0x7fc0aab91a00 | 0x7fbf7ac35700 | 524288 | 11718659 | 1499951512 | 12076324876850366 | 12076324877034445 | 12076324877168204 | 12076324877171973 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 52 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30080 | 0x7fc0aab91900 | 0x7fbf7ac35740 | 524288 | 12932359 | 1655304508 | 12076324877219902 | 12076324877389163 | 12076324877519402 | 12076324877523086 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 54 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30784 | 0x7fc0aab91800 | 0x7fbf7ac35780 | 524288 | 12610659 | 1614160584 | 12076324877581434 | 12076324877741481 | 12076324877871401 | 12076324877875140 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 56 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32000 | 0x7fc0aab91700 | 0x7fbf7ac357c0 | 524288 | 14065498 | 1800337208 | 12076324877923720 | 12076324878115879 | 12076324878372038 | 12076324878439409 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 58 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32960 | 0x7fc0aab91600 | 0x7fbf7ac35800 | 524288 | 14390289 | 1841900872 | 12076324878466319 | 12076324878642597 | 12076324878896835 | 12076324878963042 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 60 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 33920 | 0x7fc0aab91500 | 0x7fbf7ac35840 | 524288 | 11632795 | 1488875344 | 12076324878988389 | 12076324879172194 | 12076324879307713 | 12076324879311890 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 62 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 34880 | 0x7fc0aab91400 | 0x7fbf7ac35880 | 524288 | 13041589 | 1669311224 | 12076324879360360 | 12076324879526272 | 12076324879656991 | 12076324879660839 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 64 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 35840 | 0x7fc0aab91300 | 0x7fbf7ac358c0 | 524288 | 13141993 | 1682249604 | 12076324879722754 | 12076324879885790 | 12076324880014110 | 12076324880017852 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 66 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 37312 | 0x7fc0aab91a00 | 0x7fbf7ac35900 | 524288 | 13903488 | 1779637896 | 12076324880067464 | 12076324880239229 | 12076324880495707 | 12076324880563456 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 68 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 38272 | 0x7fc0aab91900 | 0x7fbf7ac35940 | 524288 | 13863049 | 1774444876 | 12076324880586780 | 12076324880772026 | 12076324881022745 | 12076324881091307 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 70 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 39232 | 0x7fc0aab91800 | 0x7fbf7ac35980 | 524288 | 12585259 | 1610915156 | 12076324881119910 | 12076324881299543 | 12076324881430582 | 12076324881434365 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 72 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 40192 | 0x7fc0aab91700 | 0x7fbf7ac359c0 | 524288 | 12147124 | 1554843264 | 12076324881482705 | 12076324881653941 | 12076324881787221 | 12076324881791128 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 74 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 41152 | 0x7fc0aab91600 | 0x7fbf7ac35a00 | 524288 | 12065079 | 1544321884 | 12076324881850709 | 12076324882012339 | 12076324882144979 | 12076324882148993 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 76 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 42624 | 0x7fc0aab91500 | 0x7fbf7ac35a40 | 524288 | 13593200 | 1739929944 | 12076324882196461 | 12076324882368338 | 12076324882625456 | 12076324882691912 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 78 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 43584 | 0x7fc0aab91400 | 0x7fbf7ac35a80 | 524288 | 14200515 | 1817602084 | 12076324882713462 | 12076324882892175 | 12076324883145294 | 12076324883216226 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 80 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 44544 | 0x7fc0aab91300 | 0x7fbf7ac35ac0 | 524288 | 12974942 | 1660889500 | 12076324883238357 | 12076324883418092 | 12076324883547532 | 12076324883551209 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 82 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 45760 | 0x7fc0aab91a00 | 0x7fbf7ac35b00 | 524288 | 12389424 | 1585815896 | 12076324883599499 | 12076324883764651 | 12076324883896810 | 12076324883900618 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 84 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 46720 | 0x7fc0aab91900 | 0x7fbf7ac35b40 | 524288 | 12579260 | 1610101880 | 12076324883959738 | 12076324884128009 | 12076324884258248 | 12076324884262240 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 86 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 48448 | 0x7fc0aab91800 | 0x7fbf7ac35b80 | 524288 | 13798283 | 1766179384 | 12076324884310390 | 12076324884477287 | 12076324884741606 | 12076324884808636 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 88 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 49408 | 0x7fc0aab91700 | 0x7fbf7ac35bc0 | 524288 | 13967280 | 1787765120 | 12076324884832991 | 12076324885007524 | 12076324885301443 | 12076324885368246 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 90 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 50368 | 0x7fc0aab91600 | 0x7fbf7ac35c00 | 524288 | 12768928 | 1634420072 | 12076324885393152 | 12076324885575521 | 12076324885705281 | 12076324885709039 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 92 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 51584 | 0x7fc0aab91500 | 0x7fbf7ac35c40 | 524288 | 11048220 | 1414101748 | 12076324885756788 | 12076324885922719 | 12076324886059999 | 12076324886063758 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 94 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 52544 | 0x7fc0aab91400 | 0x7fbf7ac35c80 | 524288 | 11869975 | 1519411292 | 12076324886124431 | 12076324886288158 | 12076324886420317 | 12076324886424038 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 96 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 54272 | 0x7fc0aab91300 | 0x7fbf7ac35cc0 | 524288 | 12994597 | 1663228396 | 12076324886468681 | 12076324886637116 | 12076324886906874 | 12076324886949354 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 98 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 55488 | 0x7fc0aab91a00 | 0x7fbf7ac35d00 | 524288 | 14232764 | 1821788460 | 12076324886975783 | 12076324887154713 | 12076324887406712 | 12076324887475632 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 100 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 56704 | 0x7fc0aab91900 | 0x7fbf7ac35d40 | 524288 | 13097771 | 1676571164 | 12076324887499006 | 12076324887675351 | 12076324887804150 | 12076324887808080 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 102 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 58176 | 0x7fc0aab91800 | 0x7fbf7ac35d80 | 524288 | 9712685 | 1243268284 | 12076324887858624 | 12076324888030709 | 12076324888172788 | 12076324888176825 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 104 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 59392 | 0x7fc0aab91700 | 0x7fbf7ac35dc0 | 524288 | 11709071 | 1498779836 | 12076324888236827 | 12076324888397907 | 12076324888531026 | 12076324888534821 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 106 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 61376 | 0x7fc0aab91600 | 0x7fbf7ac35e00 | 524288 | 14539178 | 1861072408 | 12076324888582319 | 12076324888746865 | 12076324889014544 | 12076324889081958 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 108 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 62592 | 0x7fc0aab91500 | 0x7fbf7ac35e40 | 524288 | 14171868 | 1814021376 | 12076324889105682 | 12076324889292942 | 12076324889544781 | 12076324889611411 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 110 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 63808 | 0x7fc0aab91400 | 0x7fbf7ac35e80 | 524288 | 11767035 | 1506177424 | 12076324889635867 | 12076324889818380 | 12076324889993419 | 12076324889997218 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 112 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 65280 | 0x7fc0aab91300 | 0x7fbf7ac35ec0 | 524288 | 9202080 | 1177852572 | 12076324890047051 | 12076324890215818 | 12076324890356777 | 12076324890360614 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 114 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 66496 | 0x7fc0aab91a00 | 0x7fbf7ac35f00 | 524288 | 12333047 | 1578665472 | 12076324890422609 | 12076324890583496 | 12076324890714055 | 12076324890718158 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 116 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 68480 | 0x7fc0aab91900 | 0x7fbf7ac35f40 | 524288 | 13147150 | 1682780388 | 12076324890763743 | 12076324890932934 | 12076324891196933 | 12076324891267369 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 118 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 69696 | 0x7fc0aab91800 | 0x7fbf7ac35f80 | 524288 | 14153714 | 1811632852 | 12076324891292906 | 12076324891468931 | 12076324891717890 | 12076324891784791 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 120 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 70912 | 0x7fc0aab91700 | 0x7fbf7ac35fc0 | 524288 | 11152062 | 1427486812 | 12076324891810709 | 12076324891983809 | 12076324892118048 | 12076324892122168 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 122 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 72384 | 0x7fc0aab91600 | 0x7fbf7ac36000 | 524288 | 7595469 | 972160732 | 12076324892171249 | 12076324892335487 | 12076324892475806 | 12076324892479612 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 124 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 73600 | 0x7fc0aab91500 | 0x7fbf7ac36040 | 524288 | 12148182 | 1554948808 | 12076324892538181 | 12076324892695805 | 12076324892828924 | 12076324892832708 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 126 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 75840 | 0x7fc0aab91400 | 0x7fbf7ac36080 | 524288 | 13124035 | 1679848188 | 12076324892880517 | 12076324893070203 | 12076324893331802 | 12076324893381418 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 128 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 77056 | 0x7fc0aab91300 | 0x7fbf7ac360c0 | 524288 | 14233274 | 1821792808 | 12076324893405332 | 12076324893586040 | 12076324893839159 | 12076324893888650 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 130 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 78272 | 0x7fc0aab91a00 | 0x7fbf7ac36100 | 524288 | 12840930 | 1643719556 | 12076324893913857 | 12076324894095478 | 12076324894224117 | 12076324894228342 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 132 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 80000 | 0x7fc0aab91900 | 0x7fbf7ac36140 | 524288 | 7040782 | 901187228 | 12076324894275089 | 12076324894446196 | 12076324894590355 | 12076324894594292 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 134 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 81216 | 0x7fc0aab91800 | 0x7fbf7ac36180 | 524288 | 12809973 | 1639613120 | 12076324894654794 | 12076324894813234 | 12076324894943473 | 12076324894947218 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 136 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 83456 | 0x7fc0aab91700 | 0x7fbf7ac361c0 | 524288 | 14132386 | 1808914756 | 12076324894994185 | 12076324895168432 | 12076324895433711 | 12076324895484486 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 138 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 84928 | 0x7fc0aab91600 | 0x7fbf7ac36200 | 524288 | 13678968 | 1750855192 | 12076324895509914 | 12076324895688270 | 12076324895938348 | 12076324895987581 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 140 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 86400 | 0x7fc0aab91500 | 0x7fbf7ac36240 | 524288 | 11779596 | 1507833372 | 12076324896020793 | 12076324896204907 | 12076324896338986 | 12076324896342932 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 142 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 88128 | 0x7fc0aab91400 | 0x7fbf7ac36280 | 524288 | 5370329 | 687500044 | 12076324896392764 | 12076324896558985 | 12076324896710184 | 12076324896714011 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 144 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 89600 | 0x7fc0aab91300 | 0x7fbf7ac362c0 | 524288 | 12296817 | 1573999032 | 12076324896791876 | 12076324896949543 | 12076324897081543 | 12076324897085722 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 146 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 92096 | 0x7fc0aab91a00 | 0x7fbf7ac36300 | 524288 | 11501488 | 1472202096 | 12076324897134282 | 12076324897305541 | 12076324897573540 | 12076324897596201 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 148 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 93568 | 0x7fc0aab91900 | 0x7fbf7ac36340 | 524288 | 13320122 | 1704983752 | 12076324897638279 | 12076324897797219 | 12076324898055458 | 12076324898107120 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 150 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 95040 | 0x7fc0aab91800 | 0x7fbf7ac36380 | 524288 | 12016359 | 1538034476 | 12076324898134050 | 12076324898310816 | 12076324898443616 | 12076324898447503 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 152 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 96768 | 0x7fc0aab91700 | 0x7fbf7ac363c0 | 524288 | 4326131 | 553723324 | 12076324898495282 | 12076324898661854 | 12076324898819294 | 12076324898823261 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 154 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 98240 | 0x7fc0aab91600 | 0x7fbf7ac36400 | 524288 | 12239178 | 1566613400 | 12076324898883263 | 12076324899049212 | 12076324899182172 | 12076324899186055 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 156 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 100736 | 0x7fc0aab91500 | 0x7fbf7ac36440 | 524288 | 12133403 | 1553101152 | 12076324899233854 | 12076324899407131 | 12076324899674489 | 12076324899722693 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 158 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 102208 | 0x7fc0aab91400 | 0x7fbf7ac36480 | 524288 | 13469460 | 1724089464 | 12076324899748821 | 12076324899922648 | 12076324900183607 | 12076324900237450 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 160 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 103680 | 0x7fc0aab91300 | 0x7fbf7ac364c0 | 524288 | 10572687 | 1353220160 | 12076324900264750 | 12076324900443285 | 12076324900583285 | 12076324900586959 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 162 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 105664 | 0x7fc0aab91a00 | 0x7fbf7ac36500 | 524288 | 4142103 | 530260360 | 12076324900636742 | 12076324900810483 | 12076324900976403 | 12076324900980340 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 164 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 107136 | 0x7fc0aab91900 | 0x7fbf7ac36540 | 524288 | 12008178 | 1537017356 | 12076324901042836 | 12076324901205361 | 12076324901338641 | 12076324901342203 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 166 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 109888 | 0x7fc0aab91800 | 0x7fbf7ac36580 | 524288 | 9834726 | 1258810876 | 12076324901393728 | 12076324901555280 | 12076324901821678 | 12076324901867108 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 168 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 111360 | 0x7fc0aab91700 | 0x7fbf7ac365c0 | 524288 | 14102675 | 1805176040 | 12076324901893748 | 12076324902072877 | 12076324902326636 | 12076324902374351 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 170 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 112832 | 0x7fc0aab91600 | 0x7fbf7ac36600 | 524288 | 10607477 | 1357736056 | 12076324902401040 | 12076324902577194 | 12076324902715754 | 12076324902719783 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 172 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 114816 | 0x7fc0aab91500 | 0x7fbf7ac36640 | 524288 | 3527276 | 451413128 | 12076324902766670 | 12076324902933033 | 12076324903106952 | 12076324903111360 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 174 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 116288 | 0x7fc0aab91400 | 0x7fbf7ac36680 | 524288 | 12880722 | 1648750984 | 12076324903171562 | 12076324903335751 | 12076324903465030 | 12076324903468805 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 176 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 119040 | 0x7fc0aab91300 | 0x7fbf7ac366c0 | 524288 | 9146419 | 1170760916 | 12076324903512506 | 12076324903682309 | 12076324903939907 | 12076324903986697 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 178 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 120768 | 0x7fc0aab91a00 | 0x7fbf7ac36700 | 524288 | 14038124 | 1796871968 | 12076324904016483 | 12076324904198306 | 12076324904453505 | 12076324904502616 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 180 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 122496 | 0x7fc0aab91900 | 0x7fbf7ac36740 | 524288 | 10574105 | 1353496756 | 12076324904529416 | 12076324904710464 | 12076324904849663 | 12076324904853478 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 182 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 124736 | 0x7fc0aab91800 | 0x7fbf7ac36780 | 524288 | 3457399 | 442518116 | 12076324904902720 | 12076324905072382 | 12076324905255741 | 12076324905259603 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 184 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 126464 | 0x7fc0aab91700 | 0x7fbf7ac367c0 | 524288 | 10207108 | 1306525100 | 12076324905320226 | 12076324905479740 | 12076324905664379 | 12076324905668333 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 186 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 127936 | 0x7fc0aab91600 | 0x7fbf7ac36800 | 524288 | 4125913 | 528139660 | 12076324905718255 | 12076324905879578 | 12076324906178616 | 12076324906225939 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 188 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 129664 | 0x7fc0aab91500 | 0x7fbf7ac36840 | 524288 | 13900881 | 1779277944 | 12076324906251737 | 12076324906430775 | 12076324906685333 | 12076324906733031 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 190 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 131392 | 0x7fc0aab91400 | 0x7fbf7ac36880 | 524288 | 11632847 | 1488971872 | 12076324906758919 | 12076324906931732 | 12076324907066132 | 12076324907069937 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 192 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 133632 | 0x7fc0aab91300 | 0x7fbf7ac368c0 | 524288 | 3437352 | 439997196 | 12076324907120692 | 12076324907290770 | 12076324907482769 | 12076324907530934 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 194 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 135360 | 0x7fc0aab91a00 | 0x7fbf7ac36900 | 524288 | 11389714 | 1457913640 | 12076324907569756 | 12076324907729168 | 12076324907864207 | 12076324907868001 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 196 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 136832 | 0x7fc0aab91900 | 0x7fbf7ac36940 | 524288 | 2914743 | 373162536 | 12076324907916030 | 12076324908096526 | 12076324908381805 | 12076324908430977 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 198 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 138560 | 0x7fc0aab91800 | 0x7fbf7ac36980 | 524288 | 13932315 | 1783280116 | 12076324908456384 | 12076324908633324 | 12076324908892522 | 12076324908913363 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 200 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 140288 | 0x7fc0aab91700 | 0x7fbf7ac369c0 | 524288 | 10430768 | 1335016856 | 12076324908955692 | 12076324909121001 | 12076324909261160 | 12076324909265337 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 202 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 142784 | 0x7fc0aab91600 | 0x7fbf7ac36a00 | 524288 | 3351105 | 429074216 | 12076324909313978 | 12076324909480199 | 12076324909690118 | 12076324909737725 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 204 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 144768 | 0x7fc0aab91500 | 0x7fbf7ac36a40 | 524288 | 10451016 | 1337718216 | 12076324909776077 | 12076324909934917 | 12076324910073476 | 12076324910077457 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 206 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 145728 | 0x7fc0aab91400 | 0x7fbf7ac36a80 | 524288 | 2564820 | 328282864 | 12076324910127720 | 12076324910298755 | 12076324910608673 | 12076324910655411 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 208 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 147712 | 0x7fc0aab91300 | 0x7fbf7ac36ac0 | 524288 | 14030770 | 1795889424 | 12076324910681670 | 12076324910854752 | 12076324911109951 | 12076324911160049 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 210 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 149696 | 0x7fc0aab91a00 | 0x7fbf7ac36b00 | 524288 | 10435639 | 1335811920 | 12076324911186838 | 12076324911362910 | 12076324911502109 | 12076324911506032 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 212 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 152192 | 0x7fc0aab91900 | 0x7fbf7ac36b40 | 524288 | 3233595 | 413830248 | 12076324911554852 | 12076324911720828 | 12076324911982426 | 12076324912029735 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 214 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 154176 | 0x7fc0aab91800 | 0x7fbf7ac36b80 | 524288 | 10017803 | 1282209860 | 12076324912064670 | 12076324912235865 | 12076324912375864 | 12076324912379866 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 216 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 155648 | 0x7fc0aab91700 | 0x7fbf7ac36bc0 | 524288 | 2492896 | 319050360 | 12076324912427394 | 12076324912594263 | 12076324912925782 | 12076324912947611 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 218 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 157632 | 0x7fc0aab91600 | 0x7fbf7ac36c00 | 524288 | 12895056 | 1650572240 | 12076324912984680 | 12076324913146900 | 12076324913407379 | 12076324913456707 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 220 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 159616 | 0x7fc0aab91500 | 0x7fbf7ac36c40 | 524288 | 10583640 | 1354717808 | 12076324913478728 | 12076324913656658 | 12076324913796497 | 12076324913800476 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 222 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 162368 | 0x7fc0aab91400 | 0x7fbf7ac36c80 | 524288 | 3376223 | 432037936 | 12076324913848214 | 12076324914015216 | 12076324914261135 | 12076324914308670 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 224 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 164608 | 0x7fc0aab91300 | 0x7fbf7ac36cc0 | 524288 | 9625041 | 1232048032 | 12076324914345469 | 12076324914511300 | 12076324914651460 | 12076324914658581 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 226 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 166336 | 0x7fc0aab91a00 | 0x7fbf7ac36d00 | 524288 | 2385143 | 305245444 | 12076324914705838 | 12076324914865378 | 12076324915242656 | 12076324915293090 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 228 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 168576 | 0x7fc0aab91900 | 0x7fbf7ac36d40 | 524288 | 13874201 | 1775809428 | 12076324915318427 | 12076324915494335 | 12076324915749054 | 12076324915769124 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 230 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 170816 | 0x7fc0aab91800 | 0x7fbf7ac36d80 | 524288 | 9307681 | 1191433172 | 12076324915812435 | 12076324915970173 | 12076324916114332 | 12076324916118083 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 232 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 174080 | 0x7fc0aab91700 | 0x7fbf7ac36dc0 | 524288 | 3367622 | 430932036 | 12076324916167244 | 12076324916342651 | 12076324916653210 | 12076324916701397 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 234 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 176576 | 0x7fc0aab91600 | 0x7fbf7ac36e00 | 524288 | 8639586 | 1105829828 | 12076324916739287 | 12076324916897209 | 12076324917032249 | 12076324917035628 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 236 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 177792 | 0x7fc0aab91500 | 0x7fbf7ac36e40 | 524288 | 2339059 | 299339440 | 12076324917083978 | 12076324917253048 | 12076324917677686 | 12076324917724418 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 238 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 180288 | 0x7fc0aab91400 | 0x7fbf7ac36e80 | 524288 | 10103691 | 1293250032 | 12076324917750777 | 12076324917927285 | 12076324918192244 | 12076324918240618 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 240 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 182784 | 0x7fc0aab91300 | 0x7fbf7ac36ec0 | 524288 | 7301788 | 934484428 | 12076324918267037 | 12076324918444883 | 12076324918586162 | 12076324918589426 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 242 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 186304 | 0x7fc0aab91a00 | 0x7fbf7ac36f00 | 524288 | 3448522 | 441367708 | 12076324918637465 | 12076324918803921 | 12076324919119600 | 12076324919170886 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 244 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 189312 | 0x7fc0aab91900 | 0x7fbf7ac36f40 | 524288 | 3610119 | 462206688 | 12076324919207244 | 12076324919369519 | 12076324919523918 | 12076324919527128 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 246 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 190784 | 0x7fc0aab91800 | 0x7fbf7ac36f80 | 524288 | 2302329 | 294751312 | 12076324919574777 | 12076324919743917 | 12076324920260715 | 12076324920307849 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 248 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 193792 | 0x7fc0aab91700 | 0x7fbf7ac36fc0 | 524288 | 8378304 | 1072369756 | 12076324920330802 | 12076324920519754 | 12076324920817833 | 12076324920838546 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 250 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 196800 | 0x7fc0aab91600 | 0x7fbf7ac37000 | 524288 | 3326783 | 425884268 | 12076324920890202 | 12076324921054472 | 12076324921209031 | 12076324921212571 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 252 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 201088 | 0x7fc0aab91500 | 0x7fbf7ac37040 | 524288 | 3268023 | 418386768 | 12076324921259578 | 12076324921438470 | 12076324921824388 | 12076324921871065 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 254 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 204608 | 0x7fc0aab91400 | 0x7fbf7ac37080 | 524288 | 3406692 | 435950804 | 12076324921914355 | 12076324922081347 | 12076324922258467 | 12076324922261971 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 256 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 206080 | 0x7fc0aab91300 | 0x7fbf7ac370c0 | 524288 | 2321360 | 297201432 | 12076324922310371 | 12076324922480066 | 12076324923090623 | 12076324923138600 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 258 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 209600 | 0x7fc0aab91a00 | 0x7fbf7ac37100 | 524288 | 3726423 | 476982952 | 12076324923164739 | 12076324923348382 | 12076324923675741 | 12076324923721464 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 260 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 213120 | 0x7fc0aab91900 | 0x7fbf7ac37140 | 524288 | 3106039 | 397473404 | 12076324923748774 | 12076324923927260 | 12076324924105979 | 12076324924109525 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 262 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 218176 | 0x7fc0aab91800 | 0x7fbf7ac37180 | 524288 | 3312643 | 423978688 | 12076324924156622 | 12076324924328058 | 12076324924784376 | 12076324924832679 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 264 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 222208 | 0x7fc0aab91700 | 0x7fbf7ac371c0 | 524288 | 2983092 | 381885796 | 12076324924872042 | 12076324925039575 | 12076324925240214 | 12076324925289097 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 266 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 223936 | 0x7fc0aab91600 | 0x7fbf7ac37200 | 524288 | 2291301 | 293339744 | 12076324925311018 | 12076324925497013 | 12076324926207570 | 12076324926256495 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 268 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 227968 | 0x7fc0aab91500 | 0x7fbf7ac37240 | 524288 | 3602250 | 461175832 | 12076324926280810 | 12076324926461009 | 12076324926835087 | 12076324926881707 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 270 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 232000 | 0x7fc0aab91400 | 0x7fbf7ac37280 | 524288 | 3089036 | 395326984 | 12076324926908056 | 12076324927093806 | 12076324927297645 | 12076324927346741 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 272 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 237824 | 0x7fc0aab91300 | 0x7fbf7ac372c0 | 524288 | 4037597 | 516856392 | 12076324927371627 | 12076324927546764 | 12076324928073482 | 12076324928121651 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 274 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 242368 | 0x7fc0aab91a00 | 0x7fbf7ac37300 | 524288 | 3050385 | 390352172 | 12076324928160734 | 12076324928321641 | 12076324928545160 | 12076324928591574 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 276 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 243584 | 0x7fc0aab91900 | 0x7fbf7ac37340 | 524288 | 2324407 | 297411124 | 12076324928613475 | 12076324928796199 | 12076324929596196 | 12076324929646785 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 278 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 248128 | 0x7fc0aab91800 | 0x7fbf7ac37380 | 524288 | 3451819 | 441894164 | 12076324929672984 | 12076324929850595 | 12076324930272033 | 12076324930325016 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 280 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 252672 | 0x7fc0aab91700 | 0x7fbf7ac373c0 | 524288 | 3136706 | 401476888 | 12076324930351976 | 12076324930531072 | 12076324930757951 | 12076324930806060 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 282 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 259264 | 0x7fc0aab91600 | 0x7fbf7ac37400 | 524288 | 4642750 | 594336476 | 12076324930829994 | 12076324931004510 | 12076324931601467 | 12076324931650459 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 284 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 264832 | 0x7fc0aab91500 | 0x7fbf7ac37440 | 524288 | 3205878 | 410331404 | 12076324931687067 | 12076324931855866 | 12076324932126585 | 12076324932177739 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 286 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 266304 | 0x7fc0aab91400 | 0x7fbf7ac37480 | 524288 | 2309146 | 295428132 | 12076324932200201 | 12076324932379224 | 12076324933364020 | 12076324933431459 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 288 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 28 | 24 | 271872 | 0x7fc0aab91300 | 0x7fbf7ac374c0 | 524288 | 3535941 | 452505508 | 12076324933462126 | 12076324933637779 | 12076324934152977 | 12076324934219604 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 290 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 277440 | 0x7fc0aab91a00 | 0x7fbf7ac37500 | 524288 | 3205779 | 410295868 | 12076324934248407 | 12076324934424976 | 12076324934699054 | 12076324934765919 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 292 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 12 | 24 | 279936 | 0x7fc0aab91900 | 0x7fbf7ac37540 | 524288 | 2194670 | 280910352 | 12076324934793480 | 12076324934964493 | 12076324935704650 | 12076324935773872 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 294 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 286528 | 0x7fc0aab91800 | 0x7fbf7ac37580 | 524288 | 3287385 | 420792036 | 12076324935815820 | 12076324935979209 | 12076324936297128 | 12076324936364590 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 296 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 288000 | 0x7fc0aab91700 | 0x7fbf7ac375c0 | 524288 | 2280821 | 291909728 | 12076324936393123 | 12076324936571687 | 12076324937743362 | 12076324937809225 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 298 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 32 | 24 | 294592 | 0x7fc0aab91600 | 0x7fbf7ac37600 | 524288 | 3407856 | 436190608 | 12076324937839431 | 12076324938009281 | 12076324938618078 | 12076324938686485 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 300 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 301184 | 0x7fc0aab91500 | 0x7fbf7ac37640 | 524288 | 3310205 | 423678296 | 12076324938717172 | 12076324938892157 | 12076324939211196 | 12076324939280329 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 302 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 12 | 24 | 304960 | 0x7fc0aab91400 | 0x7fbf7ac37680 | 524288 | 2196223 | 280992068 | 12076324939309994 | 12076324939492634 | 12076324940371831 | 12076324940438000 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 304 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 24 | 24 | 313600 | 0x7fc0aab91300 | 0x7fbf7ac376c0 | 524288 | 3278376 | 419575164 | 12076324940480008 | 12076324940641750 | 12076324941053428 | 12076324941120028 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 306 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 314816 | 0x7fc0aab91a00 | 0x7fbf7ac37700 | 524288 | 2331810 | 298531300 | 12076324941151126 | 12076324941323667 | 12076324942873420 | 12076324942940451 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 308 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 317568 | 0x7fc0aab91900 | 0x7fbf7ac37740 | 524288 | 2263036 | 289789640 | 12076324942963183 | 12076324943154379 | 12076324943949736 | 12076324944019366 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 310 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 12 | 24 | 320320 | 0x7fc0aab91800 | 0x7fbf7ac37780 | 524288 | 2173619 | 278217040 | 12076324944048741 | 12076324944228614 | 12076324944643973 | 12076324944709699 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 312 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 12 | 24 | 324096 | 0x7fc0aab91700 | 0x7fbf7ac377c0 | 524288 | 2242042 | 286971484 | 12076324944733664 | 12076324944908772 | 12076324946068287 | 12076324946136180 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 314 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 12 | 24 | 328896 | 0x7fc0aab91600 | 0x7fbf7ac37800 | 524288 | 2242646 | 287191700 | 12076324946175754 | 12076324946337406 | 12076324947123642 | 12076324947191211 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 316 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 330112 | 0x7fc0aab91500 | 0x7fbf7ac37840 | 524288 | 2662363 | 340770928 | 12076324947220205 | 12076324947398521 | 12076324950447468 | 12076324950514557 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 318 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 332864 | 0x7fc0aab91400 | 0x7fbf7ac37880 | 524288 | 2298931 | 294319360 | 12076324950544573 | 12076324950722507 | 12076324952264421 | 12076324952331274 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 320 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 12 | 24 | 335616 | 0x7fc0aab91300 | 0x7fbf7ac378c0 | 524288 | 2197160 | 281088936 | 12076324952360167 | 12076324952544740 | 12076324953334016 | 12076324953402354 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 322 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 12 | 24 | 339392 | 0x7fc0aab91a00 | 0x7fbf7ac37900 | 524288 | 2535602 | 324582428 | 12076324953432911 | 12076324953610655 | 12076324955893526 | 12076324955961731 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 324 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 12 | 24 | 344192 | 0x7fc0aab91900 | 0x7fbf7ac37940 | 524288 | 2385934 | 305369720 | 12076324956007636 | 12076324956173524 | 12076324957708878 | 12076324957778467 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 326 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 345408 | 0x7fc0aab91800 | 0x7fbf7ac37980 | 524288 | 2884153 | 369236128 | 12076324957808362 | 12076324957987437 | 12076324964042291 | 12076324964112859 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 328 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 20 | 24 | 348160 | 0x7fc0aab91700 | 0x7fbf7ac379c0 | 524288 | 3377375 | 432171988 | 12076324964139058 | 12076324964317330 | 12076324967362437 | 12076324967593037 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 330 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 12 | 24 | 350912 | 0x7fc0aab91600 | 0x7fbf7ac37a00 | 524288 | 2262042 | 289551444 | 12076324967625167 | 12076324967808676 | 12076324969347709 | 12076324969417327 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 332 | 921153 | 921158 | 4194304 | 256 | 0 | 0 | 12 | 24 | 0 | 0x7fc0aab91500 | 0x7fbf7ac37a40 | 524288 | 2567679 | 328586028 | 12076324969444798 | 12076324969626428 | 12076324974153289 | 12076324974220834 |