50 KiB
50 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | GRBM_COUNT | GRBM_GUI_ACTIVE | CPC_ME1_BUSY_FOR_PACKET_DECODE | SQ_CYCLES | SQ_WAVES | SQ_WAVE_CYCLES | SQ_BUSY_CYCLES | SQ_LEVEL_WAVES | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBuffer.kd | 0 | 0 | 0 | 932047 | 932054 | 33554432 | 256 | 0 | 0 | 8 | 32 | 6464 | 0x0 | 0x7f4318204180 | 502027 | 502027 | 17663 | 4016224 | 524288 | 373010853 | 3812072 | 0 | 1506849280 | 12076539256161927 | 12076539500209550 | 12076539500532269 | 12076539500642792 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 932047 | 932054 | 32768 | 256 | 0 | 0 | 24 | 24 | 12480 | 0x0 | 0x7f4318235100 | 28337 | 28337 | 21039 | 226704 | 512 | 1125690 | 76367 | 0 | 4517036 | 12076539515082191 | 12076539515408737 | 12076539515415137 | 12076539515423846 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 4 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 12928 | 0x7f4423eba900 | 0x7f4318235140 | 214085 | 214085 | 21876 | 1712688 | 65536 | 145056154 | 1546601 | 0 | 582037424 | 12076539515493015 | 12076539515729376 | 12076539515859296 | 12076539515863073 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 6 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 36 | 24 | 13632 | 0x7f4423eba800 | 0x7f4318235180 | 384636 | 384636 | 29429 | 3077096 | 65536 | 257748821 | 2910007 | 0 | 1032814660 | 12076539515940978 | 12076539516139775 | 12076539516384574 | 12076539516454523 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 8 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 14080 | 0x7f4423eba700 | 0x7f43182351c0 | 402492 | 402492 | 29357 | 3219944 | 65536 | 279692821 | 3037066 | 0 | 1120588996 | 12076539516489238 | 12076539516696253 | 12076539516951772 | 12076539517020887 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 10 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14528 | 0x7f4423eba600 | 0x7f4318235200 | 212317 | 212317 | 22764 | 1698544 | 65536 | 155474951 | 1531408 | 0 | 623720392 | 12076539517046294 | 12076539517254331 | 12076539517383931 | 12076539517387499 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 12 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14976 | 0x7f4423eba500 | 0x7f4318235240 | 211901 | 211901 | 22389 | 1695216 | 65536 | 142732486 | 1522500 | 0 | 572750716 | 12076539517445937 | 12076539517643130 | 12076539517771769 | 12076539517775330 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 14 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 15424 | 0x7f4423eba400 | 0x7f4318235280 | 215869 | 215869 | 19266 | 1726960 | 65536 | 159152180 | 1562834 | 0 | 638425092 | 12076539517864656 | 12076539518050328 | 12076539518182328 | 12076539518185914 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 16 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16128 | 0x7f4423eba300 | 0x7f43182352c0 | 392132 | 392132 | 32200 | 3137064 | 65536 | 337425059 | 2961038 | 0 | 1351517408 | 12076539518245044 | 12076539518450007 | 12076539518699126 | 12076539518741016 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 18 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16832 | 0x7f4423ebaa00 | 0x7f4318235300 | 397317 | 397317 | 28490 | 3178544 | 65536 | 314230850 | 3009046 | 0 | 1258740612 | 12076539518777825 | 12076539518966805 | 12076539519220404 | 12076539519289907 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 20 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 17536 | 0x7f4423eba900 | 0x7f4318235340 | 208428 | 208428 | 23475 | 1667432 | 65536 | 168392411 | 1499567 | 0 | 675389732 | 12076539519317439 | 12076539519521523 | 12076539519648243 | 12076539519651680 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 22 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18240 | 0x7f4423eba800 | 0x7f4318235380 | 218181 | 218181 | 22368 | 1745456 | 65536 | 148176463 | 1578162 | 0 | 594517888 | 12076539519709708 | 12076539519900562 | 12076539520034162 | 12076539520037909 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 24 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18944 | 0x7f4423eba700 | 0x7f43182353c0 | 211493 | 211493 | 23293 | 1691952 | 65536 | 159187710 | 1520072 | 0 | 638568648 | 12076539520111125 | 12076539520295281 | 12076539520423920 | 12076539520427443 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 26 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 19904 | 0x7f4423eba600 | 0x7f4318235400 | 392900 | 392900 | 22533 | 3143208 | 65536 | 323568499 | 2957821 | 0 | 1296089812 | 12076539520488988 | 12076539520679279 | 12076539520930638 | 12076539520997003 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 28 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 20608 | 0x7f4423eba500 | 0x7f4318235440 | 388044 | 388044 | 27421 | 3104360 | 65536 | 315968977 | 2925187 | 0 | 1265693716 | 12076539521029143 | 12076539521233997 | 12076539521480877 | 12076539521549430 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 30 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 21312 | 0x7f4423eba400 | 0x7f4318235480 | 212861 | 212861 | 25994 | 1702896 | 65536 | 160543700 | 1517346 | 0 | 643992048 | 12076539521571471 | 12076539521771916 | 12076539521900715 | 12076539521904220 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 32 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22016 | 0x7f4423eba300 | 0x7f43182354c0 | 215373 | 215373 | 21749 | 1722992 | 65536 | 152440532 | 1553500 | 0 | 611571948 | 12076539521955896 | 12076539522157834 | 12076539522289674 | 12076539522293064 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 34 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22720 | 0x7f4423ebaa00 | 0x7f4318235500 | 208701 | 208701 | 17514 | 1669616 | 65536 | 165297552 | 1495890 | 0 | 663012708 | 12076539522363775 | 12076539522541833 | 12076539522669193 | 12076539522672720 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 36 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 23680 | 0x7f4423eba900 | 0x7f4318235540 | 399460 | 399460 | 33571 | 3195688 | 65536 | 364799220 | 3028168 | 0 | 1461014924 | 12076539522730978 | 12076539522919912 | 12076539523175591 | 12076539523242860 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 38 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 24384 | 0x7f4423eba800 | 0x7f4318235580 | 397604 | 397604 | 29669 | 3180840 | 65536 | 328803190 | 2990824 | 0 | 1317029904 | 12076539523267366 | 12076539523465670 | 12076539523718309 | 12076539523785009 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 40 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25088 | 0x7f4423eba700 | 0x7f43182355c0 | 210581 | 210581 | 23874 | 1684656 | 65536 | 161468109 | 1515980 | 0 | 647690564 | 12076539523809915 | 12076539524007748 | 12076539524136228 | 12076539524139869 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 42 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25792 | 0x7f4423eba600 | 0x7f4318235600 | 218085 | 218085 | 23334 | 1744688 | 65536 | 160499877 | 1576869 | 0 | 643821736 | 12076539524202566 | 12076539524399107 | 12076539524532706 | 12076539524536006 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 44 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 26496 | 0x7f4423eba500 | 0x7f4318235640 | 209717 | 209717 | 22643 | 1677744 | 65536 | 159537471 | 1511311 | 0 | 639967800 | 12076539524607639 | 12076539524781825 | 12076539524909345 | 12076539524912676 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 46 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 27712 | 0x7f4423eba400 | 0x7f4318235680 | 389613 | 389613 | 33391 | 3116912 | 65536 | 315783764 | 2960375 | 0 | 1264951208 | 12076539524969692 | 12076539525170144 | 12076539525420223 | 12076539525488207 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 48 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 28416 | 0x7f4423eba300 | 0x7f43182356c0 | 394892 | 394892 | 30346 | 3159144 | 65536 | 335876840 | 2992166 | 0 | 1345325376 | 12076539525512733 | 12076539525711262 | 12076539525963741 | 12076539526030456 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 50 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 29120 | 0x7f4423ebaa00 | 0x7f4318235700 | 209245 | 209245 | 20208 | 1673968 | 65536 | 164075248 | 1511213 | 0 | 658119196 | 12076539526053679 | 12076539526253820 | 12076539526381820 | 12076539526385386 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 52 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30080 | 0x7f4423eba900 | 0x7f4318235740 | 218381 | 218381 | 26547 | 1747056 | 65536 | 161860757 | 1576635 | 0 | 649255836 | 12076539526445337 | 12076539526628859 | 12076539526762779 | 12076539526766174 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 54 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30784 | 0x7f4423eba800 | 0x7f4318235780 | 210437 | 210437 | 22470 | 1683504 | 65536 | 160228275 | 1521869 | 0 | 642750380 | 12076539526836936 | 12076539527008378 | 12076539527137497 | 12076539527140951 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 56 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32000 | 0x7f4423eba700 | 0x7f43182357c0 | 449005 | 449005 | 15250 | 3592048 | 65536 | 298339799 | 2970249 | 0 | 1195174808 | 12076539527196735 | 12076539527397656 | 12076539527686456 | 12076539527752980 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 58 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32960 | 0x7f4423eba600 | 0x7f4318235800 | 396132 | 396132 | 28667 | 3169064 | 65536 | 300122611 | 2992825 | 0 | 1202309044 | 12076539527775251 | 12076539527971575 | 12076539528223894 | 12076539528293094 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 60 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 33920 | 0x7f4423eba500 | 0x7f4318235840 | 208044 | 208044 | 22029 | 1664360 | 65536 | 165662590 | 1501017 | 0 | 664472032 | 12076539528317059 | 12076539528514453 | 12076539528642132 | 12076539528645540 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 62 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 34880 | 0x7f4423eba400 | 0x7f4318235880 | 213420 | 213420 | 25970 | 1707368 | 65536 | 158450111 | 1535263 | 0 | 635627332 | 12076539528704590 | 12076539528890771 | 12076539529021331 | 12076539529024856 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 64 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 35840 | 0x7f4423eba300 | 0x7f43182358c0 | 214341 | 214341 | 22778 | 1714736 | 65536 | 158503640 | 1555723 | 0 | 635840568 | 12076539529095136 | 12076539529269170 | 12076539529400690 | 12076539529404191 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 66 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 37312 | 0x7f4423ebaa00 | 0x7f4318235900 | 393501 | 393501 | 27294 | 3148016 | 65536 | 292135368 | 2959063 | 0 | 1170360636 | 12076539529461838 | 12076539529646769 | 12076539529899088 | 12076539529966156 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 68 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 38272 | 0x7f4423eba900 | 0x7f4318235940 | 395740 | 395740 | 29857 | 3165928 | 65536 | 318956410 | 2991481 | 0 | 1277643520 | 12076539529988839 | 12076539530193007 | 12076539530446286 | 12076539530514006 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 70 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 39232 | 0x7f4423eba800 | 0x7f4318235980 | 210892 | 210892 | 24694 | 1687144 | 65536 | 161933161 | 1514602 | 0 | 649554832 | 12076539530537108 | 12076539530742285 | 12076539530870925 | 12076539530874506 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 72 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 40192 | 0x7f4423eba700 | 0x7f43182359c0 | 218149 | 218149 | 25502 | 1745200 | 65536 | 167197763 | 1572574 | 0 | 670637260 | 12076539530932795 | 12076539531121004 | 12076539531255563 | 12076539531259282 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 74 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 41152 | 0x7f4423eba600 | 0x7f4318235a00 | 213669 | 213669 | 24950 | 1709360 | 65536 | 158758103 | 1534953 | 0 | 636856296 | 12076539531331696 | 12076539531503563 | 12076539531633642 | 12076539531637205 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 76 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 42624 | 0x7f4423eba500 | 0x7f4318235a40 | 387493 | 387493 | 27375 | 3099952 | 65536 | 288078618 | 2915784 | 0 | 1154135460 | 12076539531694331 | 12076539531880841 | 12076539532129960 | 12076539532199771 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 78 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 43584 | 0x7f4423eba400 | 0x7f4318235a80 | 388805 | 388805 | 28163 | 3110448 | 65536 | 257785117 | 2922396 | 0 | 1032958956 | 12076539532223926 | 12076539532421639 | 12076539532669799 | 12076539532736670 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 80 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 44544 | 0x7f4423eba300 | 0x7f4318235ac0 | 212876 | 212876 | 25302 | 1703016 | 65536 | 163427144 | 1518417 | 0 | 655547712 | 12076539532759983 | 12076539532952998 | 12076539533082117 | 12076539533085900 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 82 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 45760 | 0x7f4423ebaa00 | 0x7f4318235b00 | 214476 | 214476 | 25502 | 1715816 | 65536 | 162024480 | 1539520 | 0 | 649921084 | 12076539533145601 | 12076539533339236 | 12076539533470916 | 12076539533474523 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 84 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 46720 | 0x7f4423eba900 | 0x7f4318235b40 | 210084 | 210084 | 21001 | 1680680 | 65536 | 163816612 | 1516465 | 0 | 657097232 | 12076539533546456 | 12076539533717475 | 12076539533846275 | 12076539533849971 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 86 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 48448 | 0x7f4423eba800 | 0x7f4318235b80 | 409333 | 409333 | 33833 | 3274672 | 65536 | 309768922 | 3060020 | 0 | 1240895608 | 12076539533909772 | 12076539534100834 | 12076539534361633 | 12076539534429709 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 88 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 49408 | 0x7f4423eba700 | 0x7f4318235bc0 | 449285 | 449285 | 15102 | 3594288 | 65536 | 332564316 | 2962689 | 0 | 1332073724 | 12076539534453423 | 12076539534647712 | 12076539534936831 | 12076539535010980 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 90 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 50368 | 0x7f4423eba600 | 0x7f4318235c00 | 214037 | 214037 | 25667 | 1712304 | 65536 | 161217224 | 1538544 | 0 | 646712252 | 12076539535035356 | 12076539535231230 | 12076539535361469 | 12076539535365169 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 92 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 51584 | 0x7f4423eba500 | 0x7f4318235c40 | 215093 | 215093 | 25716 | 1720752 | 65536 | 158219899 | 1544277 | 0 | 634702480 | 12076539535425041 | 12076539535606269 | 12076539535739068 | 12076539535743002 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 94 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 52544 | 0x7f4423eba400 | 0x7f4318235c80 | 214317 | 214317 | 21854 | 1714544 | 65536 | 161781270 | 1545844 | 0 | 648942668 | 12076539535813954 | 12076539535983707 | 12076539536114907 | 12076539536118671 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 96 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 54272 | 0x7f4423eba300 | 0x7f4318235cc0 | 410324 | 410324 | 33047 | 3282600 | 65536 | 339523520 | 3107522 | 0 | 1359914564 | 12076539536169826 | 12076539536369466 | 12076539536633625 | 12076539536700433 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 98 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 55488 | 0x7f4423ebaa00 | 0x7f4318235d00 | 392629 | 392629 | 30177 | 3141040 | 65536 | 316266298 | 2969078 | 0 | 1266883720 | 12076539536724368 | 12076539536919704 | 12076539537171863 | 12076539537239776 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 100 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 56704 | 0x7f4423eba900 | 0x7f4318235d40 | 213741 | 213741 | 20559 | 1709936 | 65536 | 160614774 | 1544044 | 0 | 644290392 | 12076539537266155 | 12076539537460822 | 12076539537592502 | 12076539537596009 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 102 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 58176 | 0x7f4423eba800 | 0x7f4318235d80 | 224884 | 224884 | 27629 | 1799080 | 65536 | 178813063 | 1622518 | 0 | 717122716 | 12076539537654087 | 12076539537838741 | 12076539537977460 | 12076539537981045 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 104 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 59392 | 0x7f4423eba700 | 0x7f4318235dc0 | 212324 | 212324 | 24327 | 1698600 | 65536 | 159376433 | 1529213 | 0 | 639328396 | 12076539538051386 | 12076539538224340 | 12076539538355219 | 12076539538358728 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 106 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 61376 | 0x7f4423eba600 | 0x7f4318235e00 | 405484 | 405484 | 33823 | 3243880 | 65536 | 316935047 | 3073762 | 0 | 1269554680 | 12076539538417687 | 12076539538602098 | 12076539538863217 | 12076539538928908 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 108 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 62592 | 0x7f4423eba500 | 0x7f4318235e40 | 394789 | 394789 | 23300 | 3158320 | 65536 | 290527648 | 2973188 | 0 | 1163929528 | 12076539538951560 | 12076539539151697 | 12076539539405776 | 12076539539472740 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 110 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 63808 | 0x7f4423eba400 | 0x7f4318235e80 | 217668 | 217668 | 24042 | 1741352 | 65536 | 166154705 | 1572065 | 0 | 666468924 | 12076539539491395 | 12076539539698095 | 12076539539831374 | 12076539539834904 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 112 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 65280 | 0x7f4423eba300 | 0x7f4318235ec0 | 218605 | 218605 | 27048 | 1748848 | 65536 | 182181831 | 1583724 | 0 | 730568756 | 12076539539893232 | 12076539540086093 | 12076539540221613 | 12076539540225270 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 114 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 66496 | 0x7f4423ebaa00 | 0x7f4318235f00 | 213317 | 213317 | 25345 | 1706544 | 65536 | 157655889 | 1537173 | 0 | 632441556 | 12076539540299027 | 12076539540471692 | 12076539540602412 | 12076539540605988 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 116 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 68480 | 0x7f4423eba900 | 0x7f4318235f40 | 404109 | 404109 | 32279 | 3232880 | 65536 | 292745969 | 3056493 | 0 | 1172827892 | 12076539540655169 | 12076539540847371 | 12076539541108810 | 12076539541176629 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 118 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 69696 | 0x7f4423eba800 | 0x7f4318235f80 | 386989 | 386989 | 28700 | 3095920 | 65536 | 312968802 | 2923908 | 0 | 1253693336 | 12076539541200684 | 12076539541400649 | 12076539541648968 | 12076539541715602 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 120 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 70912 | 0x7f4423eba700 | 0x7f4318235fc0 | 210908 | 210908 | 24817 | 1687272 | 65536 | 161522256 | 1518926 | 0 | 647957384 | 12076539541738444 | 12076539541931527 | 12076539542061127 | 12076539542064902 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 122 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 72384 | 0x7f4423eba600 | 0x7f4318236000 | 225629 | 225629 | 28226 | 1805040 | 65536 | 184569635 | 1633291 | 0 | 740148196 | 12076539542115265 | 12076539542314886 | 12076539542453925 | 12076539542457562 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 124 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 73600 | 0x7f4423eba500 | 0x7f4318236040 | 212597 | 212597 | 25805 | 1700784 | 65536 | 161704193 | 1531454 | 0 | 648642700 | 12076539542528103 | 12076539542701604 | 12076539542831844 | 12076539542835565 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 126 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 75840 | 0x7f4423eba400 | 0x7f4318236080 | 405725 | 405725 | 37301 | 3245808 | 65536 | 317268621 | 3072402 | 0 | 1270891056 | 12076539542886590 | 12076539543086563 | 12076539543348322 | 12076539543414582 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 128 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 77056 | 0x7f4423eba300 | 0x7f43182360c0 | 402196 | 402196 | 29450 | 3217576 | 65536 | 277427634 | 3017926 | 0 | 1111527848 | 12076539543433878 | 12076539543631841 | 12076539543889280 | 12076539543956530 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 130 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 78272 | 0x7f4423ebaa00 | 0x7f4318236100 | 212149 | 212149 | 26028 | 1697200 | 65536 | 167169679 | 1521350 | 0 | 670528196 | 12076539543980795 | 12076539544182559 | 12076539544312159 | 12076539544316009 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 132 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 80000 | 0x7f4423eba900 | 0x7f4318236140 | 232541 | 232541 | 26099 | 1860336 | 65536 | 201096862 | 1689339 | 0 | 806253228 | 12076539544367785 | 12076539544565758 | 12076539544710238 | 12076539544713929 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 134 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 81216 | 0x7f4423eba800 | 0x7f4318236180 | 219516 | 219516 | 23605 | 1756136 | 65536 | 165799056 | 1582560 | 0 | 665053064 | 12076539544785632 | 12076539544956317 | 12076539545091036 | 12076539545095138 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 136 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 83456 | 0x7f4423eba700 | 0x7f43182361c0 | 414972 | 414972 | 30784 | 3319784 | 65536 | 319219982 | 3097550 | 0 | 1278700860 | 12076539545151022 | 12076539545344955 | 12076539545611355 | 12076539545678413 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 138 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 84928 | 0x7f4423eba600 | 0x7f4318236200 | 393308 | 393308 | 33782 | 3146472 | 65536 | 326389601 | 2963130 | 0 | 1307374880 | 12076539545703400 | 12076539545898074 | 12076539546150713 | 12076539546192159 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 140 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 86400 | 0x7f4423eba500 | 0x7f4318236240 | 210901 | 210901 | 26428 | 1687216 | 65536 | 159867269 | 1511839 | 0 | 641322452 | 12076539546229278 | 12076539546414392 | 12076539546543831 | 12076539546547520 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 142 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 88128 | 0x7f4423eba400 | 0x7f4318236280 | 240757 | 240757 | 28236 | 1926064 | 65536 | 211812374 | 1760878 | 0 | 849109668 | 12076539546605939 | 12076539546789111 | 12076539546939030 | 12076539546942585 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 144 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 89600 | 0x7f4423eba300 | 0x7f43182362c0 | 212141 | 212141 | 25544 | 1697136 | 65536 | 160031469 | 1523145 | 0 | 641969516 | 12076539547036279 | 12076539547208789 | 12076539547339509 | 12076539547343180 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 146 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 92096 | 0x7f4423ebaa00 | 0x7f4318236300 | 408236 | 408236 | 32430 | 3265896 | 65536 | 291600969 | 3023547 | 0 | 1168222160 | 12076539547402110 | 12076539547585428 | 12076539547848147 | 12076539547915525 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 148 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 93568 | 0x7f4423eba900 | 0x7f4318236340 | 391564 | 391564 | 31768 | 3132520 | 65536 | 329929306 | 2951494 | 0 | 1321549252 | 12076539547940451 | 12076539548139506 | 12076539548391665 | 12076539548460829 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 150 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 95040 | 0x7f4423eba800 | 0x7f4318236380 | 220932 | 220932 | 27239 | 1767464 | 65536 | 170692455 | 1596627 | 0 | 684601716 | 12076539548483731 | 12076539548682384 | 12076539548818224 | 12076539548821931 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 152 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 96768 | 0x7f4423eba700 | 0x7f43182363c0 | 252132 | 252132 | 28039 | 2017064 | 65536 | 219135315 | 1848924 | 0 | 878405476 | 12076539548879017 | 12076539549060463 | 12076539549218222 | 12076539549222115 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 154 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 98240 | 0x7f4423eba600 | 0x7f4318236400 | 217908 | 217908 | 26726 | 1743272 | 65536 | 161732542 | 1565425 | 0 | 648762004 | 12076539549293428 | 12076539549464781 | 12076539549598381 | 12076539549602122 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 156 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 100736 | 0x7f4423eba500 | 0x7f4318236440 | 410508 | 410508 | 35220 | 3284072 | 65536 | 324406985 | 3094544 | 0 | 1299446960 | 12076539549659258 | 12076539549841100 | 12076539550106059 | 12076539550176250 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 158 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 102208 | 0x7f4423eba400 | 0x7f4318236480 | 400476 | 400476 | 29633 | 3203816 | 65536 | 258771257 | 3009523 | 0 | 1036904296 | 12076539550200855 | 12076539550395178 | 12076539550652617 | 12076539550719741 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 160 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 103680 | 0x7f4423eba300 | 0x7f43182364c0 | 220597 | 220597 | 25705 | 1764784 | 65536 | 169493389 | 1591755 | 0 | 679862632 | 12076539550743385 | 12076539550936456 | 12076539551072616 | 12076539551076524 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 162 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 105664 | 0x7f4423ebaa00 | 0x7f4318236500 | 266717 | 266717 | 29492 | 2133744 | 65536 | 236403157 | 1963801 | 0 | 947460520 | 12076539551134903 | 12076539551330055 | 12076539551497095 | 12076539551500804 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 164 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 107136 | 0x7f4423eba900 | 0x7f4318236540 | 220516 | 220516 | 27298 | 1764136 | 65536 | 165012275 | 1586662 | 0 | 661875912 | 12076539551570724 | 12076539551742214 | 12076539551878373 | 12076539551882003 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 166 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 109888 | 0x7f4423eba800 | 0x7f4318236580 | 404381 | 404381 | 38320 | 3235056 | 65536 | 315768659 | 3036582 | 0 | 1264902140 | 12076539551932647 | 12076539552131172 | 12076539552392131 | 12076539552443096 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 168 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 111360 | 0x7f4423eba700 | 0x7f43182365c0 | 397124 | 397124 | 26136 | 3177000 | 65536 | 259676647 | 2956125 | 0 | 1040523852 | 12076539552467832 | 12076539552660611 | 12076539552916290 | 12076539552938358 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 170 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 112832 | 0x7f4423eba600 | 0x7f4318236600 | 217381 | 217381 | 23631 | 1739056 | 65536 | 167844787 | 1568447 | 0 | 673256672 | 12076539552992238 | 12076539553167969 | 12076539553301568 | 12076539553305541 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 172 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 114816 | 0x7f4423eba500 | 0x7f4318236640 | 275765 | 275765 | 29612 | 2206128 | 65536 | 245890555 | 2042546 | 0 | 985409772 | 12076539553364370 | 12076539553548608 | 12076539553722687 | 12076539553726474 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 174 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 116288 | 0x7f4423eba400 | 0x7f4318236680 | 219277 | 219277 | 24997 | 1754224 | 65536 | 172741132 | 1583926 | 0 | 692837616 | 12076539553796905 | 12076539553970366 | 12076539554105566 | 12076539554109326 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 176 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 119040 | 0x7f4423eba300 | 0x7f43182366c0 | 397924 | 397924 | 38664 | 3183400 | 65536 | 335150662 | 2995908 | 0 | 1342474532 | 12076539554166292 | 12076539554359645 | 12076539554617084 | 12076539554665741 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 178 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 120768 | 0x7f4423ebaa00 | 0x7f4318236700 | 451429 | 451429 | 19078 | 3611440 | 65536 | 265901707 | 2923095 | 0 | 1065425080 | 12076539554688834 | 12076539554884123 | 12076539555174202 | 12076539555223699 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 180 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 122496 | 0x7f4423eba900 | 0x7f4318236740 | 222077 | 222077 | 27234 | 1776624 | 65536 | 169508774 | 1599073 | 0 | 679907308 | 12076539555248014 | 12076539555445561 | 12076539555581881 | 12076539555585642 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 182 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 124736 | 0x7f4423eba800 | 0x7f4318236780 | 289532 | 289532 | 30316 | 2316264 | 65536 | 258844184 | 2153967 | 0 | 1037246008 | 12076539555645313 | 12076539555828760 | 12076539556012119 | 12076539556016073 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 184 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 126464 | 0x7f4423eba700 | 0x7f43182367c0 | 218221 | 218221 | 22984 | 1745776 | 65536 | 165781438 | 1559706 | 0 | 664998292 | 12076539556101341 | 12076539556276438 | 12076539556408918 | 12076539556412790 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 186 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 127936 | 0x7f4423eba600 | 0x7f4318236800 | 408589 | 408589 | 35900 | 3268720 | 65536 | 377033478 | 3099857 | 0 | 1509953888 | 12076539556473523 | 12076539556654677 | 12076539556919636 | 12076539556968063 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 188 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 129664 | 0x7f4423eba500 | 0x7f4318236840 | 389164 | 389164 | 34775 | 3113320 | 65536 | 315336088 | 2919102 | 0 | 1263165704 | 12076539556989643 | 12076539557196915 | 12076539557446994 | 12076539557496837 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 190 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 131392 | 0x7f4423eba400 | 0x7f4318236880 | 214700 | 214700 | 20603 | 1717608 | 65536 | 166865449 | 1551116 | 0 | 669317244 | 12076539557530940 | 12076539557722353 | 12076539557854993 | 12076539557858880 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 192 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 133632 | 0x7f4423eba300 | 0x7f43182368c0 | 302381 | 302381 | 32196 | 2419056 | 65536 | 272099268 | 2251294 | 0 | 1090241708 | 12076539557916808 | 12076539558107792 | 12076539558299311 | 12076539558348942 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 194 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 135360 | 0x7f4423ebaa00 | 0x7f4318236900 | 221972 | 221972 | 25312 | 1775784 | 65536 | 171171967 | 1604347 | 0 | 686563316 | 12076539558387053 | 12076539558563630 | 12076539558700910 | 12076539558704623 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 196 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 136832 | 0x7f4423eba900 | 0x7f4318236940 | 436981 | 436981 | 41608 | 3495856 | 65536 | 403803421 | 3313333 | 0 | 1617035172 | 12076539558762150 | 12076539558948909 | 12076539559232588 | 12076539559281286 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 198 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 138560 | 0x7f4423eba800 | 0x7f4318236980 | 387732 | 387732 | 33051 | 3101864 | 65536 | 336168336 | 2924330 | 0 | 1346515816 | 12076539559305892 | 12076539559499787 | 12076539559750506 | 12076539559799290 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 200 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 140288 | 0x7f4423eba700 | 0x7f43182369c0 | 227357 | 227357 | 27174 | 1818864 | 65536 | 173238101 | 1633646 | 0 | 694839224 | 12076539559817203 | 12076539560014986 | 12076539560154825 | 12076539560159139 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 202 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 142784 | 0x7f4423eba600 | 0x7f4318236a00 | 330132 | 330132 | 33365 | 2641064 | 65536 | 297166738 | 2474091 | 0 | 1190521024 | 12076539560215955 | 12076539560411304 | 12076539560621863 | 12076539560644171 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 204 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 144768 | 0x7f4423eba500 | 0x7f4318236a40 | 213357 | 213357 | 26864 | 1706864 | 65536 | 163963370 | 1537735 | 0 | 657724816 | 12076539560710896 | 12076539560883463 | 12076539561015142 | 12076539561019059 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 206 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 145728 | 0x7f4423eba400 | 0x7f4318236a80 | 472652 | 472652 | 42088 | 3781224 | 65536 | 435175208 | 3605903 | 0 | 1742521028 | 12076539561068801 | 12076539561260741 | 12076539561569380 | 12076539561591313 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 208 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 147712 | 0x7f4423eba300 | 0x7f4318236ac0 | 391572 | 391572 | 31869 | 3132584 | 65536 | 312644928 | 2938508 | 0 | 1252403528 | 12076539561643220 | 12076539561811139 | 12076539562063779 | 12076539562086093 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 210 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 149696 | 0x7f4423ebaa00 | 0x7f4318236b00 | 213901 | 213901 | 25989 | 1711216 | 65536 | 163129910 | 1538185 | 0 | 654384080 | 12076539562138731 | 12076539562310978 | 12076539562442977 | 12076539562446905 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 212 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 152192 | 0x7f4423eba900 | 0x7f4318236b40 | 358245 | 358245 | 36987 | 2865968 | 65536 | 326658037 | 2689677 | 0 | 1308478340 | 12076539562504502 | 12076539562690656 | 12076539562918976 | 12076539562939872 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 214 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 154176 | 0x7f4423eba800 | 0x7f4318236b80 | 217597 | 217597 | 27104 | 1740784 | 65536 | 171228040 | 1572096 | 0 | 686808540 | 12076539563009271 | 12076539563184751 | 12076539563319471 | 12076539563326871 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 216 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 155648 | 0x7f4423eba700 | 0x7f4318236bc0 | 506516 | 506516 | 44667 | 4052136 | 65536 | 472333292 | 3881050 | 0 | 1891153688 | 12076539563374320 | 12076539563594829 | 12076539563925388 | 12076539563945552 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 218 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 157632 | 0x7f4423eba600 | 0x7f4318236c00 | 394044 | 394044 | 34711 | 3152360 | 65536 | 338460257 | 2965566 | 0 | 1355667104 | 12076539564004963 | 12076539564177387 | 12076539564432107 | 12076539564482531 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 220 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 159616 | 0x7f4423eba500 | 0x7f4318236c40 | 218148 | 218148 | 27459 | 1745192 | 65536 | 161402768 | 1567003 | 0 | 647476664 | 12076539564507167 | 12076539564704106 | 12076539564838666 | 12076539564841719 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 222 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 162368 | 0x7f4423eba400 | 0x7f4318236c80 | 382685 | 382685 | 37057 | 3061488 | 65536 | 352418579 | 2893804 | 0 | 1411522080 | 12076539564899647 | 12076539565090345 | 12076539565335464 | 12076539565385200 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 224 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 164608 | 0x7f4423eba300 | 0x7f4318236cc0 | 222684 | 222684 | 28213 | 1781480 | 65536 | 174659076 | 1610928 | 0 | 700515228 | 12076539565419614 | 12076539565624744 | 12076539565762343 | 12076539565765327 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 226 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 166336 | 0x7f4423ebaa00 | 0x7f4318236d00 | 575277 | 575277 | 49017 | 4602224 | 65536 | 542085357 | 4423425 | 0 | 2170161148 | 12076539565822624 | 12076539566006663 | 12076539566383142 | 12076539566438009 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 228 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 168576 | 0x7f4423eba900 | 0x7f4318236d40 | 411333 | 411333 | 32773 | 3290672 | 65536 | 294082965 | 3109407 | 0 | 1178149968 | 12076539566462494 | 12076539566681861 | 12076539566948100 | 12076539566995155 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 230 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 170816 | 0x7f4423eba800 | 0x7f4318236d80 | 220189 | 220189 | 27563 | 1761520 | 65536 | 180631894 | 1591688 | 0 | 724389492 | 12076539567017396 | 12076539567219779 | 12076539567356579 | 12076539567359663 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 232 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 174080 | 0x7f4423eba700 | 0x7f4318236dc0 | 434277 | 434277 | 40134 | 3474224 | 65536 | 400605027 | 3308028 | 0 | 1604265284 | 12076539567418563 | 12076539567603778 | 12076539567883458 | 12076539567931457 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 234 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 176576 | 0x7f4423eba600 | 0x7f4318236e00 | 221860 | 221860 | 26317 | 1774888 | 65536 | 183990518 | 1582528 | 0 | 737848128 | 12076539567966682 | 12076539568154497 | 12076539568290657 | 12076539568293951 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 236 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 177792 | 0x7f4423eba500 | 0x7f4318236e40 | 681069 | 681069 | 15834 | 5448560 | 65536 | 613770776 | 5015320 | 0 | 2456901536 | 12076539568355185 | 12076539568539936 | 12076539568988895 | 12076539569036933 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 238 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 180288 | 0x7f4423eba400 | 0x7f4318236e80 | 406237 | 406237 | 38275 | 3249904 | 65536 | 337896445 | 3059312 | 0 | 1353414276 | 12076539569061068 | 12076539569257854 | 12076539569520734 | 12076539569567560 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 240 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 182784 | 0x7f4423eba300 | 0x7f4318236ec0 | 221404 | 221404 | 25492 | 1771240 | 65536 | 187699303 | 1605385 | 0 | 752685080 | 12076539569590152 | 12076539569784413 | 12076539569922173 | 12076539569925175 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 242 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 186304 | 0x7f4423ebaa00 | 0x7f4318236f00 | 488172 | 488172 | 43321 | 3905384 | 65536 | 456128425 | 3738992 | 0 | 1826365740 | 12076539569983995 | 12076539570178812 | 12076539570494491 | 12076539570543575 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 244 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 189312 | 0x7f4423eba900 | 0x7f4318236f40 | 242548 | 242548 | 26894 | 1940392 | 65536 | 215380939 | 1778368 | 0 | 863419016 | 12076539570578210 | 12076539570761850 | 12076539570914330 | 12076539570917401 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 246 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 190784 | 0x7f4423eba800 | 0x7f4318236f80 | 785316 | 785316 | 60413 | 6282536 | 65536 | 750386555 | 6116830 | 0 | 3003366548 | 12076539570975639 | 12076539571166329 | 12076539571685208 | 12076539571735092 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 248 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 193792 | 0x7f4423eba700 | 0x7f4318236fc0 | 462404 | 462404 | 41294 | 3699240 | 65536 | 389065757 | 3519488 | 0 | 1558101460 | 12076539571759537 | 12076539571953047 | 12076539572255927 | 12076539572305873 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 250 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 196800 | 0x7f4423eba600 | 0x7f4318237000 | 246205 | 246205 | 27832 | 1969648 | 65536 | 217456841 | 1805195 | 0 | 871712088 | 12076539572330299 | 12076539572526006 | 12076539572680085 | 12076539572683225 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 252 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 201088 | 0x7f4423eba500 | 0x7f4318237040 | 592757 | 592757 | 47125 | 4742064 | 65536 | 560846135 | 4582835 | 0 | 2245236168 | 12076539572743437 | 12076539572924405 | 12076539573310804 | 12076539573360074 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 254 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 204608 | 0x7f4423eba400 | 0x7f4318237080 | 279484 | 279484 | 30869 | 2235880 | 65536 | 250652439 | 2064728 | 0 | 1004506820 | 12076539573394529 | 12076539573578803 | 12076539573755123 | 12076539573758245 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 256 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 206080 | 0x7f4423eba300 | 0x7f43182370c0 | 925917 | 925917 | 69064 | 7407344 | 65536 | 888877037 | 7236333 | 0 | 3557328232 | 12076539573814099 | 12076539574003442 | 12076539574617360 | 12076539574667527 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 258 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 209600 | 0x7f4423ebaa00 | 0x7f4318237100 | 502348 | 502348 | 44590 | 4018792 | 65536 | 439118559 | 3825833 | 0 | 1758313140 | 12076539574691411 | 12076539574889200 | 12076539575217519 | 12076539575267342 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 260 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 213120 | 0x7f4423eba900 | 0x7f4318237140 | 282684 | 282684 | 28726 | 2261480 | 65536 | 252689238 | 2099931 | 0 | 1012641916 | 12076539575291597 | 12076539575486478 | 12076539575666158 | 12076539575669320 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 262 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 218176 | 0x7f4423eba800 | 0x7f4318237180 | 699004 | 699004 | 55608 | 5592040 | 65536 | 664823353 | 5420629 | 0 | 2661141680 | 12076539575728059 | 12076539575911117 | 12076539576367436 | 12076539576418283 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 264 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 222208 | 0x7f4423eba700 | 0x7f43182371c0 | 313445 | 313445 | 31630 | 2507568 | 65536 | 282905871 | 2340290 | 0 | 1133508000 | 12076539576455062 | 12076539576633835 | 12076539576834315 | 12076539576883679 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 266 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 223936 | 0x7f4423eba600 | 0x7f4318237200 | 1067005 | 1067005 | 77826 | 8536048 | 65536 | 1028681435 | 8360329 | 0 | 4116546560 | 12076539576907864 | 12076539577105034 | 12076539577811112 | 12076539577880232 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 268 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 227968 | 0x7f4423eba500 | 0x7f4318237240 | 567516 | 567516 | 47066 | 4540136 | 65536 | 533040219 | 4369038 | 0 | 2134004644 | 12076539577903656 | 12076539578103591 | 12076539578476871 | 12076539578544288 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 270 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 232000 | 0x7f4423eba400 | 0x7f4318237280 | 318932 | 318932 | 33166 | 2551464 | 65536 | 289021482 | 2378929 | 0 | 1157974008 | 12076539578567581 | 12076539578762630 | 12076539578965509 | 12076539579033618 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 272 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 237824 | 0x7f4423eba300 | 0x7f43182372c0 | 803653 | 803653 | 60431 | 6429232 | 65536 | 770151333 | 6265288 | 0 | 3082454928 | 12076539579062081 | 12076539579256069 | 12076539579783427 | 12076539579850538 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 274 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 242368 | 0x7f4423ebaa00 | 0x7f4318237300 | 349972 | 349972 | 35373 | 2799784 | 65536 | 319600579 | 2626228 | 0 | 1280294176 | 12076539579885503 | 12076539580069506 | 12076539580293186 | 12076539580362299 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 276 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 243584 | 0x7f4423eba900 | 0x7f4318237340 | 1209261 | 1209261 | 86183 | 9674096 | 65536 | 1168697018 | 9490305 | 0 | 4676608676 | 12076539580385312 | 12076539580581025 | 12076539581381983 | 12076539581449672 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 278 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 248128 | 0x7f4423eba800 | 0x7f4318237380 | 640132 | 640132 | 53668 | 5121064 | 65536 | 599660316 | 4940574 | 0 | 2400485004 | 12076539581479718 | 12076539581674782 | 12076539582097341 | 12076539582165464 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 280 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 252672 | 0x7f4423eba700 | 0x7f43182373c0 | 353644 | 353644 | 35173 | 2829160 | 65536 | 322966437 | 2656731 | 0 | 1293749792 | 12076539582196702 | 12076539582390140 | 12076539582616860 | 12076539582683527 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 282 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 259264 | 0x7f4423eba600 | 0x7f4318237400 | 913252 | 913252 | 68136 | 7306024 | 65536 | 874047575 | 7108852 | 0 | 3498042204 | 12076539582706029 | 12076539582904859 | 12076539583502618 | 12076539583572010 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 284 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 264832 | 0x7f4423eba500 | 0x7f4318237440 | 465477 | 465477 | 15623 | 3723824 | 65536 | 385617966 | 3174831 | 0 | 1544356816 | 12076539583607025 | 12076539583792857 | 12076539584094456 | 12076539584164873 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 286 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 266304 | 0x7f4423eba400 | 0x7f4318237480 | 1489852 | 1489852 | 102328 | 11918824 | 65536 | 1447143697 | 11738272 | 0 | 5790395304 | 12076539584187906 | 12076539584384375 | 12076539585372853 | 12076539585441117 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 288 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 28 | 24 | 271872 | 0x7f4423eba300 | 0x7f43182374c0 | 776861 | 776861 | 59692 | 6214896 | 65536 | 741678364 | 6048016 | 0 | 2968545520 | 12076539585470481 | 12076539585667252 | 12076539586182131 | 12076539586250302 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 290 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 277440 | 0x7f4423ebaa00 | 0x7f4318237500 | 424052 | 424052 | 40753 | 3392424 | 65536 | 390940143 | 3216035 | 0 | 1565656504 | 12076539586281059 | 12076539586473970 | 12076539586747249 | 12076539586814421 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 292 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 12 | 24 | 279936 | 0x7f4423eba900 | 0x7f4318237540 | 1127588 | 1127588 | 79764 | 9020712 | 65536 | 1089666359 | 8846401 | 0 | 4360489876 | 12076539586837584 | 12076539587040369 | 12076539587780047 | 12076539587849266 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 294 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 286528 | 0x7f4423eba800 | 0x7f4318237580 | 491236 | 491236 | 44858 | 3929896 | 65536 | 456921999 | 3756820 | 0 | 1829591628 | 12076539587884682 | 12076539588075886 | 12076539588394445 | 12076539588463619 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 296 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 288000 | 0x7f4423eba700 | 0x7f43182375c0 | 1768581 | 1768581 | 117542 | 14148656 | 65536 | 1724447322 | 13979919 | 0 | 6899609844 | 12076539588480260 | 12076539588686124 | 12076539589862441 | 12076539589930097 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 298 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 32 | 24 | 294592 | 0x7f4423eba600 | 0x7f4318237600 | 921053 | 921053 | 66297 | 7368432 | 65536 | 804876492 | 7196129 | 0 | 3221370360 | 12076539589960724 | 12076539590164040 | 12076539590776999 | 12076539590846932 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 300 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 301184 | 0x7f4423eba500 | 0x7f4318237640 | 492644 | 492644 | 42992 | 3941160 | 65536 | 461031505 | 3771720 | 0 | 1846012960 | 12076539590876347 | 12076539591075558 | 12076539591395397 | 12076539591462808 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 302 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 12 | 24 | 304960 | 0x7f4423eba400 | 0x7f4318237680 | 1337396 | 1337396 | 92333 | 10699176 | 65536 | 1299277386 | 10528946 | 0 | 5198938588 | 12076539591485901 | 12076539591683877 | 12076539592563714 | 12076539592632033 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 304 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 24 | 24 | 313600 | 0x7f4423eba300 | 0x7f43182376c0 | 633333 | 633333 | 54072 | 5066672 | 65536 | 596476135 | 4888805 | 0 | 2387800312 | 12076539592676495 | 12076539592851394 | 12076539593264353 | 12076539593334429 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 306 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 314816 | 0x7f4423ebaa00 | 0x7f4318237700 | 2333356 | 2333356 | 79878 | 18666856 | 65536 | 2284896529 | 18494385 | 0 | 9141407988 | 12076539593365377 | 12076539593559872 | 12076539595112668 | 12076539595180623 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 308 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 317568 | 0x7f4423eba900 | 0x7f4318237740 | 1201356 | 1201356 | 84410 | 9610856 | 65536 | 1163784346 | 9436414 | 0 | 4656960640 | 12076539595208676 | 12076539595416667 | 12076539596213945 | 12076539596281711 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 310 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 12 | 24 | 320320 | 0x7f4423eba800 | 0x7f4318237780 | 640204 | 640204 | 49910 | 5121640 | 65536 | 609787230 | 4957036 | 0 | 2440985580 | 12076539596312980 | 12076539596508024 | 12076539596923863 | 12076539596991732 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 312 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 12 | 24 | 324096 | 0x7f4423eba700 | 0x7f43182377c0 | 1758908 | 1758908 | 118155 | 14071272 | 65536 | 1714603939 | 13898946 | 0 | 6860241008 | 12076539597015316 | 12076539597221622 | 12076539598381619 | 12076539598451678 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 314 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 12 | 24 | 328896 | 0x7f4423eba600 | 0x7f4318237800 | 1198893 | 1198893 | 83313 | 9591152 | 65536 | 1162202950 | 9418965 | 0 | 4650639276 | 12076539598497092 | 12076539598670739 | 12076539599457617 | 12076539599525425 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 316 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 330112 | 0x7f4423eba500 | 0x7f4318237840 | 4584605 | 4584605 | 282315 | 36676848 | 65536 | 4514668689 | 36504958 | 0 | 18060495812 | 12076539599556202 | 12076539599751536 | 12076539602807688 | 12076539602875888 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 318 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 332864 | 0x7f4423eba400 | 0x7f4318237880 | 2323717 | 2323717 | 149516 | 18589744 | 65536 | 2276271710 | 18426457 | 0 | 9106912448 | 12076539602907176 | 12076539603104647 | 12076539604650083 | 12076539604718685 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 320 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 12 | 24 | 335616 | 0x7f4423eba300 | 0x7f43182378c0 | 1203644 | 1203644 | 84669 | 9629160 | 65536 | 1165498254 | 9459635 | 0 | 4663816016 | 12076539604744233 | 12076539604944162 | 12076539605734400 | 12076539605803483 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 322 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 12 | 24 | 339392 | 0x7f4423ebaa00 | 0x7f4318237900 | 3442909 | 3442909 | 215169 | 27543280 | 65536 | 3384776709 | 27373869 | 0 | 13540931208 | 12076539605831495 | 12076539606036160 | 12076539608318234 | 12076539608386899 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 324 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 12 | 24 | 344192 | 0x7f4423eba900 | 0x7f4318237940 | 2326380 | 2326380 | 152550 | 18611048 | 65536 | 2276299888 | 18421771 | 0 | 9107028724 | 12076539608431972 | 12076539608608793 | 12076539610145269 | 12076539610213496 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 326 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 345408 | 0x7f4423eba800 | 0x7f4318237980 | 9087740 | 9087740 | 473479 | 72701928 | 65536 | 8978154106 | 72527985 | 0 | 35914436988 | 12076539610248151 | 12076539610438708 | 12076539616501253 | 12076539616571974 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 328 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 20 | 24 | 348160 | 0x7f4423eba700 | 0x7f43182379c0 | 4574484 | 4574484 | 283331 | 36595880 | 65536 | 4501040258 | 36416888 | 0 | 18005984112 | 12076539616598613 | 12076539616799652 | 12076539619846204 | 12076539619916605 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 330 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 12 | 24 | 350912 | 0x7f4423eba600 | 0x7f4318237a00 | 2330213 | 2330213 | 150793 | 18641712 | 65536 | 2281449272 | 18463936 | 0 | 9127621428 | 12076539619943846 | 12076539620150203 | 12076539621690679 | 12076539621760165 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 332 | 932047 | 932054 | 4194304 | 256 | 0 | 0 | 12 | 24 | 0 | 0x7f4423eba500 | 0x7f4318237a40 | 6816229 | 6816229 | 412766 | 54529840 | 65536 | 6723941280 | 54336435 | 0 | 26897589764 | 12076539621793717 | 12076539621986528 | 12076539626515797 | 12076539626589217 |