41 KiB
41 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | SQ_INSTS_VMEM | SQ_INST_LEVEL_VMEM | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 238129 | 238129 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7fe2c7e04280 | 524288 | 5497472 | 615656480 | 17851610507915 | 17849318958956 | 17851757718801 | 17851757807931 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 238129 | 238129 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7fe2c7e23f80 | 4096 | 55920 | 6257708 | 17851762985423 | 17851757718801 | 17851763112570 | 17851763117229 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7fe2d67ec380 | 0x7fe2c7e23fc0 | 524288 | 10960198 | 1227561992 | 17851763151509 | 17851763112570 | 17851763483290 | 17851763485710 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7fe2d67ec200 | 0x7fe2c7e24000 | 524288 | 11381323 | 1274672356 | 17851763522879 | 17851763483290 | 17851763890331 | 17851763892860 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7fe2d67ec080 | 0x7fe2c7e24040 | 524288 | 11627241 | 1302212244 | 17851763925789 | 17851763890331 | 17851764290172 | 17851764292530 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7fe2d414df00 | 0x7fe2c7e24080 | 524288 | 10699863 | 1198379556 | 17851764323980 | 17851764290172 | 17851764605852 | 17851764608203 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7fe2d414dd80 | 0x7fe2c7e240c0 | 524288 | 11118838 | 1245185864 | 17851764640972 | 17851764605852 | 17851764908573 | 17851764910935 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7fe2d414dc00 | 0x7fe2c7e24100 | 524288 | 11178497 | 1251943004 | 17851764953374 | 17851764908573 | 17851765209053 | 17851765211248 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7fe2d414da80 | 0x7fe2c7e24140 | 524288 | 11592460 | 1298324336 | 17851765242887 | 17851765209053 | 17851765599934 | 17851765602108 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7fe2d414d900 | 0x7fe2c7e24180 | 524288 | 11494634 | 1287368864 | 17851765632697 | 17851765599934 | 17851765988574 | 17851765990788 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7fe2d414d780 | 0x7fe2c7e241c0 | 524288 | 11287982 | 1264243188 | 17851766020358 | 17851765988574 | 17851766334655 | 17851766337010 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7fe2d414d600 | 0x7fe2c7e24200 | 524288 | 11023054 | 1234642988 | 17851766367699 | 17851766334655 | 17851766641056 | 17851766643422 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7fe2d67ec480 | 0x7fe2c7e24240 | 524288 | 11244797 | 1259455848 | 17851766682701 | 17851766641056 | 17851766954976 | 17851766957234 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7fe2d67ec300 | 0x7fe2c7e24280 | 524288 | 11510571 | 1289156640 | 17851766990564 | 17851766954976 | 17851767331937 | 17851767333595 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7fe2d67ec180 | 0x7fe2c7e242c0 | 524288 | 11447156 | 1282083652 | 17851767364564 | 17851767331937 | 17851767690497 | 17851767692186 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7fe2d67ec000 | 0x7fe2c7e24300 | 524288 | 11276589 | 1263015848 | 17851767723665 | 17851767690497 | 17851767963778 | 17851767965349 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7fe2d414de80 | 0x7fe2c7e24340 | 524288 | 10903637 | 1221189884 | 17851767996329 | 17851767963778 | 17851768237058 | 17851768238773 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7fe2d414dd00 | 0x7fe2c7e24380 | 524288 | 11051283 | 1237706736 | 17851768276892 | 17851768237058 | 17851768510659 | 17851768512396 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7fe2d414db80 | 0x7fe2c7e243c0 | 524288 | 11567105 | 1295514892 | 17851768543615 | 17851768510659 | 17851768871299 | 17851768873267 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7fe2d414da00 | 0x7fe2c7e24400 | 524288 | 11440192 | 1281276188 | 17851768903966 | 17851768871299 | 17851769237540 | 17851769239258 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7fe2d414d880 | 0x7fe2c7e24440 | 524288 | 11218351 | 1256413152 | 17851769269957 | 17851769237540 | 17851769511780 | 17851769513491 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7fe2d414d700 | 0x7fe2c7e24480 | 524288 | 10893140 | 1220038764 | 17851769544010 | 17851769511780 | 17851769786981 | 17851769788744 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7fe2d67ec580 | 0x7fe2c7e244c0 | 524288 | 11184468 | 1252652572 | 17851769827593 | 17851769786981 | 17851770067781 | 17851770069447 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7fe2d67ec400 | 0x7fe2c7e24500 | 524288 | 11405712 | 1277359184 | 17851770101856 | 17851770067781 | 17851770434982 | 17851770436678 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7fe2d67ec280 | 0x7fe2c7e24540 | 524288 | 11384947 | 1275100984 | 17851770467807 | 17851770434982 | 17851770798343 | 17851770800169 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7fe2d67ec100 | 0x7fe2c7e24580 | 524288 | 11239872 | 1258881312 | 17851770831338 | 17851770798343 | 17851771073223 | 17851771074972 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7fe2d414df80 | 0x7fe2c7e245c0 | 524288 | 10799987 | 1209563668 | 17851771105501 | 17851771073223 | 17851771344744 | 17851771346485 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7fe2d414de00 | 0x7fe2c7e24600 | 524288 | 11131170 | 1246673252 | 17851771384385 | 17851771344744 | 17851771619144 | 17851771620859 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7fe2d414dc80 | 0x7fe2c7e24640 | 524288 | 11467964 | 1284374572 | 17851771652478 | 17851771619144 | 17851771986025 | 17851771987720 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7fe2d414db00 | 0x7fe2c7e24680 | 524288 | 11240089 | 1258865168 | 17851772018959 | 17851771986025 | 17851772349385 | 17851772351110 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7fe2d414d980 | 0x7fe2c7e246c0 | 524288 | 11111679 | 1244473400 | 17851772381930 | 17851772349385 | 17851772624266 | 17851772626054 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7fe2d414d800 | 0x7fe2c7e24700 | 524288 | 10752960 | 1204236396 | 17851772656993 | 17851772624266 | 17851772900906 | 17851772902707 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7fe2d414d680 | 0x7fe2c7e24740 | 524288 | 11148981 | 1248709068 | 17851772941226 | 17851772900906 | 17851773176907 | 17851773178670 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7fe2d67ec500 | 0x7fe2c7e24780 | 524288 | 11424600 | 1279548008 | 17851773209649 | 17851773176907 | 17851773539627 | 17851773541161 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7fe2d67ec380 | 0x7fe2c7e247c0 | 524288 | 11391928 | 1275859604 | 17851773572850 | 17851773539627 | 17851773903308 | 17851773905072 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7fe2d67ec200 | 0x7fe2c7e24800 | 524288 | 10688825 | 1197121120 | 17851773936171 | 17851773903308 | 17851774175948 | 17851774177675 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7fe2d67ec080 | 0x7fe2c7e24840 | 524288 | 10142263 | 1135919060 | 17851774209724 | 17851774175948 | 17851774455789 | 17851774457488 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7fe2d414df00 | 0x7fe2c7e24880 | 524288 | 10949440 | 1226295444 | 17851774496357 | 17851774455789 | 17851774742829 | 17851774744601 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7fe2d414dd80 | 0x7fe2c7e248c0 | 524288 | 11379921 | 1274545880 | 17851774774940 | 17851774742829 | 17851775110510 | 17851775112212 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7fe2d414dc00 | 0x7fe2c7e24900 | 524288 | 11416790 | 1278677352 | 17851775143441 | 17851775110510 | 17851775471951 | 17851775473633 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7fe2d414da80 | 0x7fe2c7e24940 | 524288 | 10352192 | 1159389384 | 17851775504362 | 17851775471951 | 17851775746831 | 17851775748466 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7fe2d414d900 | 0x7fe2c7e24980 | 524288 | 9913960 | 1110386536 | 17851775779665 | 17851775746831 | 17851776020432 | 17851776022119 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7fe2d414d780 | 0x7fe2c7e249c0 | 524288 | 10513747 | 1177552012 | 17851776060108 | 17851776020432 | 17851776296912 | 17851776298582 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7fe2d414d600 | 0x7fe2c7e24a00 | 524288 | 11381922 | 1274753504 | 17851776329492 | 17851776296912 | 17851776657713 | 17851776659383 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7fe2d67ec480 | 0x7fe2c7e24a40 | 524288 | 11333933 | 1269382580 | 17851776690293 | 17851776657713 | 17851777015633 | 17851777017335 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7fe2d67ec300 | 0x7fe2c7e24a80 | 524288 | 10580465 | 1185002716 | 17851777048404 | 17851777015633 | 17851777289234 | 17851777290928 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7fe2d67ec180 | 0x7fe2c7e24ac0 | 524288 | 9199320 | 1030329784 | 17851777322447 | 17851777289234 | 17851777571314 | 17851777572971 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7fe2d67ec000 | 0x7fe2c7e24b00 | 524288 | 10586783 | 1185637180 | 17851777611420 | 17851777571314 | 17851777859635 | 17851777861264 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7fe2d414de80 | 0x7fe2c7e24b40 | 524288 | 11290441 | 1264513584 | 17851777892063 | 17851777859635 | 17851778228755 | 17851778230584 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7fe2d414dd00 | 0x7fe2c7e24b80 | 524288 | 11333004 | 1269285372 | 17851778262294 | 17851778228755 | 17851778596116 | 17851778597795 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7fe2d414db80 | 0x7fe2c7e24bc0 | 524288 | 10333600 | 1157349612 | 17851778628455 | 17851778596116 | 17851778872916 | 17851778874719 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7fe2d414da00 | 0x7fe2c7e24c00 | 524288 | 7758862 | 868986468 | 17851778905648 | 17851778872916 | 17851779148117 | 17851779149842 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7fe2d414d880 | 0x7fe2c7e24c40 | 524288 | 10751011 | 1204055656 | 17851779187561 | 17851779148117 | 17851779424917 | 17851779426605 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7fe2d414d700 | 0x7fe2c7e24c80 | 524288 | 11359499 | 1272250716 | 17851779457324 | 17851779424917 | 17851779788118 | 17851779789916 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7fe2d67ec580 | 0x7fe2c7e24cc0 | 524288 | 11359245 | 1272205808 | 17851779820985 | 17851779788118 | 17851780151639 | 17851780153257 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7fe2d67ec400 | 0x7fe2c7e24d00 | 524288 | 10233865 | 1146208680 | 17851780183876 | 17851780151639 | 17851780432279 | 17851780434060 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7fe2d67ec280 | 0x7fe2c7e24d40 | 524288 | 6790915 | 760638956 | 17851780466599 | 17851780432279 | 17851780715160 | 17851780716753 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7fe2d67ec100 | 0x7fe2c7e24d80 | 524288 | 10722907 | 1200890196 | 17851780755482 | 17851780715160 | 17851780993400 | 17851780994976 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7fe2d414df80 | 0x7fe2c7e24dc0 | 524288 | 11235953 | 1258389508 | 17851781026845 | 17851780993400 | 17851781354361 | 17851781356027 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7fe2d414de00 | 0x7fe2c7e24e00 | 524288 | 11251763 | 1260196968 | 17851781387597 | 17851781354361 | 17851781716601 | 17851781718348 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7fe2d414dc80 | 0x7fe2c7e24e40 | 524288 | 10603428 | 1187614532 | 17851781749108 | 17851781716601 | 17851781993562 | 17851781995242 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7fe2d414db00 | 0x7fe2c7e24e80 | 524288 | 5736171 | 642479920 | 17851782026071 | 17851781993562 | 17851782284602 | 17851782286414 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7fe2d414d980 | 0x7fe2c7e24ec0 | 524288 | 10761174 | 1205159824 | 17851782324253 | 17851782284602 | 17851782562523 | 17851782564147 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7fe2d414d800 | 0x7fe2c7e24f00 | 524288 | 11277622 | 1263104348 | 17851782596237 | 17851782562523 | 17851782924923 | 17851782926658 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7fe2d414d680 | 0x7fe2c7e24f40 | 524288 | 11403554 | 1277177012 | 17851782958358 | 17851782924923 | 17851783294044 | 17851783295759 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7fe2d67ec500 | 0x7fe2c7e24f80 | 524288 | 9971998 | 1116839528 | 17851783326518 | 17851783294044 | 17851783572605 | 17851783574332 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7fe2d67ec380 | 0x7fe2c7e24fc0 | 524288 | 4788676 | 536323888 | 17851783605412 | 17851783572605 | 17851783862525 | 17851783864245 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7fe2d67ec200 | 0x7fe2c7e25000 | 524288 | 10496241 | 1175548992 | 17851783902714 | 17851783862525 | 17851784138365 | 17851784140138 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7fe2d67ec080 | 0x7fe2c7e25040 | 524288 | 11254474 | 1260459736 | 17851784171147 | 17851784138365 | 17851784500446 | 17851784502099 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7fe2d414df00 | 0x7fe2c7e25080 | 524288 | 11308943 | 1266564232 | 17851784534368 | 17851784500446 | 17851784865247 | 17851784866980 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7fe2d414dd80 | 0x7fe2c7e250c0 | 524288 | 9969059 | 1116531716 | 17851784897639 | 17851784865247 | 17851785139647 | 17851785141433 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7fe2d414dc00 | 0x7fe2c7e25100 | 524288 | 4101249 | 459292572 | 17851785172763 | 17851785139647 | 17851785435168 | 17851785436936 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7fe2d414da80 | 0x7fe2c7e25140 | 524288 | 10552160 | 1181829580 | 17851785487385 | 17851785435168 | 17851785716928 | 17851785718719 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7fe2d414d900 | 0x7fe2c7e25180 | 524288 | 11311011 | 1266806536 | 17851785749208 | 17851785716928 | 17851786084129 | 17851786085730 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7fe2d414d780 | 0x7fe2c7e251c0 | 524288 | 11219564 | 1256568920 | 17851786117729 | 17851786084129 | 17851786457889 | 17851786459631 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7fe2d414d600 | 0x7fe2c7e25200 | 524288 | 9820308 | 1099748564 | 17851786490400 | 17851786457889 | 17851786735490 | 17851786737154 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7fe2d67ec480 | 0x7fe2c7e25240 | 524288 | 3671648 | 411187864 | 17851786768093 | 17851786735490 | 17851787037890 | 17851787039626 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7fe2d67ec300 | 0x7fe2c7e25280 | 524288 | 10077664 | 1128706364 | 17851787077675 | 17851787037890 | 17851787315331 | 17851787316989 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7fe2d67ec180 | 0x7fe2c7e252c0 | 524288 | 11126647 | 1246159484 | 17851787348009 | 17851787315331 | 17851787674692 | 17851787676360 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7fe2d67ec000 | 0x7fe2c7e25300 | 524288 | 11153488 | 1249170388 | 17851787708170 | 17851787674692 | 17851788032292 | 17851788034032 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7fe2d414de80 | 0x7fe2c7e25340 | 524288 | 8941596 | 1001449384 | 17851788064441 | 17851788032292 | 17851788306853 | 17851788308635 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7fe2d414dd00 | 0x7fe2c7e25380 | 524288 | 3497243 | 391708692 | 17851788339414 | 17851788306853 | 17851788613413 | 17851788614977 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7fe2d414db80 | 0x7fe2c7e253c0 | 524288 | 9670492 | 1083108004 | 17851788652536 | 17851788613413 | 17851788896934 | 17851788898650 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7fe2d414da00 | 0x7fe2c7e25400 | 524288 | 11021697 | 1234414332 | 17851788930049 | 17851788896934 | 17851789261734 | 17851789263381 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7fe2d414d880 | 0x7fe2c7e25440 | 524288 | 11132126 | 1246798012 | 17851789294310 | 17851789261734 | 17851789621895 | 17851789623662 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7fe2d414d700 | 0x7fe2c7e25480 | 524288 | 8689261 | 973198924 | 17851789653931 | 17851789621895 | 17851789898375 | 17851789900145 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7fe2d67ec580 | 0x7fe2c7e254c0 | 524288 | 3296359 | 369169100 | 17851789930734 | 17851789898375 | 17851790211816 | 17851790213657 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7fe2d67ec400 | 0x7fe2c7e25500 | 524288 | 10037455 | 1124195284 | 17851790252606 | 17851790211816 | 17851790489256 | 17851790491010 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7fe2d67ec280 | 0x7fe2c7e25540 | 524288 | 11174234 | 1251471072 | 17851790521940 | 17851790489256 | 17851790848457 | 17851790850182 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7fe2d67ec100 | 0x7fe2c7e25580 | 524288 | 11156391 | 1249494572 | 17851790881871 | 17851790848457 | 17851791213898 | 17851791215562 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7fe2d414df80 | 0x7fe2c7e255c0 | 524288 | 8453395 | 946749724 | 17851791246402 | 17851791213898 | 17851791491658 | 17851791493396 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7fe2d414de00 | 0x7fe2c7e25600 | 524288 | 3024996 | 338796148 | 17851791524785 | 17851791491658 | 17851791816619 | 17851791818288 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7fe2d414dc80 | 0x7fe2c7e25640 | 524288 | 9898403 | 1108578380 | 17851791856967 | 17851791816619 | 17851792098539 | 17851792100221 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7fe2d414db00 | 0x7fe2c7e25680 | 524288 | 11104075 | 1243642512 | 17851792131210 | 17851792098539 | 17851792457420 | 17851792459142 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7fe2d414d980 | 0x7fe2c7e256c0 | 524288 | 11097123 | 1242879504 | 17851792489141 | 17851792457420 | 17851792817900 | 17851792819553 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7fe2d414d800 | 0x7fe2c7e25700 | 524288 | 7310378 | 818624588 | 17851792849692 | 17851792817900 | 17851793096141 | 17851793097826 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7fe2d414d680 | 0x7fe2c7e25740 | 524288 | 2941237 | 329425624 | 17851793128535 | 17851793096141 | 17851793421421 | 17851793423188 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7fe2d67ec500 | 0x7fe2c7e25780 | 524288 | 9559653 | 1070725500 | 17851793461137 | 17851793421421 | 17851793695662 | 17851793697541 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7fe2d67ec380 | 0x7fe2c7e257c0 | 524288 | 11023374 | 1234615968 | 17851793727930 | 17851793695662 | 17851794053262 | 17851794055012 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7fe2d67ec200 | 0x7fe2c7e25800 | 524288 | 11082656 | 1241258564 | 17851794092211 | 17851794053262 | 17851794431823 | 17851794433593 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7fe2d67ec080 | 0x7fe2c7e25840 | 524288 | 6353255 | 711593988 | 17851794464132 | 17851794431823 | 17851794712304 | 17851794713966 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7fe2d414df00 | 0x7fe2c7e25880 | 524288 | 2939088 | 329191932 | 17851794744745 | 17851794712304 | 17851795055664 | 17851795057367 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7fe2d414dd80 | 0x7fe2c7e258c0 | 524288 | 8674328 | 971491172 | 17851795096216 | 17851795055664 | 17851795333105 | 17851795334710 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7fe2d414dc00 | 0x7fe2c7e25900 | 524288 | 10772675 | 1206512204 | 17851795365530 | 17851795333105 | 17851795695185 | 17851795696821 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7fe2d414da80 | 0x7fe2c7e25940 | 524288 | 10815365 | 1211244236 | 17851795728621 | 17851795695185 | 17851796056626 | 17851796058483 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7fe2d414d900 | 0x7fe2c7e25980 | 524288 | 5008411 | 560934772 | 17851796088352 | 17851796056626 | 17851796340466 | 17851796342176 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7fe2d414d780 | 0x7fe2c7e259c0 | 524288 | 2860023 | 320346980 | 17851796373065 | 17851796340466 | 17851796691027 | 17851796692677 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7fe2d414d600 | 0x7fe2c7e25a00 | 524288 | 6975002 | 781170540 | 17851796731096 | 17851796691027 | 17851796968787 | 17851796970440 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7fe2d67ec480 | 0x7fe2c7e25a40 | 524288 | 10836988 | 1213716384 | 17851797001379 | 17851796968787 | 17851797330868 | 17851797332751 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7fe2d67ec300 | 0x7fe2c7e25a80 | 524288 | 10812264 | 1210981884 | 17851797363950 | 17851797330868 | 17851797699349 | 17851797701022 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7fe2d67ec180 | 0x7fe2c7e25ac0 | 524288 | 3932869 | 440446248 | 17851797731601 | 17851797699349 | 17851797996469 | 17851797998205 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7fe2d67ec000 | 0x7fe2c7e25b00 | 524288 | 2846565 | 318818040 | 17851798029344 | 17851797996469 | 17851798366710 | 17851798368385 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7fe2d414de80 | 0x7fe2c7e25b40 | 524288 | 5834515 | 653448932 | 17851798406914 | 17851798366710 | 17851798658070 | 17851798659808 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7fe2d414dd00 | 0x7fe2c7e25b80 | 524288 | 10823083 | 1212141256 | 17851798690347 | 17851798658070 | 17851799020311 | 17851799022009 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7fe2d414db80 | 0x7fe2c7e25bc0 | 524288 | 10796310 | 1209189816 | 17851799053408 | 17851799020311 | 17851799383512 | 17851799385260 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7fe2d414da00 | 0x7fe2c7e25c00 | 524288 | 3807149 | 426378124 | 17851799416469 | 17851799383512 | 17851799687192 | 17851799688903 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7fe2d414d880 | 0x7fe2c7e25c40 | 524288 | 2876568 | 322203864 | 17851799719172 | 17851799687192 | 17851800076153 | 17851800121672 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7fe2d414d700 | 0x7fe2c7e25c80 | 524288 | 4400559 | 492855256 | 17851800141391 | 17851800076153 | 17851800403993 | 17851800405705 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7fe2d67ec580 | 0x7fe2c7e25cc0 | 524288 | 10574190 | 1184279480 | 17851800437434 | 17851800403993 | 17851800769434 | 17851800771206 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7fe2d67ec400 | 0x7fe2c7e25d00 | 524288 | 9756056 | 1092609072 | 17851800803335 | 17851800769434 | 17851801141275 | 17851801142977 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7fe2d67ec280 | 0x7fe2c7e25d40 | 524288 | 2937151 | 328969808 | 17851801174356 | 17851801141275 | 17851801460635 | 17851801462349 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7fe2d67ec100 | 0x7fe2c7e25d80 | 524288 | 2885783 | 323165516 | 17851801493368 | 17851801460635 | 17851801877596 | 17851801898488 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7fe2d414df80 | 0x7fe2c7e25dc0 | 524288 | 3062370 | 343015688 | 17851801918537 | 17851801877596 | 17851802207196 | 17851802209040 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7fe2d414de00 | 0x7fe2c7e25e00 | 524288 | 7965851 | 892150972 | 17851802241089 | 17851802207196 | 17851802586877 | 17851802634739 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7fe2d414dc80 | 0x7fe2c7e25e40 | 524288 | 7295385 | 817165120 | 17851802647099 | 17851802586877 | 17851803000478 | 17851803045659 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7fe2d414db00 | 0x7fe2c7e25e80 | 524288 | 2808501 | 314562680 | 17851803057569 | 17851803000478 | 17851803378718 | 17851803380351 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7fe2d414d980 | 0x7fe2c7e25ec0 | 524288 | 2834429 | 317413852 | 17851803410380 | 17851803378718 | 17851803844639 | 17851803889878 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7fe2d414d800 | 0x7fe2c7e25f00 | 524288 | 2829364 | 316816148 | 17851803909458 | 17851803844639 | 17851804211040 | 17851804212750 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7fe2d414d680 | 0x7fe2c7e25f40 | 524288 | 7156252 | 801412676 | 17851804244429 | 17851804211040 | 17851804606400 | 17851804648529 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7fe2d67ec500 | 0x7fe2c7e25f80 | 524288 | 6546543 | 733169316 | 17851804661659 | 17851804606400 | 17851805024321 | 17851805066159 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7fe2d67ec380 | 0x7fe2c7e25fc0 | 524288 | 2782400 | 311622300 | 17851805077389 | 17851805024321 | 17851805419362 | 17851805421170 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7fe2d67ec200 | 0x7fe2c7e26000 | 524288 | 2897542 | 324507732 | 17851805452989 | 17851805419362 | 17851805937923 | 17851805958267 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7fe2d67ec080 | 0x7fe2c7e26040 | 524288 | 2758709 | 309008928 | 17851805978236 | 17851805937923 | 17851806302243 | 17851806304268 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7fe2d414df00 | 0x7fe2c7e26080 | 524288 | 5361502 | 600451100 | 17851806335168 | 17851806302243 | 17851806715684 | 17851806759087 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7fe2d414dd80 | 0x7fe2c7e260c0 | 524288 | 5241560 | 587040032 | 17851806772477 | 17851806715684 | 17851807162405 | 17851807206206 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7fe2d414dc00 | 0x7fe2c7e26100 | 524288 | 2719578 | 304632596 | 17851807218236 | 17851807162405 | 17851807586246 | 17851807627715 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7fe2d414da80 | 0x7fe2c7e26140 | 524288 | 2929353 | 328060908 | 17851807640425 | 17851807586246 | 17851808183207 | 17851808224711 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7fe2d414d900 | 0x7fe2c7e26180 | 524288 | 2798443 | 313443644 | 17851808244280 | 17851808183207 | 17851808586727 | 17851808588512 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7fe2d414d780 | 0x7fe2c7e261c0 | 524288 | 5198688 | 582256312 | 17851808619471 | 17851808586727 | 17851809020488 | 17851809062250 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7fe2d414d600 | 0x7fe2c7e26200 | 524288 | 3227946 | 361493392 | 17851809075529 | 17851809020488 | 17851809479849 | 17851809522538 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7fe2d67ec480 | 0x7fe2c7e26240 | 524288 | 2765869 | 309719692 | 17851809534718 | 17851809479849 | 17851809928650 | 17851809947908 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7fe2d67ec300 | 0x7fe2c7e26280 | 524288 | 2372030 | 265583500 | 17851809961547 | 17851809928650 | 17851810579051 | 17851810623291 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7fe2d67ec180 | 0x7fe2c7e262c0 | 524288 | 2780688 | 311398384 | 17851810643791 | 17851810579051 | 17851811023211 | 17851811067380 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7fe2d67ec000 | 0x7fe2c7e26300 | 524288 | 3273190 | 366588524 | 17851811079870 | 17851811023211 | 17851811539532 | 17851811581427 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7fe2d414de80 | 0x7fe2c7e26340 | 524288 | 3706436 | 415100620 | 17851811593917 | 17851811539532 | 17851812051693 | 17851812094375 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7fe2d414dd00 | 0x7fe2c7e26380 | 524288 | 2392570 | 267988172 | 17851812106724 | 17851812051693 | 17851812564014 | 17851812605892 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7fe2d414db80 | 0x7fe2c7e263c0 | 524288 | 2380155 | 266528932 | 17851812617972 | 17851812564014 | 17851813336815 | 17851813378153 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7fe2d414da00 | 0x7fe2c7e26400 | 524288 | 2651241 | 296869496 | 17851813398483 | 17851813336815 | 17851813813936 | 17851813832062 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7fe2d414d880 | 0x7fe2c7e26440 | 524288 | 3358527 | 376130448 | 17851813847012 | 17851813813936 | 17851814349137 | 17851814394698 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7fe2d414d700 | 0x7fe2c7e26480 | 524288 | 3595083 | 402577832 | 17851814407058 | 17851814349137 | 17851814926578 | 17851814972024 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7fe2d67ec580 | 0x7fe2c7e264c0 | 524288 | 2398306 | 268633068 | 17851814983683 | 17851814926578 | 17851815496819 | 17851815538310 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7fe2d67ec400 | 0x7fe2c7e26500 | 524288 | 2389962 | 267666172 | 17851815550579 | 17851815496819 | 17851816367541 | 17851816409418 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7fe2d67ec280 | 0x7fe2c7e26540 | 524288 | 2388205 | 267475364 | 17851816429357 | 17851816367541 | 17851817028342 | 17851817069932 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7fe2d67ec100 | 0x7fe2c7e26580 | 524288 | 2579021 | 288843416 | 17851817081861 | 17851817028342 | 17851817710423 | 17851817752365 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7fe2d414df80 | 0x7fe2c7e265c0 | 524288 | 2592302 | 290292660 | 17851817764284 | 17851817710423 | 17851818386584 | 17851818432168 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7fe2d414de00 | 0x7fe2c7e26600 | 524288 | 2392252 | 267948208 | 17851818443947 | 17851818386584 | 17851819065625 | 17851819114581 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7fe2d414dc80 | 0x7fe2c7e26640 | 524288 | 2411106 | 269994500 | 17851819127690 | 17851819065625 | 17851820154427 | 17851820200824 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7fe2d414db00 | 0x7fe2c7e26680 | 524288 | 2438201 | 273086344 | 17851820221473 | 17851820154085 | 17851821239526 | 17851821308076 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7fe2d414d980 | 0x7fe2c7e266c0 | 524288 | 2595984 | 290719540 | 17851821320076 | 17851821239526 | 17851822378407 | 17851822445038 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7fe2d414d800 | 0x7fe2c7e26700 | 524288 | 2597137 | 290863004 | 17851822458078 | 17851822378407 | 17851823516328 | 17851823583740 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7fe2d414d680 | 0x7fe2c7e26740 | 524288 | 2428844 | 272065092 | 17851823596109 | 17851823516328 | 17851824627689 | 17851824694792 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7fe2d67ec500 | 0x7fe2c7e26780 | 524288 | 2466156 | 276132408 | 17851824706782 | 17851824627689 | 17851826578251 | 17851826648574 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7fe2d67ec380 | 0x7fe2c7e267c0 | 524288 | 2464191 | 275993492 | 17851826670493 | 17851826578251 | 17851828504333 | 17851828576246 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7fe2d67ec200 | 0x7fe2c7e26800 | 524288 | 2621651 | 293624628 | 17851828588236 | 17851828504333 | 17851830489935 | 17851830560797 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7fe2d67ec080 | 0x7fe2c7e26840 | 524288 | 2626645 | 294164516 | 17851830573217 | 17851830489935 | 17851832474737 | 17851832543988 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7fe2d414df00 | 0x7fe2c7e26880 | 524288 | 2455750 | 275010384 | 17851832555917 | 17851832474737 | 17851834403859 | 17851834473550 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 238129 | 238129 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7fe2d414dd80 | 0x7fe2c7e268c0 | 524288 | 2496448 | 279555072 | 17851834487209 | 17851834403859 | 17851838027063 | 17851838150278 |