40 KiB
40 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | SQ_INSTS_LDS | SQ_INST_LEVEL_LDS | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBuffer.kd | 0 | 0 | 0 | 921341 | 921346 | 33554432 | 256 | 0 | 0 | 8 | 32 | 6464 | 0x0 | 0x7f75c7a04180 | 0 | 0 | 0 | 12076325872059438 | 12076326117604157 | 12076326117928636 | 12076326118038409 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 921341 | 921346 | 32768 | 256 | 0 | 0 | 24 | 24 | 12480 | 0x0 | 0x7f75c7a35100 | 0 | 0 | 0 | 12076326132896351 | 12076326133202573 | 12076326133209293 | 12076326133221776 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 4 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 12928 | 0x7f76f7c91900 | 0x7f75c7a35140 | 0 | 0 | 0 | 12076326133274564 | 12076326133491052 | 12076326133626091 | 12076326133629754 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 6 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 36 | 24 | 13632 | 0x7f76f7c91800 | 0x7f75c7a35180 | 0 | 0 | 0 | 12076326133699504 | 12076326133869611 | 12076326134124969 | 12076326134193793 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 8 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 14080 | 0x7f76f7c91700 | 0x7f75c7a351c0 | 0 | 0 | 0 | 12076326134229669 | 12076326134417768 | 12076326134668807 | 12076326134734778 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 10 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14528 | 0x7f76f7c91600 | 0x7f75c7a35200 | 0 | 0 | 0 | 12076326134761488 | 12076326134943046 | 12076326135084326 | 12076326135088125 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 12 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14976 | 0x7f76f7c91500 | 0x7f75c7a35240 | 0 | 0 | 0 | 12076326135137296 | 12076326135308805 | 12076326135447684 | 12076326135451039 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 14 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 15424 | 0x7f76f7c91400 | 0x7f75c7a35280 | 0 | 0 | 0 | 12076326135529615 | 12076326135693283 | 12076326135823523 | 12076326135826828 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 16 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16128 | 0x7f76f7c91300 | 0x7f75c7a352c0 | 0 | 0 | 0 | 12076326135877061 | 12076326136052322 | 12076326136308321 | 12076326136350471 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 18 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16832 | 0x7f76f7c91a00 | 0x7f75c7a35300 | 0 | 0 | 0 | 12076326136373504 | 12076326136557760 | 12076326136809439 | 12076326136850119 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 20 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 17536 | 0x7f76f7c91900 | 0x7f75c7a35340 | 0 | 0 | 0 | 12076326136873052 | 12076326137072958 | 12076326137201597 | 12076326137205129 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 22 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18240 | 0x7f76f7c91800 | 0x7f75c7a35380 | 0 | 0 | 0 | 12076326137255543 | 12076326137421276 | 12076326137559996 | 12076326137563184 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 24 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18944 | 0x7f76f7c91700 | 0x7f75c7a353c0 | 0 | 0 | 0 | 12076326137624148 | 12076326137790715 | 12076326137921754 | 12076326137925097 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 26 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 19904 | 0x7f76f7c91600 | 0x7f75c7a35400 | 0 | 0 | 0 | 12076326137973447 | 12076326138156953 | 12076326138407512 | 12076326138474969 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 28 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 20608 | 0x7f76f7c91500 | 0x7f75c7a35440 | 0 | 0 | 0 | 12076326138502099 | 12076326138682231 | 12076326138940150 | 12076326139012418 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 30 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 21312 | 0x7f76f7c91400 | 0x7f75c7a35480 | 0 | 0 | 0 | 12076326139040530 | 12076326139219029 | 12076326139348148 | 12076326139351418 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 32 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22016 | 0x7f76f7c91300 | 0x7f75c7a354c0 | 0 | 0 | 0 | 12076326139399668 | 12076326139562388 | 12076326139700147 | 12076326139703232 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 34 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22720 | 0x7f76f7c91a00 | 0x7f75c7a35500 | 0 | 0 | 0 | 12076326139764726 | 12076326139928146 | 12076326140060785 | 12076326140064122 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 36 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 23680 | 0x7f76f7c91900 | 0x7f75c7a35540 | 0 | 0 | 0 | 12076326140114366 | 12076326140288625 | 12076326140550864 | 12076326140616379 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 38 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 24384 | 0x7f76f7c91800 | 0x7f75c7a35580 | 0 | 0 | 0 | 12076326140639492 | 12076326140822702 | 12076326141111821 | 12076326141182581 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 40 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25088 | 0x7f76f7c91700 | 0x7f75c7a355c0 | 0 | 0 | 0 | 12076326141207337 | 12076326141389420 | 12076326141516460 | 12076326141519838 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 42 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25792 | 0x7f76f7c91600 | 0x7f75c7a35600 | 0 | 0 | 0 | 12076326141568368 | 12076326141731179 | 12076326141871658 | 12076326141875108 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 44 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 26496 | 0x7f76f7c91500 | 0x7f75c7a35640 | 0 | 0 | 0 | 12076326141936562 | 12076326142112777 | 12076326142246537 | 12076326142250055 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 46 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 27712 | 0x7f76f7c91400 | 0x7f75c7a35680 | 0 | 0 | 0 | 12076326142299296 | 12076326142468296 | 12076326142724135 | 12076326142790660 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 48 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 28416 | 0x7f76f7c91300 | 0x7f75c7a356c0 | 0 | 0 | 0 | 12076326142816928 | 12076326142994854 | 12076326143250053 | 12076326143316437 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 50 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 29120 | 0x7f76f7c91a00 | 0x7f75c7a35700 | 0 | 0 | 0 | 12076326143342956 | 12076326143518212 | 12076326143645091 | 12076326143648664 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 52 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30080 | 0x7f76f7c91900 | 0x7f75c7a35740 | 0 | 0 | 0 | 12076326143698056 | 12076326143859650 | 12076326143998050 | 12076326144004806 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 54 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30784 | 0x7f76f7c91800 | 0x7f75c7a35780 | 0 | 0 | 0 | 12076326144061822 | 12076326144224289 | 12076326144352608 | 12076326144355939 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 56 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32000 | 0x7f76f7c91700 | 0x7f75c7a357c0 | 0 | 0 | 0 | 12076326144405230 | 12076326144574687 | 12076326144832766 | 12076326144898166 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 58 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32960 | 0x7f76f7c91600 | 0x7f75c7a35800 | 0 | 0 | 0 | 12076326144921770 | 12076326145106525 | 12076326145363004 | 12076326145430646 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 60 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 33920 | 0x7f76f7c91500 | 0x7f75c7a35840 | 0 | 0 | 0 | 12076326145457255 | 12076326145633403 | 12076326145769402 | 12076326145772661 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 62 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 34880 | 0x7f76f7c91400 | 0x7f75c7a35880 | 0 | 0 | 0 | 12076326145820711 | 12076326145989082 | 12076326146129241 | 12076326146132931 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 64 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 35840 | 0x7f76f7c91300 | 0x7f75c7a358c0 | 0 | 0 | 0 | 12076326146194425 | 12076326146359800 | 12076326146493239 | 12076326146496587 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 66 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 37312 | 0x7f76f7c91a00 | 0x7f75c7a35900 | 0 | 0 | 0 | 12076326146544316 | 12076326146711159 | 12076326146970678 | 12076326147037602 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 68 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 38272 | 0x7f76f7c91900 | 0x7f75c7a35940 | 0 | 0 | 0 | 12076326147064472 | 12076326147244756 | 12076326147498835 | 12076326147564652 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 70 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 39232 | 0x7f76f7c91800 | 0x7f75c7a35980 | 0 | 0 | 0 | 12076326147590159 | 12076326147767794 | 12076326147905394 | 12076326147908631 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 72 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 40192 | 0x7f76f7c91700 | 0x7f75c7a359c0 | 0 | 0 | 0 | 12076326147957392 | 12076326148124433 | 12076326148257552 | 12076326148261036 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 74 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 41152 | 0x7f76f7c91600 | 0x7f75c7a35a00 | 0 | 0 | 0 | 12076326148323743 | 12076326148487631 | 12076326148620911 | 12076326148624111 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 76 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 42624 | 0x7f76f7c91500 | 0x7f75c7a35a40 | 0 | 0 | 0 | 12076326148673733 | 12076326148851470 | 12076326149116749 | 12076326149187508 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 78 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 43584 | 0x7f76f7c91400 | 0x7f75c7a35a80 | 0 | 0 | 0 | 12076326149215590 | 12076326149390508 | 12076326149650027 | 12076326149716060 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 80 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 44544 | 0x7f76f7c91300 | 0x7f75c7a35ac0 | 0 | 0 | 0 | 12076326149737961 | 12076326149917386 | 12076326150051465 | 12076326150055281 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 82 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 45760 | 0x7f76f7c91a00 | 0x7f75c7a35b00 | 0 | 0 | 0 | 12076326150105654 | 12076326150268744 | 12076326150406664 | 12076326150410030 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 84 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 46720 | 0x7f76f7c91900 | 0x7f75c7a35b40 | 0 | 0 | 0 | 12076326150470733 | 12076326150631303 | 12076326150762182 | 12076326150765260 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 86 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 48448 | 0x7f76f7c91800 | 0x7f75c7a35b80 | 0 | 0 | 0 | 12076326150813239 | 12076326150972101 | 12076326151240580 | 12076326151309261 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 88 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 49408 | 0x7f76f7c91700 | 0x7f75c7a35bc0 | 0 | 0 | 0 | 12076326151331823 | 12076326151511779 | 12076326151769538 | 12076326151834457 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 90 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 50368 | 0x7f76f7c91600 | 0x7f75c7a35c00 | 0 | 0 | 0 | 12076326151859934 | 12076326152040897 | 12076326152174977 | 12076326152178847 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 92 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 51584 | 0x7f76f7c91500 | 0x7f75c7a35c40 | 0 | 0 | 0 | 12076326152227087 | 12076326152396736 | 12076326152539615 | 12076326152543194 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 94 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 52544 | 0x7f76f7c91400 | 0x7f75c7a35c80 | 0 | 0 | 0 | 12076326152602434 | 12076326152762654 | 12076326152898654 | 12076326152901921 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 96 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 54272 | 0x7f76f7c91300 | 0x7f75c7a35cc0 | 0 | 0 | 0 | 12076326152951092 | 12076326153130013 | 12076326153401212 | 12076326153469927 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 98 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 55488 | 0x7f76f7c91a00 | 0x7f75c7a35d00 | 0 | 0 | 0 | 12076326153493110 | 12076326153677050 | 12076326153933849 | 12076326154005251 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 100 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 56704 | 0x7f76f7c91900 | 0x7f75c7a35d40 | 0 | 0 | 0 | 12076326154030138 | 12076326154208248 | 12076326154341688 | 12076326154344853 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 102 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 58176 | 0x7f76f7c91800 | 0x7f75c7a35d80 | 0 | 0 | 0 | 12076326154395607 | 12076326154553687 | 12076326154694326 | 12076326154697708 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 104 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 59392 | 0x7f76f7c91700 | 0x7f75c7a35dc0 | 0 | 0 | 0 | 12076326154758101 | 12076326154917205 | 12076326155054645 | 12076326155058849 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 106 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 61376 | 0x7f76f7c91600 | 0x7f75c7a35e00 | 0 | 0 | 0 | 12076326155107029 | 12076326155275604 | 12076326155539763 | 12076326155580709 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 108 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 62592 | 0x7f76f7c91500 | 0x7f75c7a35e40 | 0 | 0 | 0 | 12076326155606617 | 12076326155780242 | 12076326156037841 | 12076326156104052 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 110 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 63808 | 0x7f76f7c91400 | 0x7f75c7a35e80 | 0 | 0 | 0 | 12076326156130281 | 12076326156309680 | 12076326156449039 | 12076326156452720 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 112 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 65280 | 0x7f76f7c91300 | 0x7f75c7a35ec0 | 0 | 0 | 0 | 12076326156502412 | 12076326156664078 | 12076326156808558 | 12076326156811677 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 114 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 66496 | 0x7f76f7c91a00 | 0x7f75c7a35f00 | 0 | 0 | 0 | 12076326156873191 | 12076326157039917 | 12076326157171436 | 12076326157175022 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 116 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 68480 | 0x7f76f7c91900 | 0x7f75c7a35f40 | 0 | 0 | 0 | 12076326157224584 | 12076326157385835 | 12076326157653674 | 12076326157694267 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 118 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 69696 | 0x7f76f7c91800 | 0x7f75c7a35f80 | 0 | 0 | 0 | 12076326157719434 | 12076326157892233 | 12076326158150312 | 12076326158217620 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 120 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 70912 | 0x7f76f7c91700 | 0x7f75c7a35fc0 | 0 | 0 | 0 | 12076326158242997 | 12076326158420391 | 12076326158554311 | 12076326158557742 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 122 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 72384 | 0x7f76f7c91600 | 0x7f75c7a36000 | 0 | 0 | 0 | 12076326158605280 | 12076326158770950 | 12076326158910309 | 12076326158913954 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 124 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 73600 | 0x7f76f7c91500 | 0x7f75c7a36040 | 0 | 0 | 0 | 12076326158974226 | 12076326159138948 | 12076326159272868 | 12076326159276448 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 126 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 75840 | 0x7f76f7c91400 | 0x7f75c7a36080 | 0 | 0 | 0 | 12076326159323255 | 12076326159495427 | 12076326159764866 | 12076326159811672 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 128 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 77056 | 0x7f76f7c91300 | 0x7f75c7a360c0 | 0 | 0 | 0 | 12076326159838242 | 12076326160012705 | 12076326160260704 | 12076326160310209 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 130 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 78272 | 0x7f76f7c91a00 | 0x7f75c7a36100 | 0 | 0 | 0 | 12076326160336428 | 12076326160511103 | 12076326160650142 | 12076326160653727 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 132 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 80000 | 0x7f76f7c91900 | 0x7f75c7a36140 | 0 | 0 | 0 | 12076326160704752 | 12076326160873181 | 12076326161017021 | 12076326161020739 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 134 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 81216 | 0x7f76f7c91800 | 0x7f75c7a36180 | 0 | 0 | 0 | 12076326161081973 | 12076326161244860 | 12076326161378299 | 12076326161381850 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 136 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 83456 | 0x7f76f7c91700 | 0x7f75c7a361c0 | 0 | 0 | 0 | 12076326161429559 | 12076326161597178 | 12076326161867737 | 12076326161889584 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 138 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 84928 | 0x7f76f7c91600 | 0x7f75c7a36200 | 0 | 0 | 0 | 12076326161931943 | 12076326162094776 | 12076326162349335 | 12076326162398099 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 140 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 86400 | 0x7f76f7c91500 | 0x7f75c7a36240 | 0 | 0 | 0 | 12076326162423236 | 12076326162599734 | 12076326162737334 | 12076326162740505 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 142 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 88128 | 0x7f76f7c91400 | 0x7f75c7a36280 | 0 | 0 | 0 | 12076326162790849 | 12076326162951253 | 12076326163102132 | 12076326163105955 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 144 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 89600 | 0x7f76f7c91300 | 0x7f75c7a362c0 | 0 | 0 | 0 | 12076326163188588 | 12076326163349171 | 12076326163480371 | 12076326163483917 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 146 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 92096 | 0x7f76f7c91a00 | 0x7f75c7a36300 | 0 | 0 | 0 | 12076326163533800 | 12076326163691890 | 12076326163957809 | 12076326164011979 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 148 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 93568 | 0x7f76f7c91900 | 0x7f75c7a36340 | 0 | 0 | 0 | 12076326164038738 | 12076326164214768 | 12076326164472527 | 12076326164519772 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 150 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 95040 | 0x7f76f7c91800 | 0x7f75c7a36380 | 0 | 0 | 0 | 12076326164543446 | 12076326164721806 | 12076326164860365 | 12076326164864002 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 152 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 96768 | 0x7f76f7c91700 | 0x7f75c7a363c0 | 0 | 0 | 0 | 12076326164914386 | 12076326165079884 | 12076326165237804 | 12076326165241544 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 154 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 98240 | 0x7f76f7c91600 | 0x7f75c7a36400 | 0 | 0 | 0 | 12076326165301735 | 12076326165462283 | 12076326165596362 | 12076326165599729 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 156 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 100736 | 0x7f76f7c91500 | 0x7f75c7a36440 | 0 | 0 | 0 | 12076326165647979 | 12076326165815561 | 12076326166082920 | 12076326166111721 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 158 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 102208 | 0x7f76f7c91400 | 0x7f75c7a36480 | 0 | 0 | 0 | 12076326166151415 | 12076326166309319 | 12076326166565638 | 12076326166590881 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 160 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 103680 | 0x7f76f7c91300 | 0x7f75c7a364c0 | 0 | 0 | 0 | 12076326166639852 | 12076326166800997 | 12076326166936197 | 12076326166939760 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 162 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 105664 | 0x7f76f7c91a00 | 0x7f75c7a36500 | 0 | 0 | 0 | 12076326166990905 | 12076326167156516 | 12076326167322595 | 12076326167326328 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 164 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 107136 | 0x7f76f7c91900 | 0x7f75c7a36540 | 0 | 0 | 0 | 12076326167387402 | 12076326167548194 | 12076326167683234 | 12076326167686868 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 166 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 109888 | 0x7f76f7c91800 | 0x7f75c7a36580 | 0 | 0 | 0 | 12076326167733485 | 12076326167898433 | 12076326168163232 | 12076326168188370 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 168 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 111360 | 0x7f76f7c91700 | 0x7f75c7a365c0 | 0 | 0 | 0 | 12076326168229276 | 12076326168390751 | 12076326168644990 | 12076326168664795 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 170 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 112832 | 0x7f76f7c91600 | 0x7f75c7a36600 | 0 | 0 | 0 | 12076326168708587 | 12076326168866749 | 12076326169008828 | 12076326169012582 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 172 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 114816 | 0x7f76f7c91500 | 0x7f75c7a36640 | 0 | 0 | 0 | 12076326169060611 | 12076326169230428 | 12076326169404027 | 12076326169407496 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 174 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 116288 | 0x7f76f7c91400 | 0x7f75c7a36680 | 0 | 0 | 0 | 12076326169468760 | 12076326169626426 | 12076326169767545 | 12076326169770981 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 176 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 119040 | 0x7f76f7c91300 | 0x7f75c7a366c0 | 0 | 0 | 0 | 12076326169819501 | 12076326169979225 | 12076326170240824 | 12076326170268686 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 178 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 120768 | 0x7f76f7c91a00 | 0x7f75c7a36700 | 0 | 0 | 0 | 12076326170308741 | 12076326170469943 | 12076326170723862 | 12076326170746825 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 180 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 122496 | 0x7f76f7c91900 | 0x7f75c7a36740 | 0 | 0 | 0 | 12076326170790476 | 12076326170946741 | 12076326171088340 | 12076326171092046 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 182 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 124736 | 0x7f76f7c91800 | 0x7f75c7a36780 | 0 | 0 | 0 | 12076326171140416 | 12076326171308499 | 12076326171491858 | 12076326171495336 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 184 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 126464 | 0x7f76f7c91700 | 0x7f75c7a367c0 | 0 | 0 | 0 | 12076326171554185 | 12076326171713458 | 12076326171854417 | 12076326171857940 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 186 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 127936 | 0x7f76f7c91600 | 0x7f75c7a36800 | 0 | 0 | 0 | 12076326171907041 | 12076326172073136 | 12076326172340175 | 12076326172364611 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 188 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 129664 | 0x7f76f7c91500 | 0x7f75c7a36840 | 0 | 0 | 0 | 12076326172409815 | 12076326172574734 | 12076326172834093 | 12076326172857427 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 190 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 131392 | 0x7f76f7c91400 | 0x7f75c7a36880 | 0 | 0 | 0 | 12076326172903733 | 12076326173060652 | 12076326173195532 | 12076326173199172 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 192 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 133632 | 0x7f76f7c91300 | 0x7f75c7a368c0 | 0 | 0 | 0 | 12076326173248955 | 12076326173412011 | 12076326173603690 | 12076326173626787 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 194 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 135360 | 0x7f76f7c91a00 | 0x7f75c7a36900 | 0 | 0 | 0 | 12076326173682180 | 12076326173843209 | 12076326173983848 | 12076326173987668 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 196 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 136832 | 0x7f76f7c91900 | 0x7f75c7a36940 | 0 | 0 | 0 | 12076326174035607 | 12076326174208007 | 12076326174491686 | 12076326174517883 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 198 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 138560 | 0x7f76f7c91800 | 0x7f75c7a36980 | 0 | 0 | 0 | 12076326174558418 | 12076326174713605 | 12076326174974084 | 12076326174996793 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 200 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 140288 | 0x7f76f7c91700 | 0x7f75c7a369c0 | 0 | 0 | 0 | 12076326175045013 | 12076326175202563 | 12076326175338083 | 12076326175341734 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 202 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 142784 | 0x7f76f7c91600 | 0x7f75c7a36a00 | 0 | 0 | 0 | 12076326175388361 | 12076326175553762 | 12076326175764641 | 12076326175784307 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 204 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 144768 | 0x7f76f7c91500 | 0x7f75c7a36a40 | 0 | 0 | 0 | 12076326175842906 | 12076326176006080 | 12076326176145120 | 12076326176149035 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 206 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 145728 | 0x7f76f7c91400 | 0x7f75c7a36a80 | 0 | 0 | 0 | 12076326176195491 | 12076326176371999 | 12076326176681437 | 12076326176704617 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 208 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 147712 | 0x7f76f7c91300 | 0x7f75c7a36ac0 | 0 | 0 | 0 | 12076326176749440 | 12076326176909437 | 12076326177175355 | 12076326177204276 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 210 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 149696 | 0x7f76f7c91a00 | 0x7f75c7a36b00 | 0 | 0 | 0 | 12076326177245282 | 12076326177402875 | 12076326177544954 | 12076326177548235 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 212 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 152192 | 0x7f76f7c91900 | 0x7f75c7a36b40 | 0 | 0 | 0 | 12076326177599340 | 12076326177756473 | 12076326177984952 | 12076326178013359 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 214 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 154176 | 0x7f76f7c91800 | 0x7f75c7a36b80 | 0 | 0 | 0 | 12076326178071167 | 12076326178232471 | 12076326178372951 | 12076326178376434 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 216 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 155648 | 0x7f76f7c91700 | 0x7f75c7a36bc0 | 0 | 0 | 0 | 12076326178424433 | 12076326178591350 | 12076326178920948 | 12076326178943718 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 218 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 157632 | 0x7f76f7c91600 | 0x7f75c7a36c00 | 0 | 0 | 0 | 12076326178986157 | 12076326179151028 | 12076326179416466 | 12076326179443577 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 220 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 159616 | 0x7f76f7c91500 | 0x7f75c7a36c40 | 0 | 0 | 0 | 12076326179482800 | 12076326179642546 | 12076326179779665 | 12076326179783329 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 222 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 162368 | 0x7f76f7c91400 | 0x7f75c7a36c80 | 0 | 0 | 0 | 12076326179831198 | 12076326179990704 | 12076326180235983 | 12076326180259293 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 224 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 164608 | 0x7f76f7c91300 | 0x7f75c7a36cc0 | 0 | 0 | 0 | 12076326180316890 | 12076326180482029 | 12076326180626509 | 12076326180633849 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 226 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 166336 | 0x7f76f7c91a00 | 0x7f75c7a36d00 | 0 | 0 | 0 | 12076326180677030 | 12076326180855947 | 12076326181257385 | 12076326181285881 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 228 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 168576 | 0x7f76f7c91900 | 0x7f75c7a36d40 | 0 | 0 | 0 | 12076326181326958 | 12076326181485545 | 12076326181750664 | 12076326181772816 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 230 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 170816 | 0x7f76f7c91800 | 0x7f75c7a36d80 | 0 | 0 | 0 | 12076326181815896 | 12076326181970983 | 12076326182110342 | 12076326182113700 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 232 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 174080 | 0x7f76f7c91700 | 0x7f75c7a36dc0 | 0 | 0 | 0 | 12076326182165897 | 12076326182331942 | 12076326182611461 | 12076326182634878 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 234 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 176576 | 0x7f76f7c91600 | 0x7f75c7a36e00 | 0 | 0 | 0 | 12076326182696092 | 12076326182857860 | 12076326182996259 | 12076326182999616 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 236 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 177792 | 0x7f76f7c91500 | 0x7f75c7a36e40 | 0 | 0 | 0 | 12076326183048026 | 12076326183220738 | 12076326183646337 | 12076326183672036 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 238 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 180288 | 0x7f76f7c91400 | 0x7f75c7a36e80 | 0 | 0 | 0 | 12076326183709986 | 12076326183869056 | 12076326184133855 | 12076326184157207 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 240 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 182784 | 0x7f76f7c91300 | 0x7f75c7a36ec0 | 0 | 0 | 0 | 12076326184200518 | 12076326184359135 | 12076326184498174 | 12076326184501497 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 242 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 186304 | 0x7f76f7c91a00 | 0x7f75c7a36f00 | 0 | 0 | 0 | 12076326184551580 | 12076326184711293 | 12076326185026652 | 12076326185051069 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 244 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 189312 | 0x7f76f7c91900 | 0x7f75c7a36f40 | 0 | 0 | 0 | 12076326185111311 | 12076326185274811 | 12076326185426491 | 12076326185429542 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 246 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 190784 | 0x7f76f7c91800 | 0x7f75c7a36f80 | 0 | 0 | 0 | 12076326185478333 | 12076326185639770 | 12076326186157208 | 12076326186181670 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 248 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 193792 | 0x7f76f7c91700 | 0x7f75c7a36fc0 | 0 | 0 | 0 | 12076326186223688 | 12076326186384727 | 12076326186684886 | 12076326186707146 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 250 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 196800 | 0x7f76f7c91600 | 0x7f75c7a37000 | 0 | 0 | 0 | 12076326186752681 | 12076326186915286 | 12076326187070645 | 12076326187074319 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 252 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 201088 | 0x7f76f7c91500 | 0x7f75c7a37040 | 0 | 0 | 0 | 12076326187124181 | 12076326187292884 | 12076326187704083 | 12076326187729196 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 254 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 204608 | 0x7f76f7c91400 | 0x7f75c7a37080 | 0 | 0 | 0 | 12076326187790570 | 12076326187952562 | 12076326188129841 | 12076326188133036 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 256 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 206080 | 0x7f76f7c91300 | 0x7f75c7a370c0 | 0 | 0 | 0 | 12076326188181166 | 12076326188350001 | 12076326188971758 | 12076326188995299 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 258 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 209600 | 0x7f76f7c91a00 | 0x7f75c7a37100 | 0 | 0 | 0 | 12076326189044100 | 12076326189201838 | 12076326189556876 | 12076326189580106 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 260 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 213120 | 0x7f76f7c91900 | 0x7f75c7a37140 | 0 | 0 | 0 | 12076326189627694 | 12076326189788556 | 12076326189967275 | 12076326189970311 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 262 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 218176 | 0x7f76f7c91800 | 0x7f75c7a37180 | 0 | 0 | 0 | 12076326190015445 | 12076326190203594 | 12076326190660713 | 12076326190686291 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 264 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 222208 | 0x7f76f7c91700 | 0x7f75c7a371c0 | 0 | 0 | 0 | 12076326190745031 | 12076326190905992 | 12076326191105991 | 12076326191133202 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 266 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 223936 | 0x7f76f7c91600 | 0x7f75c7a37200 | 0 | 0 | 0 | 12076326191175360 | 12076326191334950 | 12076326192037988 | 12076326192064543 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 268 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 227968 | 0x7f76f7c91500 | 0x7f75c7a37240 | 0 | 0 | 0 | 12076326192105990 | 12076326192265987 | 12076326192640066 | 12076326192664358 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 270 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 232000 | 0x7f76f7c91400 | 0x7f75c7a37280 | 0 | 0 | 0 | 12076326192713248 | 12076326192874305 | 12076326193077824 | 12076326193101670 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 272 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 237824 | 0x7f76f7c91300 | 0x7f75c7a372c0 | 0 | 0 | 0 | 12076326193152946 | 12076326193314463 | 12076326193857501 | 12076326193880999 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 274 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 242368 | 0x7f76f7c91a00 | 0x7f75c7a37300 | 0 | 0 | 0 | 12076326193942072 | 12076326194113021 | 12076326194370780 | 12076326194398350 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 276 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 243584 | 0x7f76f7c91900 | 0x7f75c7a37340 | 0 | 0 | 0 | 12076326194438775 | 12076326194600539 | 12076326195398936 | 12076326195446718 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 278 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 248128 | 0x7f76f7c91800 | 0x7f75c7a37380 | 0 | 0 | 0 | 12076326195476865 | 12076326195677015 | 12076326196096054 | 12076326196145738 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 280 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 252672 | 0x7f76f7c91700 | 0x7f75c7a373c0 | 0 | 0 | 0 | 12076326196178018 | 12076326196359893 | 12076326196586452 | 12076326196634085 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 282 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 259264 | 0x7f76f7c91600 | 0x7f75c7a37400 | 0 | 0 | 0 | 12076326196660624 | 12076326196833171 | 12076326197443569 | 12076326197495416 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 284 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 264832 | 0x7f76f7c91500 | 0x7f75c7a37440 | 0 | 0 | 0 | 12076326197534979 | 12076326197697808 | 12076326197967087 | 12076326198017276 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 286 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 266304 | 0x7f76f7c91400 | 0x7f75c7a37480 | 0 | 0 | 0 | 12076326198043214 | 12076326198220206 | 12076326199205803 | 12076326199272308 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 288 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 28 | 24 | 271872 | 0x7f76f7c91300 | 0x7f75c7a374c0 | 0 | 0 | 0 | 12076326199299058 | 12076326199479402 | 12076326200013480 | 12076326200080911 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 290 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 277440 | 0x7f76f7c91a00 | 0x7f75c7a37500 | 0 | 0 | 0 | 12076326200110796 | 12076326200290759 | 12076326200562598 | 12076326200628659 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 292 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 12 | 24 | 279936 | 0x7f76f7c91900 | 0x7f75c7a37540 | 0 | 0 | 0 | 12076326200654737 | 12076326200825477 | 12076326201564035 | 12076326201633917 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 294 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 286528 | 0x7f76f7c91800 | 0x7f75c7a37580 | 0 | 0 | 0 | 12076326201674473 | 12076326201836194 | 12076326202152673 | 12076326202220447 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 296 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 288000 | 0x7f76f7c91700 | 0x7f75c7a375c0 | 0 | 0 | 0 | 12076326202247007 | 12076326202420512 | 12076326203590908 | 12076326203659041 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 298 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 32 | 24 | 294592 | 0x7f76f7c91600 | 0x7f75c7a37600 | 0 | 0 | 0 | 12076326203688676 | 12076326203872027 | 12076326204480344 | 12076326204548744 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 300 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 301184 | 0x7f76f7c91500 | 0x7f75c7a37640 | 0 | 0 | 0 | 12076326204571687 | 12076326204756184 | 12076326205075862 | 12076326205142087 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 302 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 12 | 24 | 304960 | 0x7f76f7c91400 | 0x7f75c7a37680 | 0 | 0 | 0 | 12076326205169147 | 12076326205350901 | 12076326206228818 | 12076326206298105 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 304 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 24 | 24 | 313600 | 0x7f76f7c91300 | 0x7f75c7a376c0 | 0 | 0 | 0 | 12076326206340604 | 12076326206504657 | 12076326206915536 | 12076326206982287 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 306 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 314816 | 0x7f76f7c91a00 | 0x7f75c7a37700 | 0 | 0 | 0 | 12076326207017212 | 12076326207200495 | 12076326208746730 | 12076326208815464 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 308 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 317568 | 0x7f76f7c91900 | 0x7f75c7a37740 | 0 | 0 | 0 | 12076326208851220 | 12076326209013449 | 12076326209806726 | 12076326209875283 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 310 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 12 | 24 | 320320 | 0x7f76f7c91800 | 0x7f75c7a37780 | 0 | 0 | 0 | 12076326209911841 | 12076326210080965 | 12076326210495044 | 12076326210563202 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 312 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 12 | 24 | 324096 | 0x7f76f7c91700 | 0x7f75c7a377c0 | 0 | 0 | 0 | 12076326210593328 | 12076326210769603 | 12076326211929279 | 12076326211996726 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 314 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 12 | 24 | 328896 | 0x7f76f7c91600 | 0x7f75c7a37800 | 0 | 0 | 0 | 12076326212044795 | 12076326212212318 | 12076326212998075 | 12076326213066314 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 316 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 330112 | 0x7f76f7c91500 | 0x7f75c7a37840 | 0 | 0 | 0 | 12076326213095939 | 12076326213270074 | 12076326216318223 | 12076326216385793 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 318 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 332864 | 0x7f76f7c91400 | 0x7f75c7a37880 | 0 | 0 | 0 | 12076326216410419 | 12076326216603662 | 12076326218143177 | 12076326218211175 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 320 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 12 | 24 | 335616 | 0x7f76f7c91300 | 0x7f75c7a378c0 | 0 | 0 | 0 | 12076326218242043 | 12076326218420456 | 12076326219210053 | 12076326219276565 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 322 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 12 | 24 | 339392 | 0x7f76f7c91a00 | 0x7f75c7a37900 | 0 | 0 | 0 | 12076326219303325 | 12076326219484292 | 12076326221766204 | 12076326221833106 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 324 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 12 | 24 | 344192 | 0x7f76f7c91900 | 0x7f75c7a37940 | 0 | 0 | 0 | 12076326221877900 | 12076326222045243 | 12076326223580118 | 12076326223649212 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 326 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 345408 | 0x7f76f7c91800 | 0x7f75c7a37980 | 0 | 0 | 0 | 12076326223679478 | 12076326223858517 | 12076326229912096 | 12076326229982462 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 328 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 20 | 24 | 348160 | 0x7f76f7c91700 | 0x7f75c7a379c0 | 0 | 0 | 0 | 12076326230016785 | 12076326230196575 | 12076326233237044 | 12076326233306359 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 330 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 12 | 24 | 350912 | 0x7f76f7c91600 | 0x7f75c7a37a00 | 0 | 0 | 0 | 12076326233336234 | 12076326233514803 | 12076326235053998 | 12076326235121813 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 332 | 921341 | 921346 | 4194304 | 256 | 0 | 0 | 12 | 24 | 0 | 0x7f76f7c91500 | 0x7f75c7a37a40 | 0 | 0 | 0 | 12076326235150446 | 12076326235329197 | 12076326239856221 | 12076326239924749 |