39 KiB
39 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBuffer.kd | 0 | 0 | 0 | 926570 | 926576 | 33554432 | 256 | 0 | 0 | 8 | 32 | 6464 | 0x0 | 0x7f5a66404180 | 12076423131080852 | 12076423131128016 | 12076423131454413 | 12076423131561175 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 926570 | 926576 | 32768 | 256 | 0 | 0 | 24 | 24 | 12480 | 0x0 | 0x7f5a66435100 | 12076423146177755 | 12076423146279107 | 12076423146286147 | 12076423146291897 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 4 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 12928 | 0x7f5b720e9900 | 0x7f5a66435140 | 12076423146330890 | 12076423146343746 | 12076423146476545 | 12076423146480187 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 6 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 36 | 24 | 13632 | 0x7f5b720e9800 | 0x7f5a66435180 | 12076423146523117 | 12076423146536224 | 12076423146779262 | 12076423146875672 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 8 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 14080 | 0x7f5b720e9700 | 0x7f5a664351c0 | 12076423146902592 | 12076423146914461 | 12076423147158618 | 12076423147259345 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 10 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14528 | 0x7f5b720e9600 | 0x7f5a66435200 | 12076423147286606 | 12076423147298297 | 12076423147423416 | 12076423147427027 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 12 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14976 | 0x7f5b720e9500 | 0x7f5a66435240 | 12076423147454918 | 12076423147466295 | 12076423147592374 | 12076423147595810 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 14 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 15424 | 0x7f5b720e9400 | 0x7f5a66435280 | 12076423147647526 | 12076423147660053 | 12076423147784212 | 12076423147787446 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 16 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16128 | 0x7f5b720e9300 | 0x7f5a664352c0 | 12076423147814837 | 12076423147826132 | 12076423148076369 | 12076423148175988 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 18 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16832 | 0x7f5b720e9a00 | 0x7f5a66435300 | 12076423148197679 | 12076423148209168 | 12076423148452846 | 12076423148550915 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 20 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 17536 | 0x7f5b720e9900 | 0x7f5a66435340 | 12076423148573317 | 12076423148584844 | 12076423148709483 | 12076423148712956 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 22 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18240 | 0x7f5b720e9800 | 0x7f5a66435380 | 12076423148738554 | 12076423148750603 | 12076423148875561 | 12076423148878885 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 24 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18944 | 0x7f5b720e9700 | 0x7f5a664353c0 | 12076423148916204 | 12076423148927721 | 12076423149052680 | 12076423149055924 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 26 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 19904 | 0x7f5b720e9600 | 0x7f5a66435400 | 12076423149083174 | 12076423149094279 | 12076423149341157 | 12076423149413338 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 28 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 20608 | 0x7f5b720e9500 | 0x7f5a66435440 | 12076423149434617 | 12076423149446436 | 12076423149690113 | 12076423149757668 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 30 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 21312 | 0x7f5b720e9400 | 0x7f5a66435480 | 12076423149779508 | 12076423149790752 | 12076423149916031 | 12076423149919308 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 32 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22016 | 0x7f5b720e9300 | 0x7f5a664354c0 | 12076423149944865 | 12076423149956671 | 12076423150082590 | 12076423150086148 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 34 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22720 | 0x7f5b720e9a00 | 0x7f5a66435500 | 12076423150124629 | 12076423150135709 | 12076423150260348 | 12076423150263648 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 36 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 23680 | 0x7f5b720e9900 | 0x7f5a66435540 | 12076423150289766 | 12076423150301307 | 12076423150548185 | 12076423150590766 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 38 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 24384 | 0x7f5b720e9800 | 0x7f5a66435580 | 12076423150612256 | 12076423150624344 | 12076423150868022 | 12076423150933543 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 40 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25088 | 0x7f5b720e9700 | 0x7f5a664355c0 | 12076423150953750 | 12076423150965781 | 12076423151090100 | 12076423151093440 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 42 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25792 | 0x7f5b720e9600 | 0x7f5a66435600 | 12076423151120941 | 12076423151132659 | 12076423151257618 | 12076423151260841 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 44 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 26496 | 0x7f5b720e9500 | 0x7f5a66435640 | 12076423151296968 | 12076423151309618 | 12076423151433456 | 12076423151436788 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 46 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 27712 | 0x7f5b720e9400 | 0x7f5a66435680 | 12076423151462305 | 12076423151473936 | 12076423151721454 | 12076423151762854 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 48 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 28416 | 0x7f5b720e9300 | 0x7f5a664356c0 | 12076423151784203 | 12076423151796013 | 12076423152039691 | 12076423152106121 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 50 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 29120 | 0x7f5b720e9a00 | 0x7f5a66435700 | 12076423152126970 | 12076423152139370 | 12076423152263848 | 12076423152266940 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 52 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30080 | 0x7f5b720e9900 | 0x7f5a66435740 | 12076423152292227 | 12076423152303848 | 12076423152428807 | 12076423152432257 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 54 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30784 | 0x7f5b720e9800 | 0x7f5a66435780 | 12076423152467102 | 12076423152482086 | 12076423152606245 | 12076423152609417 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 56 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32000 | 0x7f5b720e9700 | 0x7f5a664357c0 | 12076423152635235 | 12076423152647845 | 12076423152897122 | 12076423152974335 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 58 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32960 | 0x7f5b720e9600 | 0x7f5a66435800 | 12076423152995274 | 12076423153014241 | 12076423153259679 | 12076423153339694 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 60 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 33920 | 0x7f5b720e9500 | 0x7f5a66435840 | 12076423153360843 | 12076423153372157 | 12076423153496956 | 12076423153500222 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 62 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 34880 | 0x7f5b720e9400 | 0x7f5a66435880 | 12076423153525950 | 12076423153538076 | 12076423153663995 | 12076423153667543 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 64 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 35840 | 0x7f5b720e9300 | 0x7f5a664358c0 | 12076423153703440 | 12076423153716314 | 12076423153841913 | 12076423153845183 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 66 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 37312 | 0x7f5b720e9a00 | 0x7f5a66435900 | 12076423153870420 | 12076423153882233 | 12076423154131510 | 12076423154209840 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 68 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 38272 | 0x7f5b720e9900 | 0x7f5a66435940 | 12076423154231350 | 12076423154249589 | 12076423154493427 | 12076423154571042 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 70 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 39232 | 0x7f5b720e9800 | 0x7f5a66435980 | 12076423154590488 | 12076423154602705 | 12076423154727664 | 12076423154731129 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 72 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 40192 | 0x7f5b720e9700 | 0x7f5a664359c0 | 12076423154758119 | 12076423154769584 | 12076423154895343 | 12076423154898991 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 74 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 41152 | 0x7f5b720e9600 | 0x7f5a66435a00 | 12076423154933876 | 12076423154948462 | 12076423155071981 | 12076423155075569 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 76 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 42624 | 0x7f5b720e9500 | 0x7f5a66435a40 | 12076423155102720 | 12076423155115340 | 12076423155363018 | 12076423155442100 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 78 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 43584 | 0x7f5b720e9400 | 0x7f5a66435a80 | 12076423155462959 | 12076423155473897 | 12076423155720135 | 12076423155773576 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 80 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 44544 | 0x7f5b720e9300 | 0x7f5a66435ac0 | 12076423155796719 | 12076423155809254 | 12076423155934052 | 12076423155937421 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 82 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 45760 | 0x7f5b720e9a00 | 0x7f5a66435b00 | 12076423155963900 | 12076423155975172 | 12076423156101411 | 12076423156104902 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 84 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 46720 | 0x7f5b720e9900 | 0x7f5a66435b40 | 12076423156141730 | 12076423156152930 | 12076423156277889 | 12076423156281039 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 86 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 48448 | 0x7f5b720e9800 | 0x7f5a66435b80 | 12076423156306797 | 12076423156318849 | 12076423156578846 | 12076423156603939 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 88 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 49408 | 0x7f5b720e9700 | 0x7f5a66435bc0 | 12076423156627082 | 12076423156638526 | 12076423156887323 | 12076423156911390 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 90 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 50368 | 0x7f5b720e9600 | 0x7f5a66435c00 | 12076423156930857 | 12076423156942523 | 12076423157066841 | 12076423157070236 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 92 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 51584 | 0x7f5b720e9500 | 0x7f5a66435c40 | 12076423157097586 | 12076423157108921 | 12076423157235640 | 12076423157238839 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 94 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 52544 | 0x7f5b720e9400 | 0x7f5a66435c80 | 12076423157275537 | 12076423157286519 | 12076423157411958 | 12076423157415127 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 96 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 54272 | 0x7f5b720e9300 | 0x7f5a66435cc0 | 12076423157441776 | 12076423157453718 | 12076423157703475 | 12076423157725483 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 98 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 55488 | 0x7f5b720e9a00 | 0x7f5a66435d00 | 12076423157745921 | 12076423157758675 | 12076423158003792 | 12076423158029027 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 100 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 56704 | 0x7f5b720e9900 | 0x7f5a66435d40 | 12076423158050768 | 12076423158064752 | 12076423158189390 | 12076423158192631 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 102 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 58176 | 0x7f5b720e9800 | 0x7f5a66435d80 | 12076423158221264 | 12076423158232750 | 12076423158361229 | 12076423158364350 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 104 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 59392 | 0x7f5b720e9700 | 0x7f5a66435dc0 | 12076423158401349 | 12076423158412268 | 12076423158536747 | 12076423158539887 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 106 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 61376 | 0x7f5b720e9600 | 0x7f5a66435e00 | 12076423158566416 | 12076423158577707 | 12076423158837064 | 12076423158862636 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 108 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 62592 | 0x7f5b720e9500 | 0x7f5a66435e40 | 12076423158884427 | 12076423158895464 | 12076423159180741 | 12076423159214941 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 110 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 63808 | 0x7f5b720e9400 | 0x7f5a66435e80 | 12076423159236331 | 12076423159247940 | 12076423159373859 | 12076423159377413 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 112 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 65280 | 0x7f5b720e9300 | 0x7f5a66435ec0 | 12076423159404864 | 12076423159416738 | 12076423159545857 | 12076423159549112 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 114 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 66496 | 0x7f5b720e9a00 | 0x7f5a66435f00 | 12076423159585700 | 12076423159598497 | 12076423159723135 | 12076423159726341 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 116 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 68480 | 0x7f5b720e9900 | 0x7f5a66435f40 | 12076423159753742 | 12076423159764895 | 12076423160028572 | 12076423160056925 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 118 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 69696 | 0x7f5b720e9800 | 0x7f5a66435f80 | 12076423160081511 | 12076423160093052 | 12076423160337049 | 12076423160360540 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 120 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 70912 | 0x7f5b720e9700 | 0x7f5a66435fc0 | 12076423160382380 | 12076423160394169 | 12076423160519128 | 12076423160522360 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 122 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 72384 | 0x7f5b720e9600 | 0x7f5a66436000 | 12076423160547918 | 12076423160560727 | 12076423160696566 | 12076423160699710 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 124 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 73600 | 0x7f5b720e9500 | 0x7f5a66436040 | 12076423160736138 | 12076423160746965 | 12076423160871764 | 12076423160874966 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 126 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 75840 | 0x7f5b720e9400 | 0x7f5a66436080 | 12076423160900373 | 12076423160912244 | 12076423161168881 | 12076423161197305 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 128 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 77056 | 0x7f5b720e9300 | 0x7f5a664360c0 | 12076423161218915 | 12076423161230641 | 12076423161475118 | 12076423161498404 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 130 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 78272 | 0x7f5b720e9a00 | 0x7f5a66436100 | 12076423161519373 | 12076423161530318 | 12076423161655597 | 12076423161658822 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 132 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 80000 | 0x7f5b720e9900 | 0x7f5a66436140 | 12076423161687145 | 12076423161698636 | 12076423161840235 | 12076423161843425 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 134 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 81216 | 0x7f5b720e9800 | 0x7f5a66436180 | 12076423161879662 | 12076423161890634 | 12076423162016393 | 12076423162019973 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 136 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 83456 | 0x7f5b720e9700 | 0x7f5a664361c0 | 12076423162047204 | 12076423162059273 | 12076423162315590 | 12076423162339347 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 138 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 84928 | 0x7f5b720e9600 | 0x7f5a66436200 | 12076423162359845 | 12076423162371110 | 12076423162616867 | 12076423162639995 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 140 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 86400 | 0x7f5b720e9500 | 0x7f5a66436240 | 12076423162660584 | 12076423162672867 | 12076423162798305 | 12076423162801525 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 142 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 88128 | 0x7f5b720e9400 | 0x7f5a66436280 | 12076423162827063 | 12076423162838785 | 12076423162987744 | 12076423162990968 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 144 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 89600 | 0x7f5b720e9300 | 0x7f5a664362c0 | 12076423163044297 | 12076423163055103 | 12076423163180222 | 12076423163183736 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 146 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 92096 | 0x7f5b720e9a00 | 0x7f5a66436300 | 12076423163211157 | 12076423163222621 | 12076423163474939 | 12076423163498240 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 148 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 93568 | 0x7f5b720e9900 | 0x7f5a66436340 | 12076423163521674 | 12076423163533818 | 12076423163778296 | 12076423163801323 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 150 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 95040 | 0x7f5b720e9800 | 0x7f5a66436380 | 12076423163821641 | 12076423163833175 | 12076423163959414 | 12076423163962763 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 152 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 96768 | 0x7f5b720e9700 | 0x7f5a664363c0 | 12076423163988531 | 12076423163999734 | 12076423164157012 | 12076423164160481 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 154 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 98240 | 0x7f5b720e9600 | 0x7f5a66436400 | 12076423164198992 | 12076423164210292 | 12076423164335250 | 12076423164338902 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 156 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 100736 | 0x7f5b720e9500 | 0x7f5a66436440 | 12076423164364850 | 12076423164375890 | 12076423164630608 | 12076423164651974 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 158 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 102208 | 0x7f5b720e9400 | 0x7f5a66436480 | 12076423164672131 | 12076423164683727 | 12076423164965484 | 12076423164987177 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 160 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 103680 | 0x7f5b720e9300 | 0x7f5a664364c0 | 12076423165013636 | 12076423165024844 | 12076423165150762 | 12076423165154478 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 162 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 105664 | 0x7f5b720e9a00 | 0x7f5a66436500 | 12076423165182580 | 12076423165194602 | 12076423165359240 | 12076423165362414 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 164 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 107136 | 0x7f5b720e9900 | 0x7f5a66436540 | 12076423165398201 | 12076423165409960 | 12076423165536039 | 12076423165539183 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 166 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 109888 | 0x7f5b720e9800 | 0x7f5a66436580 | 12076423165564349 | 12076423165575398 | 12076423165830116 | 12076423165850581 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 168 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 111360 | 0x7f5b720e9700 | 0x7f5a664365c0 | 12076423165870729 | 12076423165883395 | 12076423166128353 | 12076423166152693 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 170 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 112832 | 0x7f5b720e9600 | 0x7f5a66436600 | 12076423166172479 | 12076423166184672 | 12076423166309791 | 12076423166313221 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 172 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 114816 | 0x7f5b720e9500 | 0x7f5a66436640 | 12076423166337817 | 12076423166350751 | 12076423166523549 | 12076423166526848 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 174 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 116288 | 0x7f5b720e9400 | 0x7f5a66436680 | 12076423166562885 | 12076423166574109 | 12076423166699547 | 12076423166702975 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 176 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 119040 | 0x7f5b720e9300 | 0x7f5a664366c0 | 12076423166728342 | 12076423166739867 | 12076423166998744 | 12076423167026937 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 178 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 120768 | 0x7f5b720e9a00 | 0x7f5a66436700 | 12076423167048878 | 12076423167060344 | 12076423167342261 | 12076423167369634 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 180 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 122496 | 0x7f5b720e9900 | 0x7f5a66436740 | 12076423167390342 | 12076423167401460 | 12076423167527539 | 12076423167531044 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 182 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 124736 | 0x7f5b720e9800 | 0x7f5a66436780 | 12076423167556942 | 12076423167568659 | 12076423167751057 | 12076423167754249 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 184 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 126464 | 0x7f5b720e9700 | 0x7f5a664367c0 | 12076423167790827 | 12076423167802577 | 12076423167928815 | 12076423167932139 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 186 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 127936 | 0x7f5b720e9600 | 0x7f5a66436800 | 12076423167957997 | 12076423167968975 | 12076423168231052 | 12076423168263184 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 188 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 129664 | 0x7f5b720e9500 | 0x7f5a66436840 | 12076423168284614 | 12076423168295852 | 12076423168543689 | 12076423168571086 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 190 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 131392 | 0x7f5b720e9400 | 0x7f5a66436880 | 12076423168592626 | 12076423168603529 | 12076423168729928 | 12076423168733148 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 192 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 133632 | 0x7f5b720e9300 | 0x7f5a664368c0 | 12076423168760388 | 12076423168771687 | 12076423168962885 | 12076423168966060 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 194 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 135360 | 0x7f5b720e9a00 | 0x7f5a66436900 | 12076423169005944 | 12076423169017125 | 12076423169142723 | 12076423169146385 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 196 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 136832 | 0x7f5b720e9900 | 0x7f5a66436940 | 12076423169172825 | 12076423169184163 | 12076423169466080 | 12076423169489784 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 198 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 138560 | 0x7f5b720e9800 | 0x7f5a66436980 | 12076423169510783 | 12076423169521920 | 12076423169767997 | 12076423169787747 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 200 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 140288 | 0x7f5b720e9700 | 0x7f5a664369c0 | 12076423169807003 | 12076423169818397 | 12076423169943836 | 12076423169947434 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 202 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 142784 | 0x7f5b720e9600 | 0x7f5a66436a00 | 12076423169973883 | 12076423169984955 | 12076423170192793 | 12076423170216324 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 204 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 144768 | 0x7f5b720e9500 | 0x7f5a66436a40 | 12076423170248443 | 12076423170259673 | 12076423170387671 | 12076423170391018 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 206 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 145728 | 0x7f5b720e9400 | 0x7f5a66436a80 | 12076423170416686 | 12076423170428151 | 12076423170734388 | 12076423170757800 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 208 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 147712 | 0x7f5b720e9300 | 0x7f5a66436ac0 | 12076423170781264 | 12076423170792787 | 12076423171042865 | 12076423171071012 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 210 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 149696 | 0x7f5b720e9a00 | 0x7f5a66436b00 | 12076423171091991 | 12076423171103024 | 12076423171230863 | 12076423171234125 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 212 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 152192 | 0x7f5b720e9900 | 0x7f5a66436b40 | 12076423171260224 | 12076423171271663 | 12076423171498860 | 12076423171524314 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 214 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 154176 | 0x7f5b720e9800 | 0x7f5a66436b80 | 12076423171555622 | 12076423171566860 | 12076423171693419 | 12076423171696745 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 216 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 155648 | 0x7f5b720e9700 | 0x7f5a66436bc0 | 12076423171722993 | 12076423171734218 | 12076423172062055 | 12076423172090897 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 218 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 157632 | 0x7f5b720e9600 | 0x7f5a66436c00 | 12076423172112457 | 12076423172123494 | 12076423172373572 | 12076423172401083 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 220 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 159616 | 0x7f5b720e9500 | 0x7f5a66436c40 | 12076423172422674 | 12076423172434211 | 12076423172562690 | 12076423172565980 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 222 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 162368 | 0x7f5b720e9400 | 0x7f5a66436c80 | 12076423172593882 | 12076423172605090 | 12076423172849087 | 12076423172872800 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 224 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 164608 | 0x7f5b720e9300 | 0x7f5a66436cc0 | 12076423172903828 | 12076423172915647 | 12076423173043645 | 12076423173047334 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 226 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 166336 | 0x7f5b720e9a00 | 0x7f5a66436d00 | 12076423173074505 | 12076423173085245 | 12076423173459321 | 12076423173486510 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 228 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 168576 | 0x7f5b720e9900 | 0x7f5a66436d40 | 12076423173507269 | 12076423173518201 | 12076423173771158 | 12076423173798670 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 230 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 170816 | 0x7f5b720e9800 | 0x7f5a66436d80 | 12076423173819169 | 12076423173830358 | 12076423173959636 | 12076423173963066 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 232 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 174080 | 0x7f5b720e9700 | 0x7f5a66436dc0 | 12076423173988734 | 12076423173999636 | 12076423174276913 | 12076423174301094 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 234 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 176576 | 0x7f5b720e9600 | 0x7f5a66436e00 | 12076423174332162 | 12076423174343473 | 12076423174478191 | 12076423174481599 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 236 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 177792 | 0x7f5b720e9500 | 0x7f5a66436e40 | 12076423174507377 | 12076423174519151 | 12076423174941227 | 12076423174964948 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 238 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 180288 | 0x7f5b720e9400 | 0x7f5a66436e80 | 12076423174988672 | 12076423174999786 | 12076423175266664 | 12076423175294490 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 240 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 182784 | 0x7f5b720e9300 | 0x7f5a66436ec0 | 12076423175315369 | 12076423175327943 | 12076423175462822 | 12076423175466169 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 242 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 186304 | 0x7f5b720e9a00 | 0x7f5a66436f00 | 12076423175492107 | 12076423175504741 | 12076423175818978 | 12076423175845925 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 244 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 189312 | 0x7f5b720e9900 | 0x7f5a66436f40 | 12076423175877423 | 12076423175888578 | 12076423176039296 | 12076423176042810 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 246 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 190784 | 0x7f5b720e9800 | 0x7f5a66436f80 | 12076423176070001 | 12076423176081536 | 12076423176597051 | 12076423176624872 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 248 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 193792 | 0x7f5b720e9700 | 0x7f5a66436fc0 | 12076423176645961 | 12076423176656890 | 12076423176957367 | 12076423176984350 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 250 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 196800 | 0x7f5b720e9600 | 0x7f5a66437000 | 12076423177010268 | 12076423177022007 | 12076423177175925 | 12076423177179302 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 252 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 201088 | 0x7f5b720e9500 | 0x7f5a66437040 | 12076423177207334 | 12076423177220085 | 12076423177604721 | 12076423177631983 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 254 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 204608 | 0x7f5b720e9400 | 0x7f5a66437080 | 12076423177663051 | 12076423177674000 | 12076423177848718 | 12076423177852153 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 256 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 206080 | 0x7f5b720e9300 | 0x7f5a664370c0 | 12076423177878371 | 12076423177889838 | 12076423178497672 | 12076423178525253 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 258 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 209600 | 0x7f5b720e9a00 | 0x7f5a66437100 | 12076423178548296 | 12076423178559592 | 12076423178886628 | 12076423178909768 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 260 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 213120 | 0x7f5b720e9900 | 0x7f5a66437140 | 12076423178933071 | 12076423178944068 | 12076423179122626 | 12076423179126330 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 262 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 218176 | 0x7f5b720e9800 | 0x7f5a66437180 | 12076423179152819 | 12076423179163586 | 12076423179617661 | 12076423179640676 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 264 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 222208 | 0x7f5b720e9700 | 0x7f5a664371c0 | 12076423179674970 | 12076423179685821 | 12076423179884699 | 12076423179904025 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 266 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 223936 | 0x7f5b720e9600 | 0x7f5a66437200 | 12076423179923532 | 12076423179934778 | 12076423180636051 | 12076423180663947 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 268 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 227968 | 0x7f5b720e9500 | 0x7f5a66437240 | 12076423180689134 | 12076423180700531 | 12076423181072047 | 12076423181101300 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 270 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 232000 | 0x7f5b720e9400 | 0x7f5a66437280 | 12076423181122610 | 12076423181134126 | 12076423181335884 | 12076423181362866 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 272 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 237824 | 0x7f5b720e9300 | 0x7f5a664372c0 | 12076423181383605 | 12076423181394924 | 12076423181920839 | 12076423181947823 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 274 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 242368 | 0x7f5b720e9a00 | 0x7f5a66437300 | 12076423181979021 | 12076423181991558 | 12076423182214276 | 12076423182245366 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 276 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 243584 | 0x7f5b720e9900 | 0x7f5a66437340 | 12076423182268920 | 12076423182281955 | 12076423183078107 | 12076423183106296 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 278 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 248128 | 0x7f5b720e9800 | 0x7f5a66437380 | 12076423183127826 | 12076423183139067 | 12076423183556503 | 12076423183583613 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 280 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 252672 | 0x7f5b720e9700 | 0x7f5a664373c0 | 12076423183604351 | 12076423183615222 | 12076423183839540 | 12076423183866328 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 282 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 259264 | 0x7f5b720e9600 | 0x7f5a66437400 | 12076423183889371 | 12076423183902099 | 12076423184498094 | 12076423184526254 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 284 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 264832 | 0x7f5b720e9500 | 0x7f5a66437440 | 12076423184558154 | 12076423184569133 | 12076423184837610 | 12076423184864643 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 286 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 266304 | 0x7f5b720e9400 | 0x7f5a66437480 | 12076423184886153 | 12076423184897770 | 12076423185880320 | 12076423185908984 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 288 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 28 | 24 | 271872 | 0x7f5b720e9300 | 0x7f5a664374c0 | 12076423185930093 | 12076423185940959 | 12076423186454394 | 12076423186484724 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 290 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 277440 | 0x7f5b720e9a00 | 0x7f5a66437500 | 12076423186505773 | 12076423186516634 | 12076423186787831 | 12076423186814506 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 292 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 12 | 24 | 279936 | 0x7f5b720e9900 | 0x7f5a66437540 | 12076423186835485 | 12076423186846551 | 12076423187583183 | 12076423187611177 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 294 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 286528 | 0x7f5b720e9800 | 0x7f5a66437580 | 12076423187643316 | 12076423187655183 | 12076423187969420 | 12076423187996202 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 296 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 288000 | 0x7f5b720e9700 | 0x7f5a664375c0 | 12076423188024354 | 12076423188035819 | 12076423189204128 | 12076423189232780 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 298 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 32 | 24 | 294592 | 0x7f5b720e9600 | 0x7f5a66437600 | 12076423189257306 | 12076423189268447 | 12076423189877241 | 12076423189904598 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 300 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 301184 | 0x7f5b720e9500 | 0x7f5a66437640 | 12076423189926018 | 12076423189937240 | 12076423190254997 | 12076423190288241 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 302 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 12 | 24 | 304960 | 0x7f5b720e9400 | 0x7f5a66437680 | 12076423190309841 | 12076423190321397 | 12076423191197868 | 12076423191226815 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 304 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 24 | 24 | 313600 | 0x7f5b720e9300 | 0x7f5a664376c0 | 12076423191258063 | 12076423191270187 | 12076423191681063 | 12076423191709933 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 306 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 314816 | 0x7f5b720e9a00 | 0x7f5a66437700 | 12076423191731804 | 12076423191743463 | 12076423193289848 | 12076423193362173 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 308 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 317568 | 0x7f5b720e9900 | 0x7f5a66437740 | 12076423193382221 | 12076423193394280 | 12076423194185473 | 12076423194261034 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 310 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 12 | 24 | 320320 | 0x7f5b720e9800 | 0x7f5a66437780 | 12076423194280129 | 12076423194292351 | 12076423194705468 | 12076423194776441 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 312 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 12 | 24 | 324096 | 0x7f5b720e9700 | 0x7f5a664377c0 | 12076423194801237 | 12076423194813307 | 12076423195970258 | 12076423196045950 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 314 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 12 | 24 | 328896 | 0x7f5b720e9600 | 0x7f5a66437800 | 12076423196076778 | 12076423196088657 | 12076423196872970 | 12076423196944229 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 316 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 330112 | 0x7f5b720e9500 | 0x7f5a66437840 | 12076423196965279 | 12076423196977929 | 12076423200024945 | 12076423200099382 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 318 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 332864 | 0x7f5b720e9400 | 0x7f5a66437880 | 12076423200120692 | 12076423200134224 | 12076423201673411 | 12076423201744970 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 320 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 12 | 24 | 335616 | 0x7f5b720e9300 | 0x7f5a664378c0 | 12076423201765609 | 12076423201779651 | 12076423202567964 | 12076423202639272 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 322 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 12 | 24 | 339392 | 0x7f5b720e9a00 | 0x7f5a66437900 | 12076423202658938 | 12076423202670683 | 12076423204951625 | 12076423205024424 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 324 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 12 | 24 | 344192 | 0x7f5b720e9900 | 0x7f5a66437940 | 12076423205056924 | 12076423205069224 | 12076423206604091 | 12076423206674941 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 326 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 345408 | 0x7f5b720e9800 | 0x7f5a66437980 | 12076423206695790 | 12076423206707771 | 12076423212757481 | 12076423212830269 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 328 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 20 | 24 | 348160 | 0x7f5b720e9700 | 0x7f5a664379c0 | 12076423212853111 | 12076423212865161 | 12076423215903696 | 12076423215980052 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 330 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 12 | 24 | 350912 | 0x7f5b720e9600 | 0x7f5a66437a00 | 12076423216004086 | 12076423216016495 | 12076423217554723 | 12076423217627533 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 332 | 926570 | 926576 | 4194304 | 256 | 0 | 0 | 12 | 24 | 0 | 0x7f5b720e9500 | 0x7f5a66437a40 | 12076423217647701 | 12076423217659682 | 12076423222184925 | 12076423222256645 |