39 KiB
39 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBuffer.kd | 0 | 0 | 0 | 921580 | 921585 | 33554432 | 256 | 0 | 0 | 8 | 32 | 6464 | 0x0 | 0x7fc0c2804180 | 12076328266793044 | 12076328266837802 | 12076328267160519 | 12076328267269900 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 921580 | 921585 | 32768 | 256 | 0 | 0 | 24 | 24 | 12480 | 0x0 | 0x7fc0c2835100 | 12076328282132912 | 12076328282246095 | 12076328282252495 | 12076328282258235 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 4 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 12928 | 0x7fc1ce3b2900 | 0x7fc0c2835140 | 12076328282304692 | 12076328282317774 | 12076328282452973 | 12076328282456624 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 6 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 36 | 24 | 13632 | 0x7fc1ce3b2800 | 0x7fc0c2835180 | 12076328282500335 | 12076328282514412 | 12076328282757290 | 12076328282839105 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 8 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 14080 | 0x7fc1ce3b2700 | 0x7fc0c28351c0 | 12076328282866656 | 12076328282878089 | 12076328283120967 | 12076328283220874 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 10 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14528 | 0x7fc1ce3b2600 | 0x7fc0c2835200 | 12076328283248405 | 12076328283259845 | 12076328283385284 | 12076328283388756 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 12 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14976 | 0x7fc1ce3b2500 | 0x7fc0c2835240 | 12076328283411038 | 12076328283422884 | 12076328283548003 | 12076328283551288 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 14 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 15424 | 0x7fc1ce3b2400 | 0x7fc0c2835280 | 12076328283602293 | 12076328283613762 | 12076328283737761 | 12076328283740811 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 16 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16128 | 0x7fc1ce3b2300 | 0x7fc0c28352c0 | 12076328283768412 | 12076328283780801 | 12076328284062878 | 12076328284160350 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 18 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16832 | 0x7fc1ce3b2a00 | 0x7fc0c2835300 | 12076328284183183 | 12076328284195517 | 12076328284440794 | 12076328284537421 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 20 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 17536 | 0x7fc1ce3b2900 | 0x7fc0c2835340 | 12076328284559472 | 12076328284572153 | 12076328284696792 | 12076328284700534 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 22 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18240 | 0x7fc1ce3b2800 | 0x7fc0c2835380 | 12076328284727935 | 12076328284739831 | 12076328284865110 | 12076328284868647 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 24 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18944 | 0x7fc1ce3b2700 | 0x7fc0c28353c0 | 12076328284906737 | 12076328284918390 | 12076328285042869 | 12076328285046106 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 26 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 19904 | 0x7fc1ce3b2600 | 0x7fc0c2835400 | 12076328285073086 | 12076328285085268 | 12076328285336946 | 12076328285408620 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 28 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 20608 | 0x7fc1ce3b2500 | 0x7fc0c2835440 | 12076328285430571 | 12076328285441905 | 12076328285686702 | 12076328285753501 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 30 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 21312 | 0x7fc1ce3b2400 | 0x7fc0c2835480 | 12076328285776674 | 12076328285788302 | 12076328285912940 | 12076328285916494 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 32 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22016 | 0x7fc1ce3b2300 | 0x7fc0c28354c0 | 12076328285943133 | 12076328285955020 | 12076328286079659 | 12076328286083084 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 34 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22720 | 0x7fc1ce3b2a00 | 0x7fc0c2835500 | 12076328286122036 | 12076328286134858 | 12076328286259337 | 12076328286262497 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 36 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 23680 | 0x7fc1ce3b2900 | 0x7fc0c2835540 | 12076328286288716 | 12076328286301257 | 12076328286581894 | 12076328286648665 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 38 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 24384 | 0x7fc1ce3b2800 | 0x7fc0c2835580 | 12076328286669003 | 12076328286680453 | 12076328286923491 | 12076328286990099 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 40 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25088 | 0x7fc1ce3b2700 | 0x7fc0c28355c0 | 12076328287022319 | 12076328287034210 | 12076328287158849 | 12076328287161748 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 42 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25792 | 0x7fc1ce3b2600 | 0x7fc0c2835600 | 12076328287194309 | 12076328287206208 | 12076328287331647 | 12076328287334990 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 44 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 26496 | 0x7fc1ce3b2500 | 0x7fc0c2835640 | 12076328287376938 | 12076328287388286 | 12076328287511965 | 12076328287515265 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 46 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 27712 | 0x7fc1ce3b2400 | 0x7fc0c2835680 | 12076328287546493 | 12076328287558205 | 12076328287809402 | 12076328287875505 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 48 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 28416 | 0x7fc1ce3b2300 | 0x7fc0c28356c0 | 12076328287902144 | 12076328287915801 | 12076328288159799 | 12076328288259989 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 50 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 29120 | 0x7fc1ce3b2a00 | 0x7fc0c2835700 | 12076328288281289 | 12076328288292918 | 12076328288416757 | 12076328288420097 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 52 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30080 | 0x7fc1ce3b2900 | 0x7fc0c2835740 | 12076328288446927 | 12076328288458196 | 12076328288583475 | 12076328288587197 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 54 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30784 | 0x7fc1ce3b2800 | 0x7fc0c2835780 | 12076328288624767 | 12076328288637555 | 12076328288762673 | 12076328288765689 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 56 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32000 | 0x7fc1ce3b2700 | 0x7fc0c28357c0 | 12076328288792669 | 12076328288805873 | 12076328289056271 | 12076328289116922 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 58 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32960 | 0x7fc1ce3b2600 | 0x7fc0c2835800 | 12076328289139163 | 12076328289150030 | 12076328289393547 | 12076328289471471 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 60 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 33920 | 0x7fc1ce3b2500 | 0x7fc0c2835840 | 12076328289493542 | 12076328289505066 | 12076328289630185 | 12076328289633502 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 62 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 34880 | 0x7fc1ce3b2400 | 0x7fc0c2835880 | 12076328289660963 | 12076328289672265 | 12076328289797864 | 12076328289801123 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 64 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 35840 | 0x7fc1ce3b2300 | 0x7fc0c28358c0 | 12076328289839254 | 12076328289853543 | 12076328289978502 | 12076328289981509 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 66 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 37312 | 0x7fc1ce3b2a00 | 0x7fc0c2835900 | 12076328290011795 | 12076328290023942 | 12076328290273219 | 12076328290328403 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 68 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 38272 | 0x7fc1ce3b2900 | 0x7fc0c2835940 | 12076328290350675 | 12076328290363618 | 12076328290606816 | 12076328290661202 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 70 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 39232 | 0x7fc1ce3b2800 | 0x7fc0c2835980 | 12076328290682592 | 12076328290695135 | 12076328290820094 | 12076328290823453 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 72 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 40192 | 0x7fc1ce3b2700 | 0x7fc0c28359c0 | 12076328290849432 | 12076328290860414 | 12076328290985692 | 12076328290988941 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 74 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 41152 | 0x7fc1ce3b2600 | 0x7fc0c2835a00 | 12076328291030689 | 12076328291042172 | 12076328291166171 | 12076328291169607 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 76 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 42624 | 0x7fc1ce3b2500 | 0x7fc0c2835a40 | 12076328291196156 | 12076328291207930 | 12076328291454808 | 12076328291511642 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 78 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 43584 | 0x7fc1ce3b2400 | 0x7fc0c2835a80 | 12076328291534896 | 12076328291547927 | 12076328291791605 | 12076328291816539 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 80 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 44544 | 0x7fc1ce3b2300 | 0x7fc0c2835ac0 | 12076328291840223 | 12076328291851764 | 12076328291976563 | 12076328291979882 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 82 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 45760 | 0x7fc1ce3b2a00 | 0x7fc0c2835b00 | 12076328292010920 | 12076328292022803 | 12076328292148561 | 12076328292151812 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 84 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 46720 | 0x7fc1ce3b2900 | 0x7fc0c2835b40 | 12076328292188039 | 12076328292201201 | 12076328292325840 | 12076328292329182 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 86 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 48448 | 0x7fc1ce3b2800 | 0x7fc0c2835b80 | 12076328292354940 | 12076328292365999 | 12076328292617677 | 12076328292636793 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 88 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 49408 | 0x7fc1ce3b2700 | 0x7fc0c2835bc0 | 12076328292658373 | 12076328292669357 | 12076328292916074 | 12076328292935699 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 90 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 50368 | 0x7fc1ce3b2600 | 0x7fc0c2835c00 | 12076328292954734 | 12076328292965994 | 12076328293090633 | 12076328293093873 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 92 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 51584 | 0x7fc1ce3b2500 | 0x7fc0c2835c40 | 12076328293121103 | 12076328293131912 | 12076328293259431 | 12076328293262406 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 94 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 52544 | 0x7fc1ce3b2400 | 0x7fc0c2835c80 | 12076328293300567 | 12076328293311910 | 12076328293436869 | 12076328293439926 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 96 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 54272 | 0x7fc1ce3b2300 | 0x7fc0c2835cc0 | 12076328293466065 | 12076328293478149 | 12076328293729347 | 12076328293752527 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 98 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 55488 | 0x7fc1ce3b2a00 | 0x7fc0c2835d00 | 12076328293773806 | 12076328293786306 | 12076328294031104 | 12076328294055570 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 100 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 56704 | 0x7fc1ce3b2900 | 0x7fc0c2835d40 | 12076328294076248 | 12076328294088703 | 12076328294213502 | 12076328294216309 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 102 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 58176 | 0x7fc1ce3b2800 | 0x7fc0c2835d80 | 12076328294241656 | 12076328294252862 | 12076328294379900 | 12076328294382888 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 104 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 59392 | 0x7fc1ce3b2700 | 0x7fc0c2835dc0 | 12076328294418545 | 12076328294431580 | 12076328294556859 | 12076328294559737 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 106 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 61376 | 0x7fc1ce3b2600 | 0x7fc0c2835e00 | 12076328294585285 | 12076328294598298 | 12076328294849976 | 12076328294868801 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 108 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 62592 | 0x7fc1ce3b2500 | 0x7fc0c2835e40 | 12076328294889520 | 12076328294902615 | 12076328295151573 | 12076328295175802 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 110 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 63808 | 0x7fc1ce3b2400 | 0x7fc0c2835e80 | 12076328295198935 | 12076328295211893 | 12076328295336691 | 12076328295339857 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 112 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 65280 | 0x7fc1ce3b2300 | 0x7fc0c2835ec0 | 12076328295366046 | 12076328295377651 | 12076328295507410 | 12076328295510384 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 114 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 66496 | 0x7fc1ce3b2a00 | 0x7fc0c2835f00 | 12076328295546761 | 12076328295558289 | 12076328295683568 | 12076328295686752 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 116 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 68480 | 0x7fc1ce3b2900 | 0x7fc0c2835f40 | 12076328295713010 | 12076328295726128 | 12076328295989485 | 12076328296017226 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 118 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 69696 | 0x7fc1ce3b2800 | 0x7fc0c2835f80 | 12076328296038936 | 12076328296051885 | 12076328296296042 | 12076328296319227 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 120 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 70912 | 0x7fc1ce3b2700 | 0x7fc0c2835fc0 | 12076328296340867 | 12076328296353322 | 12076328296477961 | 12076328296480927 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 122 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 72384 | 0x7fc1ce3b2600 | 0x7fc0c2836000 | 12076328296507066 | 12076328296518280 | 12076328296654439 | 12076328296657546 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 124 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 73600 | 0x7fc1ce3b2500 | 0x7fc0c2836040 | 12076328296695366 | 12076328296707398 | 12076328296831877 | 12076328296834715 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 126 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 75840 | 0x7fc1ce3b2400 | 0x7fc0c2836080 | 12076328296860693 | 12076328296872357 | 12076328297132994 | 12076328297165039 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 128 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 77056 | 0x7fc1ce3b2300 | 0x7fc0c28360c0 | 12076328297187260 | 12076328297199394 | 12076328297444991 | 12076328297469595 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 130 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 78272 | 0x7fc1ce3b2a00 | 0x7fc0c2836100 | 12076328297490253 | 12076328297502591 | 12076328297627230 | 12076328297630223 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 132 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 80000 | 0x7fc1ce3b2900 | 0x7fc0c2836140 | 12076328297656091 | 12076328297667389 | 12076328297809788 | 12076328297812753 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 134 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 81216 | 0x7fc1ce3b2800 | 0x7fc0c2836180 | 12076328297849160 | 12076328297860987 | 12076328297985946 | 12076328297989140 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 136 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 83456 | 0x7fc1ce3b2700 | 0x7fc0c28361c0 | 12076328298020028 | 12076328298031386 | 12076328298284983 | 12076328298311640 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 138 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 84928 | 0x7fc1ce3b2600 | 0x7fc0c2836200 | 12076328298331847 | 12076328298343383 | 12076328298589621 | 12076328298616817 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 140 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 86400 | 0x7fc1ce3b2500 | 0x7fc0c2836240 | 12076328298641623 | 12076328298654260 | 12076328298780979 | 12076328298784038 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 142 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 88128 | 0x7fc1ce3b2400 | 0x7fc0c2836280 | 12076328298808974 | 12076328298821618 | 12076328298971377 | 12076328298974672 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 144 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 89600 | 0x7fc1ce3b2300 | 0x7fc0c28362c0 | 12076328299030676 | 12076328299042576 | 12076328299167695 | 12076328299171197 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 146 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 92096 | 0x7fc1ce3b2a00 | 0x7fc0c2836300 | 12076328299197967 | 12076328299211215 | 12076328299464812 | 12076328299487175 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 148 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 93568 | 0x7fc1ce3b2900 | 0x7fc0c2836340 | 12076328299508584 | 12076328299521292 | 12076328299772489 | 12076328299795878 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 150 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 95040 | 0x7fc1ce3b2800 | 0x7fc0c2836380 | 12076328299816136 | 12076328299828489 | 12076328299954088 | 12076328299957138 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 152 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 96768 | 0x7fc1ce3b2700 | 0x7fc0c28363c0 | 12076328299982896 | 12076328299994247 | 12076328300152326 | 12076328300155396 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 154 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 98240 | 0x7fc1ce3b2600 | 0x7fc0c2836400 | 12076328300192926 | 12076328300204965 | 12076328300330244 | 12076328300333618 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 156 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 100736 | 0x7fc1ce3b2500 | 0x7fc0c2836440 | 12076328300359496 | 12076328300370884 | 12076328300624801 | 12076328300647090 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 158 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 102208 | 0x7fc1ce3b2400 | 0x7fc0c2836480 | 12076328300668179 | 12076328300679681 | 12076328300927039 | 12076328300949612 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 160 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 103680 | 0x7fc1ce3b2300 | 0x7fc0c28364c0 | 12076328300969940 | 12076328300980958 | 12076328301106237 | 12076328301109660 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 162 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 105664 | 0x7fc1ce3b2a00 | 0x7fc0c2836500 | 12076328301135007 | 12076328301145916 | 12076328301310395 | 12076328301314070 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 164 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 107136 | 0x7fc1ce3b2900 | 0x7fc0c2836540 | 12076328301349906 | 12076328301361274 | 12076328301486553 | 12076328301489626 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 166 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 109888 | 0x7fc1ce3b2800 | 0x7fc0c2836580 | 12076328301516135 | 12076328301528153 | 12076328301783990 | 12076328301806735 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 168 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 111360 | 0x7fc1ce3b2700 | 0x7fc0c28365c0 | 12076328301828015 | 12076328301841110 | 12076328302090228 | 12076328302113816 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 170 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 112832 | 0x7fc1ce3b2600 | 0x7fc0c2836600 | 12076328302136859 | 12076328302149427 | 12076328302275026 | 12076328302278342 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 172 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 114816 | 0x7fc1ce3b2500 | 0x7fc0c2836640 | 12076328302303909 | 12076328302316945 | 12076328302489104 | 12076328302492410 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 174 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 116288 | 0x7fc1ce3b2400 | 0x7fc0c2836680 | 12076328302528587 | 12076328302541583 | 12076328302667022 | 12076328302670280 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 176 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 119040 | 0x7fc1ce3b2300 | 0x7fc0c28366c0 | 12076328302696369 | 12076328302707982 | 12076328302964139 | 12076328302986678 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 178 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 120768 | 0x7fc1ce3b2a00 | 0x7fc0c2836700 | 12076328303011745 | 12076328303023019 | 12076328303267976 | 12076328303295001 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 180 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 122496 | 0x7fc1ce3b2900 | 0x7fc0c2836740 | 12076328303317523 | 12076328303328936 | 12076328303454215 | 12076328303457353 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 182 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 124736 | 0x7fc1ce3b2800 | 0x7fc0c2836780 | 12076328303482750 | 12076328303494214 | 12076328303676293 | 12076328303679416 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 184 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 126464 | 0x7fc1ce3b2700 | 0x7fc0c28367c0 | 12076328303715833 | 12076328303729252 | 12076328303855491 | 12076328303858879 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 186 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 127936 | 0x7fc1ce3b2600 | 0x7fc0c2836800 | 12076328303884727 | 12076328303897250 | 12076328304193568 | 12076328304217075 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 188 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 129664 | 0x7fc1ce3b2500 | 0x7fc0c2836840 | 12076328304238034 | 12076328304250687 | 12076328304496765 | 12076328304519777 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 190 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 131392 | 0x7fc1ce3b2400 | 0x7fc0c2836880 | 12076328304542760 | 12076328304556124 | 12076328304682523 | 12076328304686267 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 192 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 133632 | 0x7fc1ce3b2300 | 0x7fc0c28368c0 | 12076328304712315 | 12076328304724923 | 12076328304916601 | 12076328304919851 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 194 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 135360 | 0x7fc1ce3b2a00 | 0x7fc0c2836900 | 12076328304956910 | 12076328304969240 | 12076328305095799 | 12076328305099445 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 196 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 136832 | 0x7fc1ce3b2900 | 0x7fc0c2836940 | 12076328305126014 | 12076328305139319 | 12076328305421876 | 12076328305446179 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 198 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 138560 | 0x7fc1ce3b2800 | 0x7fc0c2836980 | 12076328305468711 | 12076328305481555 | 12076328305732913 | 12076328305759321 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 200 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 140288 | 0x7fc1ce3b2700 | 0x7fc0c28369c0 | 12076328305780941 | 12076328305793393 | 12076328305918831 | 12076328305922043 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 202 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 142784 | 0x7fc1ce3b2600 | 0x7fc0c2836a00 | 12076328305949234 | 12076328305959791 | 12076328306169869 | 12076328306197075 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 204 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 144768 | 0x7fc1ce3b2500 | 0x7fc0c2836a40 | 12076328306228493 | 12076328306239948 | 12076328306370027 | 12076328306373392 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 206 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 145728 | 0x7fc1ce3b2400 | 0x7fc0c2836a80 | 12076328306399170 | 12076328306411307 | 12076328306718024 | 12076328306740224 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 208 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 147712 | 0x7fc1ce3b2300 | 0x7fc0c2836ac0 | 12076328306761123 | 12076328306772263 | 12076328307024101 | 12076328307051893 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 210 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 149696 | 0x7fc1ce3b2a00 | 0x7fc0c2836b00 | 12076328307073984 | 12076328307086500 | 12076328307214019 | 12076328307217321 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 212 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 152192 | 0x7fc1ce3b2900 | 0x7fc0c2836b40 | 12076328307242718 | 12076328307254019 | 12076328307481057 | 12076328307507219 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 214 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 154176 | 0x7fc1ce3b2800 | 0x7fc0c2836b80 | 12076328307538868 | 12076328307551136 | 12076328307677535 | 12076328307680822 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 216 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 155648 | 0x7fc1ce3b2700 | 0x7fc0c2836bc0 | 12076328307706550 | 12076328307717854 | 12076328308046011 | 12076328308073191 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 218 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 157632 | 0x7fc1ce3b2600 | 0x7fc0c2836c00 | 12076328308094771 | 12076328308107451 | 12076328308359448 | 12076328308385832 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 220 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 159616 | 0x7fc1ce3b2500 | 0x7fc0c2836c40 | 12076328308406601 | 12076328308419448 | 12076328308547447 | 12076328308550799 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 222 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 162368 | 0x7fc1ce3b2400 | 0x7fc0c2836c80 | 12076328308576006 | 12076328308589366 | 12076328308832404 | 12076328308858491 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 224 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 164608 | 0x7fc1ce3b2300 | 0x7fc0c2836cc0 | 12076328308889107 | 12076328308902163 | 12076328309031602 | 12076328309035229 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 226 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 166336 | 0x7fc1ce3b2a00 | 0x7fc0c2836d00 | 12076328309060666 | 12076328309071922 | 12076328309446638 | 12076328309476750 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 228 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 168576 | 0x7fc1ce3b2900 | 0x7fc0c2836d40 | 12076328309498029 | 12076328309509357 | 12076328309760075 | 12076328309786235 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 230 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 170816 | 0x7fc1ce3b2800 | 0x7fc0c2836d80 | 12076328309808376 | 12076328309820075 | 12076328309948873 | 12076328309952123 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 232 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 174080 | 0x7fc1ce3b2700 | 0x7fc0c2836dc0 | 12076328309977791 | 12076328309990473 | 12076328310268230 | 12076328310291504 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 234 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 176576 | 0x7fc1ce3b2600 | 0x7fc0c2836e00 | 12076328310323363 | 12076328310334790 | 12076328310470468 | 12076328310473672 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 236 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 177792 | 0x7fc1ce3b2500 | 0x7fc0c2836e40 | 12076328310499410 | 12076328310511268 | 12076328310933824 | 12076328310957331 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 238 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 180288 | 0x7fc1ce3b2400 | 0x7fc0c2836e80 | 12076328310980524 | 12076328310991423 | 12076328311257501 | 12076328311284690 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 240 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 182784 | 0x7fc1ce3b2300 | 0x7fc0c2836ec0 | 12076328311304076 | 12076328311315260 | 12076328311450619 | 12076328311453844 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 242 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 186304 | 0x7fc1ce3b2a00 | 0x7fc0c2836f00 | 12076328311481495 | 12076328311491899 | 12076328311806136 | 12076328311832137 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 244 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 189312 | 0x7fc1ce3b2900 | 0x7fc0c2836f40 | 12076328311865519 | 12076328311876855 | 12076328312028694 | 12076328312032049 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 246 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 190784 | 0x7fc1ce3b2800 | 0x7fc0c2836f80 | 12076328312058758 | 12076328312071093 | 12076328312587568 | 12076328312613850 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 248 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 193792 | 0x7fc1ce3b2700 | 0x7fc0c2836fc0 | 12076328312635360 | 12076328312647728 | 12076328312949165 | 12076328312975372 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 250 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 196800 | 0x7fc1ce3b2600 | 0x7fc0c2837000 | 12076328312995659 | 12076328313006604 | 12076328313159883 | 12076328313163421 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 252 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 201088 | 0x7fc1ce3b2500 | 0x7fc0c2837040 | 12076328313190341 | 12076328313204043 | 12076328313588519 | 12076328313611744 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 254 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 204608 | 0x7fc1ce3b2400 | 0x7fc0c2837080 | 12076328313643133 | 12076328313654438 | 12076328313829637 | 12076328313832845 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 256 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 206080 | 0x7fc1ce3b2300 | 0x7fc0c28370c0 | 12076328313858964 | 12076328313872516 | 12076328314481310 | 12076328314504854 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 258 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 209600 | 0x7fc1ce3b2a00 | 0x7fc0c2837100 | 12076328314527316 | 12076328314539550 | 12076328314869947 | 12076328314892695 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 260 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 213120 | 0x7fc1ce3b2900 | 0x7fc0c2837140 | 12076328314916589 | 12076328314927706 | 12076328315105785 | 12076328315109298 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 262 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 218176 | 0x7fc1ce3b2800 | 0x7fc0c2837180 | 12076328315136568 | 12076328315147544 | 12076328315602740 | 12076328315625367 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 264 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 222208 | 0x7fc1ce3b2700 | 0x7fc0c28371c0 | 12076328315656605 | 12076328315669139 | 12076328315868177 | 12076328315890389 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 266 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 223936 | 0x7fc1ce3b2600 | 0x7fc0c2837200 | 12076328315909935 | 12076328315921137 | 12076328316623050 | 12076328316652245 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 268 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 227968 | 0x7fc1ce3b2500 | 0x7fc0c2837240 | 12076328316674667 | 12076328316685770 | 12076328317058246 | 12076328317085961 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 270 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 232000 | 0x7fc1ce3b2400 | 0x7fc0c2837280 | 12076328317112040 | 12076328317123206 | 12076328317325764 | 12076328317352116 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 272 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 237824 | 0x7fc1ce3b2300 | 0x7fc0c28372c0 | 12076328317372964 | 12076328317384003 | 12076328317909438 | 12076328317935410 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 274 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 242368 | 0x7fc1ce3b2a00 | 0x7fc0c2837300 | 12076328317968030 | 12076328317979357 | 12076328318237755 | 12076328318269951 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 276 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 243584 | 0x7fc1ce3b2900 | 0x7fc0c2837340 | 12076328318290960 | 12076328318303034 | 12076328319100947 | 12076328319129479 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 278 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 248128 | 0x7fc1ce3b2800 | 0x7fc0c2837380 | 12076328319154806 | 12076328319166066 | 12076328319587502 | 12076328319613749 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 280 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 252672 | 0x7fc1ce3b2700 | 0x7fc0c28373c0 | 12076328319637002 | 12076328319648462 | 12076328319873100 | 12076328319898748 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 282 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 259264 | 0x7fc1ce3b2600 | 0x7fc0c2837400 | 12076328319920669 | 12076328319932939 | 12076328320529253 | 12076328320556331 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 284 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 264832 | 0x7fc1ce3b2500 | 0x7fc0c2837440 | 12076328320588520 | 12076328320601253 | 12076328320871010 | 12076328320894018 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 286 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 266304 | 0x7fc1ce3b2400 | 0x7fc0c2837480 | 12076328320915799 | 12076328320926850 | 12076328321911160 | 12076328321941896 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 288 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 28 | 24 | 271872 | 0x7fc1ce3b2300 | 0x7fc0c28374c0 | 12076328321962213 | 12076328321973240 | 12076328322485715 | 12076328322513037 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 290 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 277440 | 0x7fc1ce3b2a00 | 0x7fc0c2837500 | 12076328322538134 | 12076328322549234 | 12076328322820432 | 12076328322842910 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 292 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 12 | 24 | 279936 | 0x7fc1ce3b2900 | 0x7fc0c2837540 | 12076328322865682 | 12076328322877231 | 12076328323614664 | 12076328323648066 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 294 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 286528 | 0x7fc1ce3b2800 | 0x7fc0c2837580 | 12076328323679785 | 12076328323691303 | 12076328324006820 | 12076328324033843 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 296 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 288000 | 0x7fc1ce3b2700 | 0x7fc0c28375c0 | 12076328324060243 | 12076328324071620 | 12076328325242329 | 12076328325266614 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 298 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 32 | 24 | 294592 | 0x7fc1ce3b2600 | 0x7fc0c2837600 | 12076328325292813 | 12076328325304088 | 12076328325913202 | 12076328325936920 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 300 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 301184 | 0x7fc1ce3b2500 | 0x7fc0c2837640 | 12076328325963039 | 12076328325975762 | 12076328326294799 | 12076328326323589 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 302 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 12 | 24 | 304960 | 0x7fc1ce3b2400 | 0x7fc0c2837680 | 12076328326349387 | 12076328326360398 | 12076328327238150 | 12076328327267373 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 304 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 24 | 24 | 313600 | 0x7fc1ce3b2300 | 0x7fc0c28376c0 | 12076328327303049 | 12076328327315909 | 12076328327724385 | 12076328327752785 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 306 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 314816 | 0x7fc1ce3b2a00 | 0x7fc0c2837700 | 12076328327775457 | 12076328327788385 | 12076328329338130 | 12076328329409243 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 308 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 317568 | 0x7fc1ce3b2900 | 0x7fc0c2837740 | 12076328329433268 | 12076328329446494 | 12076328330240888 | 12076328330315778 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 310 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 12 | 24 | 320320 | 0x7fc1ce3b2800 | 0x7fc0c2837780 | 12076328330335795 | 12076328330349046 | 12076328330762483 | 12076328330832368 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 312 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 12 | 24 | 324096 | 0x7fc1ce3b2700 | 0x7fc0c28377c0 | 12076328330856042 | 12076328330867602 | 12076328332025833 | 12076328332098802 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 314 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 12 | 24 | 328896 | 0x7fc1ce3b2600 | 0x7fc0c2837800 | 12076328332133025 | 12076328332148552 | 12076328332933986 | 12076328333006859 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 316 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 330112 | 0x7fc1ce3b2500 | 0x7fc0c2837840 | 12076328333028720 | 12076328333040865 | 12076328336096201 | 12076328336166511 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 318 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 332864 | 0x7fc1ce3b2400 | 0x7fc0c2837880 | 12076328336195776 | 12076328336207400 | 12076328337749468 | 12076328337820415 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 320 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 12 | 24 | 335616 | 0x7fc1ce3b2300 | 0x7fc0c28378c0 | 12076328337848287 | 12076328337860667 | 12076328338649301 | 12076328338723804 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 322 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 12 | 24 | 339392 | 0x7fc1ce3b2a00 | 0x7fc0c2837900 | 12076328338747668 | 12076328338759380 | 12076328341041122 | 12076328341111622 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 324 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 12 | 24 | 344192 | 0x7fc1ce3b2900 | 0x7fc0c2837940 | 12076328341146376 | 12076328341158241 | 12076328342692949 | 12076328342764133 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 326 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 345408 | 0x7fc1ce3b2800 | 0x7fc0c2837980 | 12076328342787035 | 12076328342799028 | 12076328348854340 | 12076328348924932 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 328 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 20 | 24 | 348160 | 0x7fc1ce3b2700 | 0x7fc0c28379c0 | 12076328348949458 | 12076328348960739 | 12076328352004075 | 12076328352077892 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 330 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 12 | 24 | 350912 | 0x7fc1ce3b2600 | 0x7fc0c2837a00 | 12076328352100574 | 12076328352112075 | 12076328353651102 | 12076328353722028 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 332 | 921580 | 921585 | 4194304 | 256 | 0 | 0 | 12 | 24 | 0 | 0x7fc1ce3b2500 | 0x7fc0c2837a40 | 12076328353744509 | 12076328353758782 | 12076328358285786 | 12076328358356250 |