37 KiB
37 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 225228 | 225228 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7f9f58604280 | 17618191082395 | 17618191108316 | 17618191348476 | 17618191437046 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 225228 | 225228 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7f9f58623f80 | 17618196106138 | 17618196121120 | 17618196134240 | 17618196153037 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7f9f770e3380 | 0x7f9f58623fc0 | 17618196155947 | 17618196205120 | 17618196297920 | 17618196300333 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7f9f770e3200 | 0x7f9f58624000 | 17618196319392 | 17618196329920 | 17618196509440 | 17618196511457 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7f9f770e3080 | 0x7f9f58624040 | 17618196525927 | 17618196533920 | 17618196713600 | 17618196715782 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7f9f74a4df00 | 0x7f9f58624080 | 17618196730812 | 17618196739040 | 17618196832960 | 17618196834939 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7f9f74a4dd80 | 0x7f9f586240c0 | 17618196850889 | 17618196858560 | 17618196950400 | 17618196952356 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7f9f74a4dc00 | 0x7f9f58624100 | 17618196979016 | 17618196989760 | 17618197082081 | 17618197084113 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7f9f74a4da80 | 0x7f9f58624140 | 17618197103562 | 17618197119521 | 17618197300321 | 17618197302257 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7f9f74a4d900 | 0x7f9f58624180 | 17618197324637 | 17618197335201 | 17618197516001 | 17618197518052 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7f9f74a4d780 | 0x7f9f586241c0 | 17618197536112 | 17618197550081 | 17618197643521 | 17618197645479 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7f9f74a4d600 | 0x7f9f58624200 | 17618197665708 | 17618197676001 | 17618197769281 | 17618197771296 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7f9f770e3480 | 0x7f9f58624240 | 17618197790905 | 17618197801281 | 17618197894401 | 17618197896352 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7f9f770e3300 | 0x7f9f58624280 | 17618197916112 | 17618197926561 | 17618198106721 | 17618198108697 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7f9f770e3180 | 0x7f9f586242c0 | 17618198125057 | 17618198133921 | 17618198315042 | 17618198317002 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7f9f770e3000 | 0x7f9f58624300 | 17618198332811 | 17618198378242 | 17618198471362 | 17618198473408 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7f9f74a4de80 | 0x7f9f58624340 | 17618198494787 | 17618198518082 | 17618198611682 | 17618198613634 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7f9f74a4dd00 | 0x7f9f58624380 | 17618198637114 | 17618198647202 | 17618198740162 | 17618198742191 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7f9f74a4db80 | 0x7f9f586243c0 | 17618198760560 | 17618198768962 | 17618198949762 | 17618198951616 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7f9f74a4da00 | 0x7f9f58624400 | 17618198968975 | 17618198977922 | 17618199157282 | 17618199159340 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7f9f74a4d880 | 0x7f9f58624440 | 17618199174570 | 17618199183522 | 17618199277602 | 17618199279647 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7f9f74a4d700 | 0x7f9f58624480 | 17618199294957 | 17618199303682 | 17618199396803 | 17618199398684 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7f9f770e3580 | 0x7f9f586244c0 | 17618199418944 | 17618199429443 | 17618199522243 | 17618199524171 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7f9f770e3400 | 0x7f9f58624500 | 17618199540791 | 17618199569603 | 17618199748483 | 17618199750395 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7f9f770e3280 | 0x7f9f58624540 | 17618199764875 | 17618199780003 | 17618199959843 | 17618199961880 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7f9f770e3100 | 0x7f9f58624580 | 17618199980360 | 17618199988803 | 17618200080643 | 17618200082597 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7f9f74a4df80 | 0x7f9f586245c0 | 17618200097687 | 17618200106723 | 17618200198723 | 17618200200574 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7f9f74a4de00 | 0x7f9f58624600 | 17618200221673 | 17618200232003 | 17618200324643 | 17618200326541 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7f9f74a4dc80 | 0x7f9f58624640 | 17618200348270 | 17618200358723 | 17618200538884 | 17618200540875 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7f9f74a4db00 | 0x7f9f58624680 | 17618200557505 | 17618200575364 | 17618200756004 | 17618200757520 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7f9f74a4d980 | 0x7f9f586246c0 | 17618200771340 | 17618200779524 | 17618200873124 | 17618200874537 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7f9f74a4d800 | 0x7f9f58624700 | 17618200888617 | 17618200896804 | 17618200990724 | 17618200992094 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7f9f74a4d680 | 0x7f9f58624740 | 17618201012843 | 17618201022404 | 17618201116324 | 17618201117661 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7f9f770e3500 | 0x7f9f58624780 | 17618201132150 | 17618201140164 | 17618201319524 | 17618201321046 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7f9f770e3380 | 0x7f9f586247c0 | 17618201334835 | 17618201343204 | 17618201524164 | 17618201525720 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7f9f770e3200 | 0x7f9f58624800 | 17618201539860 | 17618201547524 | 17618201640325 | 17618201641737 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7f9f770e3080 | 0x7f9f58624840 | 17618201655817 | 17618201663845 | 17618201757445 | 17618201758824 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7f9f74a4df00 | 0x7f9f58624880 | 17618201779684 | 17618201790405 | 17618201884485 | 17618201885851 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7f9f74a4dd80 | 0x7f9f586248c0 | 17618201900141 | 17618201908005 | 17618202087205 | 17618202088716 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7f9f74a4dc00 | 0x7f9f58624900 | 17618202102776 | 17618202110565 | 17618202290565 | 17618202292081 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7f9f74a4da80 | 0x7f9f58624940 | 17618202306421 | 17618202314565 | 17618202408005 | 17618202409468 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7f9f74a4d900 | 0x7f9f58624980 | 17618202422758 | 17618202430565 | 17618202525765 | 17618202527225 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7f9f74a4d780 | 0x7f9f586249c0 | 17618202546905 | 17618202558085 | 17618202652165 | 17618202653492 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7f9f74a4d600 | 0x7f9f58624a00 | 17618202667991 | 17618202675845 | 17618202855526 | 17618202856877 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7f9f770e3480 | 0x7f9f58624a40 | 17618202870806 | 17618202878726 | 17618203060166 | 17618203061481 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7f9f770e3300 | 0x7f9f58624a80 | 17618203076031 | 17618203083846 | 17618203176486 | 17618203177939 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7f9f770e3180 | 0x7f9f58624ac0 | 17618203192828 | 17618203201446 | 17618203295046 | 17618203296426 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7f9f770e3000 | 0x7f9f58624b00 | 17618203316355 | 17618203327206 | 17618203419206 | 17618203420632 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7f9f74a4de80 | 0x7f9f58624b40 | 17618203435752 | 17618203443206 | 17618203622086 | 17618203623507 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7f9f74a4dd00 | 0x7f9f58624b80 | 17618203639407 | 17618203646886 | 17618203825927 | 17618203827312 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7f9f74a4db80 | 0x7f9f58624bc0 | 17618203841322 | 17618203849287 | 17618203943207 | 17618203944699 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7f9f74a4da00 | 0x7f9f58624c00 | 17618203959199 | 17618203967047 | 17618204062887 | 17618204064296 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7f9f74a4d880 | 0x7f9f58624c40 | 17618204083326 | 17618204094887 | 17618204188487 | 17618204189783 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7f9f74a4d700 | 0x7f9f58624c80 | 17618204205952 | 17618204213767 | 17618204393767 | 17618204395168 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7f9f770e3580 | 0x7f9f58624cc0 | 17618204409347 | 17618204417287 | 17618204597767 | 17618204599233 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7f9f770e3400 | 0x7f9f58624d00 | 17618204612992 | 17618204620807 | 17618204714567 | 17618204715990 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7f9f770e3280 | 0x7f9f58624d40 | 17618204730479 | 17618204738247 | 17618204838567 | 17618204840086 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7f9f770e3100 | 0x7f9f58624d80 | 17618204860276 | 17618204870727 | 17618204964008 | 17618204965423 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7f9f74a4df80 | 0x7f9f58624dc0 | 17618204979683 | 17618204988648 | 17618205168648 | 17618205170098 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7f9f74a4de00 | 0x7f9f58624e00 | 17618205183528 | 17618205191208 | 17618205371368 | 17618205372803 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7f9f74a4dc80 | 0x7f9f58624e40 | 17618205387013 | 17618205394888 | 17618205489928 | 17618205491410 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7f9f74a4db00 | 0x7f9f58624e80 | 17618205505570 | 17618205513768 | 17618205616808 | 17618205618187 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7f9f74a4d980 | 0x7f9f58624ec0 | 17618205638116 | 17618205648968 | 17618205741608 | 17618205742914 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7f9f74a4d800 | 0x7f9f58624f00 | 17618205757023 | 17618205764808 | 17618205943528 | 17618205944898 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7f9f74a4d680 | 0x7f9f58624f40 | 17618205959458 | 17618205968168 | 17618206147849 | 17618206149313 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7f9f770e3500 | 0x7f9f58624f80 | 17618206163683 | 17618206172009 | 17618206265609 | 17618206267060 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7f9f770e3380 | 0x7f9f58624fc0 | 17618206280560 | 17618206288489 | 17618206394569 | 17618206396077 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7f9f770e3200 | 0x7f9f58625000 | 17618206415636 | 17618206426729 | 17618206520649 | 17618206522144 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7f9f770e3080 | 0x7f9f58625040 | 17618206535973 | 17618206543689 | 17618206724329 | 17618206725639 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7f9f74a4df00 | 0x7f9f58625080 | 17618206740658 | 17618206748649 | 17618206927529 | 17618206928933 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7f9f74a4dd80 | 0x7f9f586250c0 | 17618206942953 | 17618206951209 | 17618207046569 | 17618207047920 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7f9f74a4dc00 | 0x7f9f58625100 | 17618207062220 | 17618207070089 | 17618207184649 | 17618207186067 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7f9f74a4da80 | 0x7f9f58625140 | 17618207221866 | 17618207231370 | 17618207325130 | 17618207326653 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7f9f74a4d900 | 0x7f9f58625180 | 17618207341043 | 17618207348970 | 17618207529450 | 17618207530838 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7f9f74a4d780 | 0x7f9f586251c0 | 17618207545198 | 17618207552970 | 17618207734250 | 17618207735733 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7f9f74a4d600 | 0x7f9f58625200 | 17618207750243 | 17618207758090 | 17618207853610 | 17618207855000 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7f9f770e3480 | 0x7f9f58625240 | 17618207869820 | 17618207877770 | 17618207998410 | 17618207999856 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7f9f770e3300 | 0x7f9f58625280 | 17618208019706 | 17618208030570 | 17618208124330 | 17618208125813 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7f9f770e3180 | 0x7f9f586252c0 | 17618208140263 | 17618208148330 | 17618208328331 | 17618208329718 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7f9f770e3000 | 0x7f9f58625300 | 17618208343428 | 17618208351211 | 17618208531211 | 17618208532593 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7f9f74a4de80 | 0x7f9f58625340 | 17618208548072 | 17618208555691 | 17618208649931 | 17618208651430 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7f9f74a4dd00 | 0x7f9f58625380 | 17618208668229 | 17618208676171 | 17618208802731 | 17618208804266 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7f9f74a4db80 | 0x7f9f586253c0 | 17618208824535 | 17618208835051 | 17618208929771 | 17618208931263 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7f9f74a4da00 | 0x7f9f58625400 | 17618208945522 | 17618208953611 | 17618209132971 | 17618209134408 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7f9f74a4d880 | 0x7f9f58625440 | 17618209148207 | 17618209156011 | 17618209338251 | 17618209339662 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7f9f74a4d700 | 0x7f9f58625480 | 17618209353602 | 17618209362251 | 17618209456172 | 17618209457579 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7f9f770e3580 | 0x7f9f586254c0 | 17618209471759 | 17618209479532 | 17618209610092 | 17618209611455 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7f9f770e3400 | 0x7f9f58625500 | 17618209630985 | 17618209642732 | 17618209736172 | 17618209737552 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7f9f770e3280 | 0x7f9f58625540 | 17618209752772 | 17618209761612 | 17618209941292 | 17618209942627 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7f9f770e3100 | 0x7f9f58625580 | 17618209956547 | 17618209964812 | 17618210144652 | 17618210146052 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7f9f74a4df80 | 0x7f9f586255c0 | 17618210163131 | 17618210171052 | 17618210267532 | 17618210268869 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7f9f74a4de00 | 0x7f9f58625600 | 17618210285998 | 17618210293932 | 17618210432332 | 17618210433765 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7f9f74a4dc80 | 0x7f9f58625640 | 17618210453614 | 17618210464332 | 17618210558732 | 17618210560231 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7f9f74a4db00 | 0x7f9f58625680 | 17618210575191 | 17618210582733 | 17618210762893 | 17618210764326 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7f9f74a4d980 | 0x7f9f586256c0 | 17618210777986 | 17618210786253 | 17618210965453 | 17618210966951 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7f9f74a4d800 | 0x7f9f58625700 | 17618210980781 | 17618210988653 | 17618211085453 | 17618211086788 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7f9f74a4d680 | 0x7f9f58625740 | 17618211100958 | 17618211108653 | 17618211253933 | 17618211255434 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7f9f770e3500 | 0x7f9f58625780 | 17618211275213 | 17618211286093 | 17618211381133 | 17618211382541 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7f9f770e3380 | 0x7f9f586257c0 | 17618211396500 | 17618211404493 | 17618211584653 | 17618211585995 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7f9f770e3200 | 0x7f9f58625800 | 17618211600215 | 17618211608973 | 17618211788814 | 17618211790330 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7f9f770e3080 | 0x7f9f58625840 | 17618211805210 | 17618211814254 | 17618211913774 | 17618211915197 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7f9f74a4df00 | 0x7f9f58625880 | 17618211928947 | 17618211936814 | 17618212092174 | 17618212093533 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7f9f74a4dd80 | 0x7f9f586258c0 | 17618212113252 | 17618212124174 | 17618212219694 | 17618212221189 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7f9f74a4dc00 | 0x7f9f58625900 | 17618212234999 | 17618212242894 | 17618212421454 | 17618212422824 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7f9f74a4da80 | 0x7f9f58625940 | 17618212437744 | 17618212445774 | 17618212626894 | 17618212628269 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7f9f74a4d900 | 0x7f9f58625980 | 17618212642459 | 17618212652814 | 17618212760174 | 17618212761786 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7f9f74a4d780 | 0x7f9f586259c0 | 17618212776135 | 17618212786574 | 17618212957775 | 17618212959231 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7f9f74a4d600 | 0x7f9f58625a00 | 17618212981130 | 17618212991855 | 17618213088015 | 17618213089497 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7f9f770e3480 | 0x7f9f58625a40 | 17618213104107 | 17618213114095 | 17618213295535 | 17618213297002 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7f9f770e3300 | 0x7f9f58625a80 | 17618213311942 | 17618213320175 | 17618213502575 | 17618213503957 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7f9f770e3180 | 0x7f9f58625ac0 | 17618213518346 | 17618213526255 | 17618213635855 | 17618213637303 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7f9f770e3000 | 0x7f9f58625b00 | 17618213651073 | 17618213659375 | 17618213840335 | 17618213841728 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7f9f74a4de80 | 0x7f9f58625b40 | 17618213863478 | 17618213872975 | 17618213974256 | 17618213975595 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7f9f74a4dd00 | 0x7f9f58625b80 | 17618213991474 | 17618213998896 | 17618214186096 | 17618214187749 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7f9f74a4db80 | 0x7f9f58625bc0 | 17618214201799 | 17618214209616 | 17618214394896 | 17618214396264 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7f9f74a4da00 | 0x7f9f58625c00 | 17618214412724 | 17618214421136 | 17618214543056 | 17618214544500 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7f9f74a4d880 | 0x7f9f58625c40 | 17618214560120 | 17618214567856 | 17618214774576 | 17618214798314 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7f9f74a4d700 | 0x7f9f58625c80 | 17618214813434 | 17618214824016 | 17618214934576 | 17618214935901 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7f9f770e3580 | 0x7f9f58625cc0 | 17618214950720 | 17618214958896 | 17618215143537 | 17618215144935 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7f9f770e3400 | 0x7f9f58625d00 | 17618215159645 | 17618215167537 | 17618215356337 | 17618215357680 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7f9f770e3280 | 0x7f9f58625d40 | 17618215372599 | 17618215380497 | 17618215514737 | 17618215516196 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7f9f770e3100 | 0x7f9f58625d80 | 17618215530155 | 17618215537937 | 17618215770097 | 17618215793369 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7f9f74a4df80 | 0x7f9f58625dc0 | 17618215807968 | 17618215818417 | 17618215944817 | 17618215946145 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7f9f74a4de00 | 0x7f9f58625e00 | 17618215961825 | 17618215969777 | 17618216160017 | 17618216161509 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7f9f74a4dc80 | 0x7f9f58625e40 | 17618216176329 | 17618216184657 | 17618216379218 | 17618216380684 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7f9f74a4db00 | 0x7f9f58625e80 | 17618216394874 | 17618216402258 | 17618216562258 | 17618216563539 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7f9f74a4d980 | 0x7f9f58625ec0 | 17618216577879 | 17618216585778 | 17618216869138 | 17618216890631 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7f9f74a4d800 | 0x7f9f58625f00 | 17618216905251 | 17618216915858 | 17618217064498 | 17618217065837 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7f9f74a4d680 | 0x7f9f58625f40 | 17618217081326 | 17618217088818 | 17618217298258 | 17618217319680 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7f9f770e3500 | 0x7f9f58625f80 | 17618217326910 | 17618217336979 | 17618217546579 | 17618217562494 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7f9f770e3380 | 0x7f9f58625fc0 | 17618217570884 | 17618217580979 | 17618217766739 | 17618217768189 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7f9f770e3200 | 0x7f9f58626000 | 17618217782388 | 17618217790419 | 17618218124499 | 17618218147389 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7f9f770e3080 | 0x7f9f58626040 | 17618218163499 | 17618218174259 | 17618218341779 | 17618218343194 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7f9f74a4df00 | 0x7f9f58626080 | 17618218358414 | 17618218366419 | 17618218597300 | 17618218612517 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7f9f74a4dd80 | 0x7f9f586260c0 | 17618218620897 | 17618218631060 | 17618218860180 | 17618218875531 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7f9f74a4dc00 | 0x7f9f58626100 | 17618218885170 | 17618218895540 | 17618219106740 | 17618219121684 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7f9f74a4da80 | 0x7f9f58626140 | 17618219130814 | 17618219139860 | 17618219525460 | 17618219540504 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7f9f74a4d900 | 0x7f9f58626180 | 17618219556213 | 17618219566580 | 17618219753621 | 17618219755178 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7f9f74a4d780 | 0x7f9f586261c0 | 17618219770368 | 17618219778261 | 17618220028661 | 17618220043551 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7f9f74a4d600 | 0x7f9f58626200 | 17618220051461 | 17618220061781 | 17618220309621 | 17618220324514 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7f9f770e3480 | 0x7f9f58626240 | 17618220336254 | 17618220346581 | 17618220583381 | 17618220598407 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7f9f770e3300 | 0x7f9f58626280 | 17618220607217 | 17618220617461 | 17618221072022 | 17618221086815 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7f9f770e3180 | 0x7f9f586262c0 | 17618221102294 | 17618221112982 | 17618221339062 | 17618221354368 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7f9f770e3000 | 0x7f9f58626300 | 17618221362478 | 17618221372822 | 17618221671382 | 17618221687069 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7f9f74a4de80 | 0x7f9f58626340 | 17618221696509 | 17618221705782 | 17618222004183 | 17618222023081 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7f9f74a4dd00 | 0x7f9f58626380 | 17618222033931 | 17618222044343 | 17618222340823 | 17618222363882 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7f9f74a4db80 | 0x7f9f586263c0 | 17618222372982 | 17618222382903 | 17618222940343 | 17618222959277 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7f9f74a4da00 | 0x7f9f58626400 | 17618222974627 | 17618222985304 | 17618223248984 | 17618223271049 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7f9f74a4d880 | 0x7f9f58626440 | 17618223279009 | 17618223289304 | 17618223639064 | 17618223660579 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7f9f74a4d700 | 0x7f9f58626480 | 17618223669169 | 17618223679384 | 17618224029464 | 17618224051000 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7f9f770e3580 | 0x7f9f586264c0 | 17618224059899 | 17618224070584 | 17618224417305 | 17618224439310 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7f9f770e3400 | 0x7f9f58626500 | 17618224447179 | 17618224457305 | 17618225117305 | 17618225139082 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7f9f770e3280 | 0x7f9f58626540 | 17618225155792 | 17618225165305 | 17618225612186 | 17618225633869 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7f9f770e3100 | 0x7f9f58626580 | 17618225643289 | 17618225653146 | 17618226117786 | 17618226141187 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7f9f74a4df80 | 0x7f9f586265c0 | 17618226150206 | 17618226160186 | 17618226622907 | 17618226645704 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7f9f74a4de00 | 0x7f9f58626600 | 17618226654264 | 17618226664347 | 17618227116507 | 17618227138201 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7f9f74a4dc80 | 0x7f9f58626640 | 17618227146501 | 17618227156667 | 17618228026588 | 17618228047758 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7f9f74a4db00 | 0x7f9f58626680 | 17618228064088 | 17618228074748 | 17618228928349 | 17618228949605 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7f9f74a4d980 | 0x7f9f586266c0 | 17618228957595 | 17618228968029 | 17618229854110 | 17618229875412 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7f9f74a4d800 | 0x7f9f58626700 | 17618229885832 | 17618229896030 | 17618230775710 | 17618230801398 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7f9f74a4d680 | 0x7f9f58626740 | 17618230810988 | 17618230820830 | 17618231680831 | 17618231702996 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7f9f770e3500 | 0x7f9f58626780 | 17618231712345 | 17618231722271 | 17618233420513 | 17618233492750 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7f9f770e3380 | 0x7f9f586267c0 | 17618233509350 | 17618233519873 | 17618235184834 | 17618235254645 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7f9f770e3200 | 0x7f9f58626800 | 17618235263955 | 17618235273954 | 17618236998916 | 17618237068419 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7f9f770e3080 | 0x7f9f58626840 | 17618237079949 | 17618237094916 | 17618238811558 | 17618238881713 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7f9f74a4df00 | 0x7f9f58626880 | 17618238891033 | 17618238900838 | 17618240574599 | 17618240644258 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 225228 | 225228 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7f9f74a4dd80 | 0x7f9f586268c0 | 17618240652678 | 17618240663239 | 17618244022442 | 17618244098931 |