37 KiB
37 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 189951 | 189951 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7fefa1004280 | 17039094299446 | 17039094324187 | 17039094564027 | 17039094645986 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 189951 | 189951 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7fefa1023f80 | 17039099396231 | 17039099412016 | 17039099425136 | 17039099444229 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7fefa40a4380 | 0x7fefa1023fc0 | 17039099447889 | 17039099497936 | 17039099590576 | 17039099592655 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7fefa40a4200 | 0x7fefa1024000 | 17039099614844 | 17039099624495 | 17039099802735 | 17039099804779 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7fefa40a4080 | 0x7fefa1024040 | 17039099819908 | 17039099828015 | 17039100005775 | 17039100007773 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7fefa1a0df00 | 0x7fefa1024080 | 17039100022623 | 17039100030735 | 17039100124174 | 17039100126240 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7fefa1a0dd80 | 0x7fefa10240c0 | 17039100141629 | 17039100149614 | 17039100241774 | 17039100243766 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7fefa1a0dc00 | 0x7fefa1024100 | 17039100270876 | 17039100281294 | 17039100373934 | 17039100375943 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7fefa1a0da80 | 0x7fefa1024140 | 17039100395032 | 17039100404014 | 17039100583534 | 17039100585517 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7fefa1a0d900 | 0x7fefa1024180 | 17039100603936 | 17039100628493 | 17039100808013 | 17039100810160 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7fefa1a0d780 | 0x7fefa10241c0 | 17039100832800 | 17039100843053 | 17039100936493 | 17039100938447 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7fefa1a0d600 | 0x7fefa1024200 | 17039100955956 | 17039100964013 | 17039101057133 | 17039101059043 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7fefa40a4480 | 0x7fefa1024240 | 17039101078833 | 17039101089293 | 17039101182892 | 17039101184900 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7fefa40a4300 | 0x7fefa1024280 | 17039101209689 | 17039101220332 | 17039101399852 | 17039101401913 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7fefa40a4180 | 0x7fefa10242c0 | 17039101415053 | 17039101424332 | 17039101603532 | 17039101605448 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7fefa40a4000 | 0x7fefa1024300 | 17039101623197 | 17039101631851 | 17039101726251 | 17039101728244 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7fefa1a0de80 | 0x7fefa1024340 | 17039101749633 | 17039101765771 | 17039101858891 | 17039101860800 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7fefa1a0dd00 | 0x7fefa1024380 | 17039101883400 | 17039101893771 | 17039101986091 | 17039101987957 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7fefa1a0db80 | 0x7fefa10243c0 | 17039102007296 | 17039102018091 | 17039102196970 | 17039102199061 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7fefa1a0da00 | 0x7fefa1024400 | 17039102220770 | 17039102245130 | 17039102423370 | 17039102425594 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7fefa1a0d880 | 0x7fefa1024440 | 17039102444234 | 17039102453290 | 17039102546410 | 17039102548441 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7fefa1a0d700 | 0x7fefa1024480 | 17039102565690 | 17039102591530 | 17039102684809 | 17039102687187 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7fefa40a4580 | 0x7fefa10244c0 | 17039102708996 | 17039102719369 | 17039102811529 | 17039102813423 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7fefa40a4400 | 0x7fefa1024500 | 17039102831883 | 17039102840169 | 17039103020489 | 17039103022367 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7fefa40a4280 | 0x7fefa1024540 | 17039103036887 | 17039103044969 | 17039103226088 | 17039103227541 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7fefa40a4100 | 0x7fefa1024580 | 17039103242201 | 17039103250248 | 17039103342568 | 17039103343958 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7fefa1a0df80 | 0x7fefa10245c0 | 17039103358288 | 17039103366248 | 17039103458088 | 17039103459585 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7fefa1a0de00 | 0x7fefa1024600 | 17039103479564 | 17039103490248 | 17039103583688 | 17039103585171 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7fefa1a0dc80 | 0x7fefa1024640 | 17039103600121 | 17039103608487 | 17039103787847 | 17039103789305 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7fefa1a0db00 | 0x7fefa1024680 | 17039103804195 | 17039103812167 | 17039103993927 | 17039103995449 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7fefa1a0d980 | 0x7fefa10246c0 | 17039104009529 | 17039104017287 | 17039104111686 | 17039104113136 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7fefa1a0d800 | 0x7fefa1024700 | 17039104127766 | 17039104136326 | 17039104230406 | 17039104231893 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7fefa1a0d680 | 0x7fefa1024740 | 17039104253312 | 17039104262566 | 17039104355686 | 17039104357239 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7fefa40a4500 | 0x7fefa1024780 | 17039104372069 | 17039104380166 | 17039104560006 | 17039104561393 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7fefa40a4380 | 0x7fefa10247c0 | 17039104575863 | 17039104584806 | 17039104764965 | 17039104766357 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7fefa40a4200 | 0x7fefa1024800 | 17039104782307 | 17039104790085 | 17039104882725 | 17039104884054 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7fefa40a4080 | 0x7fefa1024840 | 17039104898314 | 17039104906565 | 17039105000005 | 17039105001371 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7fefa1a0df00 | 0x7fefa1024880 | 17039105021140 | 17039105031845 | 17039105124804 | 17039105126467 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7fefa1a0dd80 | 0x7fefa10248c0 | 17039105142187 | 17039105150244 | 17039105329604 | 17039105330901 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7fefa1a0dc00 | 0x7fefa1024900 | 17039105347751 | 17039105355524 | 17039105536484 | 17039105538005 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7fefa1a0da80 | 0x7fefa1024940 | 17039105556035 | 17039105564484 | 17039105659203 | 17039105660652 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7fefa1a0d900 | 0x7fefa1024980 | 17039105676921 | 17039105684483 | 17039105778883 | 17039105780239 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7fefa1a0d780 | 0x7fefa10249c0 | 17039105802418 | 17039105813123 | 17039105906083 | 17039105907625 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7fefa1a0d600 | 0x7fefa1024a00 | 17039105922444 | 17039105930883 | 17039106109762 | 17039106111389 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7fefa40a4480 | 0x7fefa1024a40 | 17039106125969 | 17039106134722 | 17039106316002 | 17039106317353 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7fefa40a4300 | 0x7fefa1024a80 | 17039106331453 | 17039106339362 | 17039106432322 | 17039106433790 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7fefa40a4180 | 0x7fefa1024ac0 | 17039106448679 | 17039106457602 | 17039106550882 | 17039106552257 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7fefa40a4000 | 0x7fefa1024b00 | 17039106572536 | 17039106583042 | 17039106675201 | 17039106676573 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7fefa1a0de80 | 0x7fefa1024b40 | 17039106693482 | 17039106701601 | 17039106880961 | 17039106882377 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7fefa1a0dd00 | 0x7fefa1024b80 | 17039106896477 | 17039106904481 | 17039107084960 | 17039107086251 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7fefa1a0db80 | 0x7fefa1024bc0 | 17039107103821 | 17039107111520 | 17039107206080 | 17039107207478 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7fefa1a0da00 | 0x7fefa1024c00 | 17039107221227 | 17039107229280 | 17039107324160 | 17039107325604 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7fefa1a0d880 | 0x7fefa1024c40 | 17039107346824 | 17039107357280 | 17039107450080 | 17039107451521 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7fefa1a0d700 | 0x7fefa1024c80 | 17039107467850 | 17039107475840 | 17039107655199 | 17039107656655 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7fefa40a4580 | 0x7fefa1024cc0 | 17039107672195 | 17039107680319 | 17039107860479 | 17039107861979 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7fefa40a4400 | 0x7fefa1024d00 | 17039107876029 | 17039107884319 | 17039107978079 | 17039107979566 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7fefa40a4280 | 0x7fefa1024d40 | 17039107994925 | 17039108003519 | 17039108103838 | 17039108105232 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7fefa40a4100 | 0x7fefa1024d80 | 17039108125532 | 17039108135998 | 17039108229918 | 17039108231249 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7fefa1a0df80 | 0x7fefa1024dc0 | 17039108248608 | 17039108258078 | 17039108438238 | 17039108439793 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7fefa1a0de00 | 0x7fefa1024e00 | 17039108454772 | 17039108463198 | 17039108643037 | 17039108644447 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7fefa1a0dc80 | 0x7fefa1024e40 | 17039108659046 | 17039108667517 | 17039108763197 | 17039108764593 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7fefa1a0db00 | 0x7fefa1024e80 | 17039108782003 | 17039108789917 | 17039108893277 | 17039108894740 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7fefa1a0d980 | 0x7fefa1024ec0 | 17039108916469 | 17039108927197 | 17039109019677 | 17039109021046 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7fefa1a0d800 | 0x7fefa1024f00 | 17039109036736 | 17039109044477 | 17039109225116 | 17039109226530 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7fefa1a0d680 | 0x7fefa1024f40 | 17039109242380 | 17039109251516 | 17039109430396 | 17039109431824 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7fefa40a4500 | 0x7fefa1024f80 | 17039109446024 | 17039109454076 | 17039109547196 | 17039109548511 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7fefa40a4380 | 0x7fefa1024fc0 | 17039109562481 | 17039109570715 | 17039109677755 | 17039109679017 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7fefa40a4200 | 0x7fefa1025000 | 17039109698407 | 17039109709755 | 17039109803195 | 17039109804554 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7fefa40a4080 | 0x7fefa1025040 | 17039109819493 | 17039109827835 | 17039110008155 | 17039110009488 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7fefa1a0df00 | 0x7fefa1025080 | 17039110024577 | 17039110033115 | 17039110212474 | 17039110213972 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7fefa1a0dd80 | 0x7fefa10250c0 | 17039110229372 | 17039110237914 | 17039110333114 | 17039110334509 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7fefa1a0dc00 | 0x7fefa1025100 | 17039110348838 | 17039110356634 | 17039110471834 | 17039110473295 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7fefa1a0da80 | 0x7fefa1025140 | 17039110507114 | 17039110516474 | 17039110609753 | 17039110611241 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7fefa1a0d900 | 0x7fefa1025180 | 17039110627780 | 17039110636153 | 17039110815673 | 17039110817125 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7fefa1a0d780 | 0x7fefa10251c0 | 17039110831144 | 17039110839193 | 17039111019673 | 17039111021119 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7fefa1a0d600 | 0x7fefa1025200 | 17039111035858 | 17039111043993 | 17039111139032 | 17039111140355 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7fefa40a4480 | 0x7fefa1025240 | 17039111153995 | 17039111162392 | 17039111283672 | 17039111285041 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7fefa40a4300 | 0x7fefa1025280 | 17039111303991 | 17039111311992 | 17039111404952 | 17039111406378 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7fefa40a4180 | 0x7fefa10252c0 | 17039111420587 | 17039111428792 | 17039111608631 | 17039111610012 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7fefa40a4000 | 0x7fefa1025300 | 17039111623952 | 17039111631831 | 17039111812471 | 17039111814016 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7fefa1a0de80 | 0x7fefa1025340 | 17039111828856 | 17039111836631 | 17039111931351 | 17039111932923 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7fefa1a0dd00 | 0x7fefa1025380 | 17039111947652 | 17039111956151 | 17039112082070 | 17039112083358 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7fefa1a0db80 | 0x7fefa10253c0 | 17039112104028 | 17039112114710 | 17039112208630 | 17039112210055 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7fefa1a0da00 | 0x7fefa1025400 | 17039112225814 | 17039112233590 | 17039112413590 | 17039112414879 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7fefa1a0d880 | 0x7fefa1025440 | 17039112429429 | 17039112437750 | 17039112616469 | 17039112617753 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7fefa1a0d700 | 0x7fefa1025480 | 17039112631563 | 17039112639989 | 17039112733589 | 17039112735070 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7fefa40a4580 | 0x7fefa10254c0 | 17039112749679 | 17039112757749 | 17039112888309 | 17039112889695 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7fefa40a4400 | 0x7fefa1025500 | 17039112910055 | 17039112920629 | 17039113014069 | 17039113015512 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7fefa40a4280 | 0x7fefa1025540 | 17039113031341 | 17039113040149 | 17039113219028 | 17039113220456 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7fefa40a4100 | 0x7fefa1025580 | 17039113234615 | 17039113242548 | 17039113421428 | 17039113422900 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7fefa1a0df80 | 0x7fefa10255c0 | 17039113436310 | 17039113444468 | 17039113539988 | 17039113541437 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7fefa1a0de00 | 0x7fefa1025600 | 17039113557226 | 17039113565267 | 17039113703507 | 17039113704882 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7fefa1a0dc80 | 0x7fefa1025640 | 17039113726121 | 17039113736787 | 17039113831187 | 17039113832688 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7fefa1a0db00 | 0x7fefa1025680 | 17039113847578 | 17039113855507 | 17039114036627 | 17039114038122 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7fefa1a0d980 | 0x7fefa10256c0 | 17039114052552 | 17039114061266 | 17039114243346 | 17039114244836 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7fefa1a0d800 | 0x7fefa1025700 | 17039114258566 | 17039114266546 | 17039114363346 | 17039114364763 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7fefa1a0d680 | 0x7fefa1025740 | 17039114380463 | 17039114388626 | 17039114533266 | 17039114534778 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7fefa40a4500 | 0x7fefa1025780 | 17039114554838 | 17039114565425 | 17039114660305 | 17039114661665 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7fefa40a4380 | 0x7fefa10257c0 | 17039114676394 | 17039114684145 | 17039114863985 | 17039114865479 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7fefa40a4200 | 0x7fefa1025800 | 17039114879638 | 17039114887665 | 17039115067504 | 17039115068943 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7fefa40a4080 | 0x7fefa1025840 | 17039115083393 | 17039115091504 | 17039115191664 | 17039115193109 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7fefa1a0df00 | 0x7fefa1025880 | 17039115206749 | 17039115214704 | 17039115370064 | 17039115371564 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7fefa1a0dd80 | 0x7fefa10258c0 | 17039115393184 | 17039115403504 | 17039115498064 | 17039115499491 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7fefa1a0dc00 | 0x7fefa1025900 | 17039115515030 | 17039115523024 | 17039115701743 | 17039115703215 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7fefa1a0da80 | 0x7fefa1025940 | 17039115718694 | 17039115726703 | 17039115907343 | 17039115909109 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7fefa1a0d900 | 0x7fefa1025980 | 17039115923089 | 17039115931023 | 17039116037743 | 17039116039235 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7fefa1a0d780 | 0x7fefa10259c0 | 17039116053655 | 17039116063182 | 17039116234062 | 17039116235510 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7fefa1a0d600 | 0x7fefa1025a00 | 17039116256119 | 17039116266542 | 17039116362382 | 17039116363836 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7fefa40a4480 | 0x7fefa1025a40 | 17039116378536 | 17039116386222 | 17039116566701 | 17039116568100 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7fefa40a4300 | 0x7fefa1025a80 | 17039116581970 | 17039116590061 | 17039116772781 | 17039116774294 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7fefa40a4180 | 0x7fefa1025ac0 | 17039116787994 | 17039116796141 | 17039116906061 | 17039116907601 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7fefa40a4000 | 0x7fefa1025b00 | 17039116921770 | 17039116929901 | 17039117110860 | 17039117112395 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7fefa1a0de80 | 0x7fefa1025b40 | 17039117134254 | 17039117143980 | 17039117245100 | 17039117246561 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7fefa1a0dd00 | 0x7fefa1025b80 | 17039117262250 | 17039117270540 | 17039117457900 | 17039117459215 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7fefa1a0db80 | 0x7fefa1025bc0 | 17039117473294 | 17039117481420 | 17039117666539 | 17039117667979 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7fefa1a0da00 | 0x7fefa1025c00 | 17039117681938 | 17039117690859 | 17039117812939 | 17039117814315 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7fefa1a0d880 | 0x7fefa1025c40 | 17039117831284 | 17039117840139 | 17039118046378 | 17039118066637 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7fefa1a0d700 | 0x7fefa1025c80 | 17039118091807 | 17039118102378 | 17039118213098 | 17039118214763 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7fefa40a4580 | 0x7fefa1025cc0 | 17039118230183 | 17039118238378 | 17039118421578 | 17039118423017 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7fefa40a4400 | 0x7fefa1025d00 | 17039118436887 | 17039118445258 | 17039118633577 | 17039118635161 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7fefa40a4280 | 0x7fefa1025d40 | 17039118651071 | 17039118658857 | 17039118793257 | 17039118794727 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7fefa40a4100 | 0x7fefa1025d80 | 17039118808076 | 17039118815977 | 17039119047656 | 17039119088818 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7fefa1a0df80 | 0x7fefa1025dc0 | 17039119104198 | 17039119115016 | 17039119242056 | 17039119243514 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7fefa1a0de00 | 0x7fefa1025e00 | 17039119257764 | 17039119265736 | 17039119456456 | 17039119457778 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7fefa1a0dc80 | 0x7fefa1025e40 | 17039119472327 | 17039119480936 | 17039119671815 | 17039119673202 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7fefa1a0db00 | 0x7fefa1025e80 | 17039119687911 | 17039119695975 | 17039119855495 | 17039119857046 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7fefa1a0d980 | 0x7fefa1025ec0 | 17039119872596 | 17039119880295 | 17039120163334 | 17039120204517 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7fefa1a0d800 | 0x7fefa1025f00 | 17039120220276 | 17039120230534 | 17039120379974 | 17039120381441 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7fefa1a0d680 | 0x7fefa1025f40 | 17039120397701 | 17039120405254 | 17039120613413 | 17039120630794 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7fefa40a4500 | 0x7fefa1025f80 | 17039120640484 | 17039120650533 | 17039120859973 | 17039120878407 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7fefa40a4380 | 0x7fefa1025fc0 | 17039120886337 | 17039120896453 | 17039121082052 | 17039121083361 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7fefa40a4200 | 0x7fefa1026000 | 17039121100881 | 17039121108772 | 17039121443172 | 17039121457911 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7fefa40a4080 | 0x7fefa1026040 | 17039121473860 | 17039121484612 | 17039121651331 | 17039121652825 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7fefa1a0df00 | 0x7fefa1026080 | 17039121667505 | 17039121675971 | 17039121905571 | 17039121919288 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7fefa1a0dd80 | 0x7fefa10260c0 | 17039121928487 | 17039121938531 | 17039122167970 | 17039122207029 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7fefa1a0dc00 | 0x7fefa1026100 | 17039122215609 | 17039122225570 | 17039122436290 | 17039122450782 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7fefa1a0da80 | 0x7fefa1026140 | 17039122459952 | 17039122469410 | 17039122855009 | 17039122869061 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7fefa1a0d900 | 0x7fefa1026180 | 17039122887420 | 17039122898049 | 17039123085408 | 17039123086794 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7fefa1a0d780 | 0x7fefa10261c0 | 17039123102954 | 17039123110848 | 17039123361408 | 17039123379706 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7fefa1a0d600 | 0x7fefa1026200 | 17039123390746 | 17039123400928 | 17039123648767 | 17039123662258 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7fefa40a4480 | 0x7fefa1026240 | 17039123672528 | 17039123682847 | 17039123919647 | 17039123933380 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7fefa40a4300 | 0x7fefa1026280 | 17039123944050 | 17039123954527 | 17039124408606 | 17039124422156 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7fefa40a4180 | 0x7fefa10262c0 | 17039124438236 | 17039124448766 | 17039124674365 | 17039124688189 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7fefa40a4000 | 0x7fefa1026300 | 17039124696728 | 17039124706365 | 17039125004124 | 17039125017689 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7fefa1a0de80 | 0x7fefa1026340 | 17039125029389 | 17039125038844 | 17039125337724 | 17039125354490 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7fefa1a0dd00 | 0x7fefa1026380 | 17039125367729 | 17039125377884 | 17039125673883 | 17039125691160 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7fefa1a0db80 | 0x7fefa10263c0 | 17039125700150 | 17039125710363 | 17039126268122 | 17039126309252 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7fefa1a0da00 | 0x7fefa1026400 | 17039126326152 | 17039126336602 | 17039126600121 | 17039126640603 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7fefa1a0d880 | 0x7fefa1026440 | 17039126651393 | 17039126661561 | 17039127011800 | 17039127052161 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7fefa1a0d700 | 0x7fefa1026480 | 17039127061051 | 17039127071000 | 17039127422200 | 17039127462600 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7fefa40a4580 | 0x7fefa10264c0 | 17039127471879 | 17039127482199 | 17039127829239 | 17039127869738 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7fefa40a4400 | 0x7fefa1026500 | 17039127879148 | 17039127889079 | 17039128550037 | 17039128564608 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7fefa40a4280 | 0x7fefa1026540 | 17039128582288 | 17039128591797 | 17039129038996 | 17039129057124 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7fefa40a4100 | 0x7fefa1026580 | 17039129066774 | 17039129076916 | 17039129540755 | 17039129554620 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7fefa1a0df80 | 0x7fefa10265c0 | 17039129563750 | 17039129573555 | 17039130035474 | 17039130049766 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7fefa1a0de00 | 0x7fefa1026600 | 17039130058866 | 17039130069074 | 17039130519793 | 17039130560911 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7fefa1a0dc80 | 0x7fefa1026640 | 17039130570051 | 17039130580113 | 17039131449712 | 17039131494555 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7fefa1a0db00 | 0x7fefa1026680 | 17039131510874 | 17039131521391 | 17039132374670 | 17039132417298 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7fefa1a0d980 | 0x7fefa10266c0 | 17039132427368 | 17039132437230 | 17039133322988 | 17039133365321 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7fefa1a0d800 | 0x7fefa1026700 | 17039133377461 | 17039133391788 | 17039134270666 | 17039134315404 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7fefa1a0d680 | 0x7fefa1026740 | 17039134326274 | 17039134341706 | 17039135200904 | 17039135243878 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7fefa40a4500 | 0x7fefa1026780 | 17039135253747 | 17039135263144 | 17039136961540 | 17039137016067 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7fefa40a4380 | 0x7fefa10267c0 | 17039137033397 | 17039137043780 | 17039138709057 | 17039138766547 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7fefa40a4200 | 0x7fefa1026800 | 17039138776337 | 17039138786017 | 17039140510653 | 17039140571206 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7fefa40a4080 | 0x7fefa1026840 | 17039140581355 | 17039140590493 | 17039142305690 | 17039142362285 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7fefa1a0df00 | 0x7fefa1026880 | 17039142372124 | 17039142390010 | 17039144062966 | 17039144132994 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 189951 | 189951 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7fefa1a0dd80 | 0x7fefa10268c0 | 17039144142084 | 17039144169046 | 17039147525999 | 17039147591715 |