43 KiB
43 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | SQ_INSTS_SMEM | SQ_INST_LEVEL_SMEM | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBuffer.kd | 0 | 0 | 0 | 936496 | 936501 | 33554432 | 256 | 0 | 0 | 8 | 32 | 6464 | 0x0 | 0x7f17e8404180 | 4194304 | 3122666 | 398904176 | 12076630480743351 | 12076630718390515 | 12076630718714354 | 12076630718822006 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 936496 | 936501 | 32768 | 256 | 0 | 0 | 24 | 24 | 12480 | 0x0 | 0x7f17e8435100 | 512 | 21524 | 2754256 | 12076630733442442 | 12076630733749898 | 12076630733756458 | 12076630733761836 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 4 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 12928 | 0x7f18f4030900 | 0x7f17e8435140 | 65536 | 146806 | 18775720 | 12076630733826656 | 12076630734045577 | 12076630734179017 | 12076630734183330 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 6 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 36 | 24 | 13632 | 0x7f18f4030800 | 0x7f17e8435180 | 65536 | 166800 | 21363552 | 12076630734250836 | 12076630734424456 | 12076630734676455 | 12076630734744404 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 8 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 14080 | 0x7f18f4030700 | 0x7f17e84351c0 | 65536 | 145312 | 18687568 | 12076630734769059 | 12076630734956294 | 12076630735209893 | 12076630735278627 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 10 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14528 | 0x7f18f4030600 | 0x7f17e8435200 | 65536 | 150966 | 19402760 | 12076630735302752 | 12076630735488292 | 12076630735621092 | 12076630735624911 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 12 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14976 | 0x7f18f4030500 | 0x7f17e8435240 | 65536 | 143290 | 18432448 | 12076630735674393 | 12076630735852771 | 12076630735986530 | 12076630735990331 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 14 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 15424 | 0x7f18f4030400 | 0x7f17e8435280 | 131072 | 227390 | 29160816 | 12076630736069599 | 12076630736239969 | 12076630736372449 | 12076630736376349 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 16 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16128 | 0x7f18f4030300 | 0x7f17e84352c0 | 131072 | 189048 | 24236312 | 12076630736425691 | 12076630736594848 | 12076630736859327 | 12076630736901155 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 18 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16832 | 0x7f18f4030a00 | 0x7f17e8435300 | 65536 | 148268 | 19040936 | 12076630736924379 | 12076630737129406 | 12076630737382525 | 12076630737423557 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 20 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 17536 | 0x7f18f4030900 | 0x7f17e8435340 | 131072 | 225494 | 28835256 | 12076630737447872 | 12076630737636284 | 12076630737769244 | 12076630737772967 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 22 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18240 | 0x7f18f4030800 | 0x7f17e8435380 | 131072 | 224970 | 28826816 | 12076630737822008 | 12076630737987003 | 12076630738122203 | 12076630738126284 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 24 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18944 | 0x7f18f4030700 | 0x7f17e84353c0 | 131072 | 226920 | 29124800 | 12076630738189021 | 12076630738358362 | 12076630738491961 | 12076630738495431 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 26 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 19904 | 0x7f18f4030600 | 0x7f17e8435400 | 131072 | 188884 | 24133824 | 12076630738544602 | 12076630738707800 | 12076630738967000 | 12076630739033422 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 28 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 20608 | 0x7f18f4030500 | 0x7f17e8435440 | 65536 | 145354 | 18673600 | 12076630739060312 | 12076630739245559 | 12076630739502998 | 12076630739569298 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 30 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 21312 | 0x7f18f4030400 | 0x7f17e8435480 | 131072 | 225206 | 28872752 | 12076630739595898 | 12076630739772117 | 12076630739904916 | 12076630739908349 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 32 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22016 | 0x7f18f4030300 | 0x7f17e84354c0 | 131072 | 219560 | 28258888 | 12076630739957340 | 12076630740132275 | 12076630740260595 | 12076630740264552 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 34 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22720 | 0x7f18f4030a00 | 0x7f17e8435500 | 131072 | 264056 | 33825168 | 12076630740326287 | 12076630740491314 | 12076630740667473 | 12076630740671338 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 36 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 23680 | 0x7f18f4030900 | 0x7f17e8435540 | 131072 | 180248 | 23012800 | 12076630740719638 | 12076630740889393 | 12076630741144752 | 12076630741211082 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 38 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 24384 | 0x7f18f4030800 | 0x7f17e8435580 | 65536 | 152108 | 19358000 | 12076630741236900 | 12076630741422351 | 12076630741680270 | 12076630741747320 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 40 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25088 | 0x7f18f4030700 | 0x7f17e84355c0 | 131072 | 240572 | 30745160 | 12076630741770152 | 12076630741952429 | 12076630742085388 | 12076630742089256 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 42 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25792 | 0x7f18f4030600 | 0x7f17e8435600 | 131072 | 227926 | 29102264 | 12076630742137025 | 12076630742315147 | 12076630742445387 | 12076630742449195 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 44 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 26496 | 0x7f18f4030500 | 0x7f17e8435640 | 131072 | 238044 | 30586152 | 12076630742511051 | 12076630742675146 | 12076630742808906 | 12076630742812662 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 46 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 27712 | 0x7f18f4030400 | 0x7f17e8435680 | 131072 | 214086 | 27454552 | 12076630742860410 | 12076630743039145 | 12076630743299624 | 12076630743365810 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 48 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 28416 | 0x7f18f4030300 | 0x7f17e84356c0 | 65536 | 151892 | 19296600 | 12076630743392941 | 12076630743572743 | 12076630743826662 | 12076630743893562 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 50 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 29120 | 0x7f18f4030a00 | 0x7f17e8435700 | 131072 | 227084 | 29063024 | 12076630743916916 | 12076630744096741 | 12076630744229700 | 12076630744233504 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 52 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30080 | 0x7f18f4030900 | 0x7f17e8435740 | 131072 | 229102 | 29379856 | 12076630744284449 | 12076630744448740 | 12076630744578819 | 12076630744582634 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 54 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30784 | 0x7f18f4030800 | 0x7f17e8435780 | 131072 | 223660 | 28589792 | 12076630744643166 | 12076630744804258 | 12076630744933858 | 12076630744937734 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 56 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32000 | 0x7f18f4030700 | 0x7f17e84357c0 | 131072 | 188756 | 24135584 | 12076630744985393 | 12076630745172737 | 12076630745435136 | 12076630745501092 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 58 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32960 | 0x7f18f4030600 | 0x7f17e8435800 | 65536 | 149072 | 19052288 | 12076630745525418 | 12076630745703935 | 12076630745960734 | 12076630746027231 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 60 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 33920 | 0x7f18f4030500 | 0x7f17e8435840 | 131072 | 221292 | 28294208 | 12076630746054892 | 12076630746232413 | 12076630746368733 | 12076630746372603 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 62 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 34880 | 0x7f18f4030400 | 0x7f17e8435880 | 131072 | 224710 | 28664736 | 12076630746420783 | 12076630746583132 | 12076630746718331 | 12076630746721993 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 64 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 35840 | 0x7f18f4030300 | 0x7f17e84358c0 | 131072 | 221994 | 28400584 | 12076630746783147 | 12076630746946171 | 12076630747076730 | 12076630747081081 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 66 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 37312 | 0x7f18f4030a00 | 0x7f17e8435900 | 131072 | 217500 | 27821104 | 12076630747129852 | 12076630747303289 | 12076630747563928 | 12076630747631135 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 68 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 38272 | 0x7f18f4030900 | 0x7f17e8435940 | 65536 | 145802 | 18533032 | 12076630747657163 | 12076630747834007 | 12076630748087127 | 12076630748154638 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 70 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 39232 | 0x7f18f4030800 | 0x7f17e8435980 | 131072 | 227466 | 29112696 | 12076630748178493 | 12076630748364246 | 12076630748501205 | 12076630748504940 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 72 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 40192 | 0x7f18f4030700 | 0x7f17e84359c0 | 131072 | 228766 | 29163784 | 12076630748553921 | 12076630748717684 | 12076630748854324 | 12076630748858297 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 74 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 41152 | 0x7f18f4030600 | 0x7f17e8435a00 | 131072 | 217996 | 27926896 | 12076630748919220 | 12076630749086643 | 12076630749218962 | 12076630749222755 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 76 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 42624 | 0x7f18f4030500 | 0x7f17e8435a40 | 131072 | 183100 | 23413936 | 12076630749271796 | 12076630749443922 | 12076630749703761 | 12076630749770233 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 78 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 43584 | 0x7f18f4030400 | 0x7f17e8435a80 | 65536 | 152676 | 19429816 | 12076630749794378 | 12076630749972560 | 12076630750232559 | 12076630750330926 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 80 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 44544 | 0x7f18f4030300 | 0x7f17e8435ac0 | 131072 | 223680 | 28697848 | 12076630750354861 | 12076630750548078 | 12076630750684717 | 12076630750688662 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 82 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 45760 | 0x7f18f4030a00 | 0x7f17e8435b00 | 131072 | 226080 | 29158928 | 12076630750736942 | 12076630750906636 | 12076630751043756 | 12076630751048231 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 84 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 46720 | 0x7f18f4030900 | 0x7f17e8435b40 | 131072 | 225830 | 28997752 | 12076630751108353 | 12076630751277195 | 12076630751411114 | 12076630751415093 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 86 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 48448 | 0x7f18f4030800 | 0x7f17e8435b80 | 131072 | 180756 | 23135336 | 12076630751465056 | 12076630751622794 | 12076630751892553 | 12076630751963002 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 88 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 49408 | 0x7f18f4030700 | 0x7f17e8435bc0 | 65536 | 149440 | 19114736 | 12076630751989592 | 12076630752170152 | 12076630752426471 | 12076630752493219 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 90 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 50368 | 0x7f18f4030600 | 0x7f17e8435c00 | 131072 | 262266 | 33623728 | 12076630752519848 | 12076630752699110 | 12076630752828069 | 12076630752832029 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 92 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 51584 | 0x7f18f4030500 | 0x7f17e8435c40 | 131072 | 227186 | 29060408 | 12076630752881821 | 12076630753052069 | 12076630753188388 | 12076630753191978 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 94 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 52544 | 0x7f18f4030400 | 0x7f17e8435c80 | 131072 | 230542 | 29470864 | 12076630753253212 | 12076630753416867 | 12076630753551107 | 12076630753554743 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 96 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 54272 | 0x7f18f4030300 | 0x7f17e8435cc0 | 131072 | 177778 | 22873048 | 12076630753602021 | 12076630753773186 | 12076630754037505 | 12076630754103965 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 98 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 55488 | 0x7f18f4030a00 | 0x7f17e8435d00 | 65536 | 173192 | 22154512 | 12076630754130945 | 12076630754309184 | 12076630754565183 | 12076630754631786 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 100 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 56704 | 0x7f18f4030900 | 0x7f17e8435d40 | 131072 | 227532 | 29252136 | 12076630754654709 | 12076630754831742 | 12076630754965662 | 12076630754969194 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 102 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 58176 | 0x7f18f4030800 | 0x7f17e8435d80 | 131072 | 229234 | 29409264 | 12076630755019708 | 12076630755193341 | 12076630755334460 | 12076630755338551 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 104 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 59392 | 0x7f18f4030700 | 0x7f17e8435dc0 | 131072 | 228260 | 29183648 | 12076630755399925 | 12076630755561499 | 12076630755699419 | 12076630755703179 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 106 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 61376 | 0x7f18f4030600 | 0x7f17e8435e00 | 131072 | 225254 | 28764944 | 12076630755751660 | 12076630755919578 | 12076630756178297 | 12076630756245338 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 108 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 62592 | 0x7f18f4030500 | 0x7f17e8435e40 | 65536 | 149242 | 19063064 | 12076630756272358 | 12076630756448696 | 12076630756708375 | 12076630756774753 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 110 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 63808 | 0x7f18f4030400 | 0x7f17e8435e80 | 131072 | 227156 | 29014288 | 12076630756799128 | 12076630756979894 | 12076630757113814 | 12076630757118462 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 112 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 65280 | 0x7f18f4030300 | 0x7f17e8435ec0 | 131072 | 227782 | 28907472 | 12076630757168094 | 12076630757331253 | 12076630757470293 | 12076630757474214 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 114 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 66496 | 0x7f18f4030a00 | 0x7f17e8435f00 | 131072 | 227102 | 29022864 | 12076630757534035 | 12076630757693812 | 12076630757829171 | 12076630757832911 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 116 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 68480 | 0x7f18f4030900 | 0x7f17e8435f40 | 131072 | 227088 | 29089344 | 12076630757880630 | 12076630758053810 | 12076630758311250 | 12076630758378676 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 118 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 69696 | 0x7f18f4030800 | 0x7f17e8435f80 | 65536 | 147704 | 18861032 | 12076630758405416 | 12076630758579409 | 12076630758833328 | 12076630758899234 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 120 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 70912 | 0x7f18f4030700 | 0x7f17e8435fc0 | 131072 | 225116 | 28894504 | 12076630758925974 | 12076630759114927 | 12076630759247406 | 12076630759251199 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 122 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 72384 | 0x7f18f4030600 | 0x7f17e8436000 | 131072 | 226356 | 28938968 | 12076630759300401 | 12076630759463085 | 12076630759602125 | 12076630759606019 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 124 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 73600 | 0x7f18f4030500 | 0x7f17e8436040 | 131072 | 225464 | 28891992 | 12076630759666862 | 12076630759827084 | 12076630759958124 | 12076630759961801 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 126 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 75840 | 0x7f18f4030400 | 0x7f17e8436080 | 131072 | 176088 | 22573592 | 12076630760013808 | 12076630760177483 | 12076630760446122 | 12076630760512545 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 128 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 77056 | 0x7f18f4030300 | 0x7f17e84360c0 | 65536 | 146200 | 18638136 | 12076630760536089 | 12076630760720041 | 12076630760976040 | 12076630761018497 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 130 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 78272 | 0x7f18f4030a00 | 0x7f17e8436100 | 131072 | 264440 | 33553728 | 12076630761040888 | 12076630761222279 | 12076630761352679 | 12076630761356676 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 132 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 80000 | 0x7f18f4030900 | 0x7f17e8436140 | 131072 | 197214 | 25313256 | 12076630761405857 | 12076630761574598 | 12076630761721477 | 12076630761725392 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 134 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 81216 | 0x7f18f4030800 | 0x7f17e8436180 | 131072 | 225482 | 28825616 | 12076630761785584 | 12076630761943076 | 12076630762078116 | 12076630762082105 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 136 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 83456 | 0x7f18f4030700 | 0x7f17e84361c0 | 131072 | 180478 | 23151528 | 12076630762129794 | 12076630762300995 | 12076630762570114 | 12076630762591432 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 138 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 84928 | 0x7f18f4030600 | 0x7f17e8436200 | 65536 | 180078 | 23066240 | 12076630762634322 | 12076630762792833 | 12076630763090272 | 12076630763113874 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 140 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 86400 | 0x7f18f4030500 | 0x7f17e8436240 | 131072 | 233184 | 29574320 | 12076630763158197 | 12076630763319871 | 12076630763454111 | 12076630763458125 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 142 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 88128 | 0x7f18f4030400 | 0x7f17e8436280 | 131072 | 199190 | 25603288 | 12076630763506124 | 12076630763673150 | 12076630763825150 | 12076630763829095 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 144 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 89600 | 0x7f18f4030300 | 0x7f17e84362c0 | 131072 | 230656 | 29615904 | 12076630763911097 | 12076630764071869 | 12076630764206108 | 12076630764210123 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 146 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 92096 | 0x7f18f4030a00 | 0x7f17e8436300 | 131072 | 183604 | 23426328 | 12076630764258634 | 12076630764426907 | 12076630764697786 | 12076630764722096 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 148 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 93568 | 0x7f18f4030900 | 0x7f17e8436340 | 65536 | 144156 | 18434176 | 12076630764763383 | 12076630764925306 | 12076630765180345 | 12076630765204984 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 150 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 95040 | 0x7f18f4030800 | 0x7f17e8436380 | 131072 | 218512 | 27909952 | 12076630765247433 | 12076630765408344 | 12076630765542263 | 12076630765545828 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 152 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 96768 | 0x7f18f4030700 | 0x7f17e84363c0 | 131072 | 230722 | 29479352 | 12076630765596031 | 12076630765765623 | 12076630765923542 | 12076630765927498 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 154 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 98240 | 0x7f18f4030600 | 0x7f17e8436400 | 131072 | 223186 | 28522608 | 12076630765987219 | 12076630766158581 | 12076630766292341 | 12076630766296665 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 156 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 100736 | 0x7f18f4030500 | 0x7f17e8436440 | 131072 | 182648 | 23339480 | 12076630766345836 | 12076630766516660 | 12076630766781619 | 12076630766829576 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 158 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 102208 | 0x7f18f4030400 | 0x7f17e8436480 | 65536 | 186902 | 23869552 | 12076630766854182 | 12076630767035538 | 12076630767288177 | 12076630767338382 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 160 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 103680 | 0x7f18f4030300 | 0x7f17e84364c0 | 131072 | 228500 | 29147816 | 12076630767365653 | 12076630767540816 | 12076630767675696 | 12076630767679337 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 162 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 105664 | 0x7f18f4030a00 | 0x7f17e8436500 | 131072 | 218106 | 27972760 | 12076630767728779 | 12076630767895695 | 12076630768061934 | 12076630768065795 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 164 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 107136 | 0x7f18f4030900 | 0x7f17e8436540 | 131072 | 225908 | 28729320 | 12076630768128412 | 12076630768290893 | 12076630768421293 | 12076630768425354 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 166 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 109888 | 0x7f18f4030800 | 0x7f17e8436580 | 131072 | 180044 | 23043184 | 12076630768473734 | 12076630768640652 | 12076630768907051 | 12076630768931195 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 168 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 111360 | 0x7f18f4030700 | 0x7f17e84365c0 | 65536 | 151132 | 19419864 | 12076630768976980 | 12076630769161450 | 12076630769421129 | 12076630769468905 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 170 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 112832 | 0x7f18f4030600 | 0x7f17e8436600 | 131072 | 265290 | 33842312 | 12076630769492760 | 12076630769670568 | 12076630769807848 | 12076630769811863 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 172 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 114816 | 0x7f18f4030500 | 0x7f17e8436640 | 131072 | 223124 | 28752200 | 12076630769861646 | 12076630770031207 | 12076630770204486 | 12076630770208471 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 174 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 116288 | 0x7f18f4030400 | 0x7f17e8436680 | 131072 | 225756 | 29003960 | 12076630770269695 | 12076630770430726 | 12076630770562085 | 12076630770566086 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 176 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 119040 | 0x7f18f4030300 | 0x7f17e84366c0 | 131072 | 178990 | 22852184 | 12076630770615679 | 12076630770777604 | 12076630771042723 | 12076630771091424 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 178 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 120768 | 0x7f18f4030a00 | 0x7f17e8436700 | 65536 | 144814 | 18524880 | 12076630771118253 | 12076630771294723 | 12076630771554082 | 12076630771600681 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 180 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 122496 | 0x7f18f4030900 | 0x7f17e8436740 | 131072 | 227744 | 29192792 | 12076630771625737 | 12076630771805761 | 12076630771941440 | 12076630771945592 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 182 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 124736 | 0x7f18f4030800 | 0x7f17e8436780 | 131072 | 227082 | 28994272 | 12076630771994333 | 12076630772168479 | 12076630772350719 | 12076630772354974 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 184 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 126464 | 0x7f18f4030700 | 0x7f17e84367c0 | 131072 | 226390 | 29055120 | 12076630772416588 | 12076630772579518 | 12076630772720317 | 12076630772723990 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 186 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 127936 | 0x7f18f4030600 | 0x7f17e8436800 | 131072 | 223916 | 28593808 | 12076630772770507 | 12076630772936157 | 12076630773203356 | 12076630773250399 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 188 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 129664 | 0x7f18f4030500 | 0x7f17e8436840 | 65536 | 151472 | 19400720 | 12076630773273172 | 12076630773451355 | 12076630773710074 | 12076630773756300 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 190 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 131392 | 0x7f18f4030400 | 0x7f17e8436880 | 131072 | 257456 | 32738176 | 12076630773781838 | 12076630773955353 | 12076630774097592 | 12076630774101833 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 192 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 133632 | 0x7f18f4030300 | 0x7f17e84368c0 | 131072 | 235504 | 29915176 | 12076630774150303 | 12076630774322232 | 12076630774513271 | 12076630774561378 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 194 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 135360 | 0x7f18f4030a00 | 0x7f17e8436900 | 131072 | 256744 | 32770632 | 12076630774598196 | 12076630774758870 | 12076630774899349 | 12076630774903304 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 196 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 136832 | 0x7f18f4030900 | 0x7f17e8436940 | 131072 | 221814 | 28524864 | 12076630774952726 | 12076630775123669 | 12076630775406548 | 12076630775455772 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 198 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 138560 | 0x7f18f4030800 | 0x7f17e8436980 | 65536 | 153198 | 19621168 | 12076630775479025 | 12076630775659987 | 12076630775917906 | 12076630775964748 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 200 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 140288 | 0x7f18f4030700 | 0x7f17e84369c0 | 131072 | 246534 | 31503272 | 12076630775991037 | 12076630776179345 | 12076630776313584 | 12076630776317915 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 202 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 142784 | 0x7f18f4030600 | 0x7f17e8436a00 | 131072 | 219418 | 28232720 | 12076630776366896 | 12076630776538224 | 12076630776749583 | 12076630776771990 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 204 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 144768 | 0x7f18f4030500 | 0x7f17e8436a40 | 131072 | 220666 | 28206928 | 12076630776825820 | 12076630776987982 | 12076630777126861 | 12076630777130848 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 206 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 145728 | 0x7f18f4030400 | 0x7f17e8436a80 | 131072 | 220914 | 28364160 | 12076630777180931 | 12076630777346221 | 12076630777653419 | 12076630777700587 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 208 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 147712 | 0x7f18f4030300 | 0x7f17e8436ac0 | 65536 | 144544 | 18398472 | 12076630777724111 | 12076630777900779 | 12076630778160938 | 12076630778209855 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 210 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 149696 | 0x7f18f4030a00 | 0x7f17e8436b00 | 131072 | 215842 | 27686136 | 12076630778236775 | 12076630778412617 | 12076630778548296 | 12076630778552051 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 212 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 152192 | 0x7f18f4030900 | 0x7f17e8436b40 | 131072 | 225646 | 29102320 | 12076630778600181 | 12076630778766375 | 12076630778994215 | 12076630779043365 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 214 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 154176 | 0x7f18f4030800 | 0x7f17e8436b80 | 131072 | 228722 | 29085824 | 12076630779077990 | 12076630779247174 | 12076630779383173 | 12076630779387625 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 216 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 155648 | 0x7f18f4030700 | 0x7f17e8436bc0 | 131072 | 225666 | 28944104 | 12076630779437468 | 12076630779610212 | 12076630779939331 | 12076630779987521 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 218 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 157632 | 0x7f18f4030600 | 0x7f17e8436c00 | 65536 | 143190 | 18288432 | 12076630780015714 | 12076630780195010 | 12076630780457889 | 12076630780506937 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 220 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 159616 | 0x7f18f4030500 | 0x7f17e8436c40 | 131072 | 228308 | 29263736 | 12076630780533056 | 12076630780712928 | 12076630780848608 | 12076630780852781 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 222 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 162368 | 0x7f18f4030400 | 0x7f17e8436c80 | 131072 | 229866 | 29433672 | 12076630780901071 | 12076630781073567 | 12076630781318366 | 12076630781368059 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 224 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 164608 | 0x7f18f4030300 | 0x7f17e8436cc0 | 131072 | 223206 | 28804256 | 12076630781410769 | 12076630781575563 | 12076630781712523 | 12076630781719633 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 226 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 166336 | 0x7f18f4030a00 | 0x7f17e8436d00 | 131072 | 228840 | 29255776 | 12076630781762894 | 12076630781931561 | 12076630782308040 | 12076630782355576 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 228 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 168576 | 0x7f18f4030900 | 0x7f17e8436d40 | 65536 | 149238 | 18983736 | 12076630782381955 | 12076630782559879 | 12076630782825799 | 12076630782872948 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 230 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 170816 | 0x7f18f4030800 | 0x7f17e8436d80 | 131072 | 230536 | 29506024 | 12076630782898456 | 12076630783077478 | 12076630783220037 | 12076630783223300 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 232 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 174080 | 0x7f18f4030700 | 0x7f17e8436dc0 | 131072 | 229452 | 29219960 | 12076630783272983 | 12076630783446917 | 12076630783756196 | 12076630783801987 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 234 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 176576 | 0x7f18f4030600 | 0x7f17e8436e00 | 131072 | 230522 | 29545328 | 12076630783837322 | 12076630784001795 | 12076630784141955 | 12076630784145506 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 236 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 177792 | 0x7f18f4030500 | 0x7f17e8436e40 | 131072 | 209118 | 26916032 | 12076630784193916 | 12076630784367074 | 12076630784792513 | 12076630784840148 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 238 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 180288 | 0x7f18f4030400 | 0x7f17e8436e80 | 65536 | 154162 | 19781176 | 12076630784863591 | 12076630785052512 | 12076630785316192 | 12076630785364583 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 240 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 182784 | 0x7f18f4030300 | 0x7f17e8436ec0 | 131072 | 225288 | 28626392 | 12076630785392425 | 12076630785568191 | 12076630785707071 | 12076630785710817 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 242 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 186304 | 0x7f18f4030a00 | 0x7f17e8436f00 | 131072 | 225312 | 28824128 | 12076630785759147 | 12076630785925150 | 12076630786240509 | 12076630786288993 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 244 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 189312 | 0x7f18f4030900 | 0x7f17e8436f40 | 131072 | 227616 | 28908840 | 12076630786330530 | 12076630786491709 | 12076630786644188 | 12076630786647249 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 246 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 190784 | 0x7f18f4030800 | 0x7f17e8436f80 | 131072 | 225682 | 28777744 | 12076630786695389 | 12076630786863228 | 12076630787380186 | 12076630787429053 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 248 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 193792 | 0x7f18f4030700 | 0x7f17e8436fc0 | 65536 | 152368 | 19589216 | 12076630787462896 | 12076630787632665 | 12076630787931705 | 12076630787978586 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 250 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 196800 | 0x7f18f4030600 | 0x7f17e8437000 | 131072 | 223520 | 28545808 | 12076630788015083 | 12076630788183704 | 12076630788338744 | 12076630788342282 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 252 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 201088 | 0x7f18f4030500 | 0x7f17e8437040 | 131072 | 225832 | 29001952 | 12076630788397264 | 12076630788558423 | 12076630788944342 | 12076630788965792 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 254 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 204608 | 0x7f18f4030400 | 0x7f17e8437080 | 131072 | 224964 | 28784144 | 12076630789036884 | 12076630789204501 | 12076630789380341 | 12076630789383810 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 256 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 206080 | 0x7f18f4030300 | 0x7f17e84370c0 | 131072 | 228980 | 29111080 | 12076630789433773 | 12076630789606100 | 12076630790217298 | 12076630790265530 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 258 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 209600 | 0x7f18f4030a00 | 0x7f17e8437100 | 65536 | 145750 | 18715544 | 12076630790299653 | 12076630790473458 | 12076630790800497 | 12076630790847332 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 260 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 213120 | 0x7f18f4030900 | 0x7f17e8437140 | 131072 | 244068 | 31342136 | 12076630790884271 | 12076630791056656 | 12076630791234896 | 12076630791238570 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 262 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 218176 | 0x7f18f4030800 | 0x7f17e8437180 | 131072 | 246312 | 31211640 | 12076630791291749 | 12076630791455535 | 12076630791912014 | 12076630791958108 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 264 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 222208 | 0x7f18f4030700 | 0x7f17e84371c0 | 131072 | 228350 | 29181552 | 12076630791998343 | 12076630792167213 | 12076630792367053 | 12076630792414186 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 266 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 223936 | 0x7f18f4030600 | 0x7f17e8437200 | 131072 | 221566 | 28882232 | 12076630792444613 | 12076630792615212 | 12076630793319530 | 12076630793367139 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 268 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 227968 | 0x7f18f4030500 | 0x7f17e8437240 | 65536 | 147556 | 18861440 | 12076630793390973 | 12076630793577609 | 12076630793977288 | 12076630794025494 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 270 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 232000 | 0x7f18f4030400 | 0x7f17e8437280 | 131072 | 226096 | 28999416 | 12076630794057984 | 12076630794237608 | 12076630794440007 | 12076630794487543 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 272 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 237824 | 0x7f18f4030300 | 0x7f17e84372c0 | 131072 | 243370 | 30875000 | 12076630794513702 | 12076630794688486 | 12076630795215365 | 12076630795261944 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 274 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 242368 | 0x7f18f4030a00 | 0x7f17e8437300 | 131072 | 232722 | 29537392 | 12076630795298512 | 12076630795460804 | 12076630795684804 | 12076630795732198 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 276 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 243584 | 0x7f18f4030900 | 0x7f17e8437340 | 131072 | 226182 | 29068344 | 12076630795757796 | 12076630795931043 | 12076630796730401 | 12076630796781650 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 278 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 248128 | 0x7f18f4030800 | 0x7f17e8437380 | 65536 | 152344 | 19488520 | 12076630796807899 | 12076630796985920 | 12076630797407199 | 12076630797455855 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 280 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 252672 | 0x7f18f4030700 | 0x7f17e84373c0 | 131072 | 228182 | 29192104 | 12076630797479599 | 12076630797659678 | 12076630797888158 | 12076630797935176 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 282 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 259264 | 0x7f18f4030600 | 0x7f17e8437400 | 131072 | 225926 | 28971024 | 12076630797961756 | 12076630798140477 | 12076630798737755 | 12076630798785869 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 284 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 264832 | 0x7f18f4030500 | 0x7f17e8437440 | 131072 | 224962 | 28784784 | 12076630798826785 | 12076630798988955 | 12076630799258554 | 12076630799308010 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 286 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 266304 | 0x7f18f4030400 | 0x7f17e8437480 | 131072 | 230724 | 29303736 | 12076630799331574 | 12076630799516793 | 12076630800502071 | 12076630800568915 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 288 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 28 | 24 | 271872 | 0x7f18f4030300 | 0x7f17e84374c0 | 65536 | 147582 | 18854272 | 12076630800600514 | 12076630800779030 | 12076630801311988 | 12076630801378822 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 290 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 277440 | 0x7f18f4030a00 | 0x7f17e8437500 | 131072 | 226488 | 29189608 | 12076630801406563 | 12076630801587508 | 12076630801858547 | 12076630801924547 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 292 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 12 | 24 | 279936 | 0x7f18f4030900 | 0x7f17e8437540 | 131072 | 218074 | 27634208 | 12076630801950315 | 12076630802135506 | 12076630802874544 | 12076630802942130 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 294 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 286528 | 0x7f18f4030800 | 0x7f17e8437580 | 131072 | 219106 | 28138184 | 12076630802981232 | 12076630803157743 | 12076630803474063 | 12076630803541054 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 296 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 288000 | 0x7f18f4030700 | 0x7f17e84375c0 | 131072 | 224538 | 28854304 | 12076630803564638 | 12076630803745902 | 12076630804917579 | 12076630804987584 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 298 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 32 | 24 | 294592 | 0x7f18f4030600 | 0x7f17e8437600 | 65536 | 147524 | 18774424 | 12076630805023241 | 12076630805205738 | 12076630805815336 | 12076630805883811 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 300 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 301184 | 0x7f18f4030500 | 0x7f17e8437640 | 131072 | 226012 | 28842272 | 12076630805911944 | 12076630806097255 | 12076630806416295 | 12076630806484218 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 302 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 12 | 24 | 304960 | 0x7f18f4030400 | 0x7f17e8437680 | 131072 | 225610 | 29069248 | 12076630806512471 | 12076630806686534 | 12076630807565251 | 12076630807631983 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 304 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 24 | 24 | 313600 | 0x7f18f4030300 | 0x7f17e84376c0 | 131072 | 254558 | 32850600 | 12076630807668531 | 12076630807834691 | 12076630808246850 | 12076630808315845 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 306 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 314816 | 0x7f18f4030a00 | 0x7f17e8437700 | 131072 | 226646 | 29183472 | 12076630808347384 | 12076630808528769 | 12076630810076445 | 12076630810144407 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 308 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 317568 | 0x7f18f4030900 | 0x7f17e8437740 | 65536 | 146264 | 18739032 | 12076630810174753 | 12076630810354844 | 12076630811149882 | 12076630811216802 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 310 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 12 | 24 | 320320 | 0x7f18f4030800 | 0x7f17e8437780 | 131072 | 262206 | 33522600 | 12076630811243782 | 12076630811427481 | 12076630811842520 | 12076630811908639 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 312 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 12 | 24 | 324096 | 0x7f18f4030700 | 0x7f17e84377c0 | 131072 | 225932 | 28775136 | 12076630811933695 | 12076630812121879 | 12076630813280116 | 12076630813348357 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 314 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 12 | 24 | 328896 | 0x7f18f4030600 | 0x7f17e8437800 | 131072 | 212086 | 27305448 | 12076630813389683 | 12076630813549235 | 12076630814334513 | 12076630814401756 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 316 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 330112 | 0x7f18f4030500 | 0x7f17e8437840 | 131072 | 278198 | 35698600 | 12076630814433465 | 12076630814610672 | 12076630817661224 | 12076630817728875 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 318 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 332864 | 0x7f18f4030400 | 0x7f17e8437880 | 65536 | 147728 | 18993832 | 12076630817759983 | 12076630817929703 | 12076630819470179 | 12076630819538611 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 320 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 12 | 24 | 335616 | 0x7f18f4030300 | 0x7f17e84378c0 | 131072 | 230624 | 29452312 | 12076630819562395 | 12076630819751778 | 12076630820541376 | 12076630820609142 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 322 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 12 | 24 | 339392 | 0x7f18f4030a00 | 0x7f17e8437900 | 131072 | 225176 | 29231608 | 12076630820639719 | 12076630820825856 | 12076630823106489 | 12076630823175005 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 324 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 12 | 24 | 344192 | 0x7f18f4030900 | 0x7f17e8437940 | 131072 | 226042 | 28801544 | 12076630823218656 | 12076630823383449 | 12076630824918164 | 12076630824984611 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 326 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 345408 | 0x7f18f4030800 | 0x7f17e8437980 | 131072 | 229440 | 29399096 | 12076630825019356 | 12076630825203444 | 12076630831257027 | 12076630831327209 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 328 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 20 | 24 | 348160 | 0x7f18f4030700 | 0x7f17e84379c0 | 65536 | 153238 | 19696104 | 12076630831358758 | 12076630831539747 | 12076630834579258 | 12076630834649489 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 330 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 12 | 24 | 350912 | 0x7f18f4030600 | 0x7f17e8437a00 | 131072 | 223628 | 28401128 | 12076630834684204 | 12076630834850618 | 12076630836389973 | 12076630836458544 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 332 | 936496 | 936501 | 4194304 | 256 | 0 | 0 | 12 | 24 | 0 | 0x7f18f4030500 | 0x7f17e8437a40 | 131072 | 225772 | 28788384 | 12076630836488380 | 12076630836670613 | 12076630841197640 | 12076630841270295 |