66 KiB
66 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | SQ_INSTS_VALU_ADD_F16 | SQ_INSTS_VALU_MUL_F16 | SQ_INSTS_VALU_FMA_F16 | SQ_INSTS_VALU_TRANS_F16 | SQ_INSTS_VALU_ADD_F32 | SQ_INSTS_VALU_MUL_F32 | SQ_INSTS_VALU_FMA_F32 | SQ_INSTS_VALU_TRANS_F32 | TCP_TCC_READ_REQ_sum | TCP_TOTAL_CACHE_ACCESSES_sum | TCP_TCC_WRITE_REQ_sum | TCP_TCC_ATOMIC_WITH_RET_REQ_sum | TCC_EA_RDREQ_32B_sum | TCC_EA_RDREQ_sum | TCC_EA_WRREQ_64B_sum | TCC_EA_WRREQ_sum | SQ_INSTS_VALU_ADD_F64 | SQ_INSTS_VALU_MUL_F64 | SQ_INSTS_VALU_FMA_F64 | SQ_INSTS_VALU_TRANS_F64 | SQ_INSTS_VALU_MFMA_MOPS_F16 | SQ_INSTS_VALU_MFMA_MOPS_BF16 | SQ_INSTS_VALU_MFMA_MOPS_F32 | SQ_INSTS_VALU_MFMA_MOPS_F64 | TCP_TCC_ATOMIC_WITHOUT_RET_REQ_sum | SQ_LDS_IDX_ACTIVE | SQ_LDS_BANK_CONFLICT | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 234779 | 234779 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7f6f5c804280 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 8388608.0000000000 | 4194304.0000000000 | 0.0000000000 | 0.0000000000 | 312.0000000000 | 4128768.0000000000 | 4128768.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801452679825 | 17772096258178 | 17801596602238 | 17801596717129 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 234779 | 234779 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7f6f5c823f80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 8192.0000000000 | 16384.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 8260.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801602429427 | 17801596602238 | 17801602809336 | 17801602817287 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7f6f5f8a6380 | 0x7f6f5c823fc0 | 0 | 0 | 0 | 0 | 0 | 0 | 262144 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097340.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801603409582 | 17801602809336 | 17801604038308 | 17801604038227 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7f6f5f8a6200 | 0x7f6f5c824000 | 0 | 0 | 0 | 0 | 0 | 0 | 262144 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194583.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801604637972 | 17801604038308 | 17801605371280 | 17801605371604 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7f6f5f8a6080 | 0x7f6f5c824040 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194600.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 262144 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801605965429 | 17801605371280 | 17801606616252 | 17801606616223 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7f6f5d207f00 | 0x7f6f5c824080 | 0 | 0 | 262144 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097339.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801607209018 | 17801606616252 | 17801607772903 | 17801607772554 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7f6f5d207d80 | 0x7f6f5c8240c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097342.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801608365219 | 17801607772903 | 17801608975474 | 17801608975064 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7f6f5d207c00 | 0x7f6f5c824100 | 0 | 0 | 0 | 0 | 0 | 0 | 655360 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097327.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801609580779 | 17801608975474 | 17801610169886 | 17801610170054 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7f6f5d207a80 | 0x7f6f5c824140 | 0 | 0 | 0 | 0 | 0 | 0 | 786432 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194600.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801610765239 | 17801610169886 | 17801611454058 | 17801611453852 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7f6f5d207900 | 0x7f6f5c824180 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194592.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 786432 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801612046987 | 17801611454058 | 17801612723190 | 17801612723110 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7f6f5d207780 | 0x7f6f5c8241c0 | 0 | 0 | 786432 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097344.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801613316626 | 17801612723190 | 17801613910561 | 17801613909621 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7f6f5d207600 | 0x7f6f5c824200 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097340.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801614505156 | 17801613910561 | 17801615116493 | 17801615115551 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7f6f5f8a6480 | 0x7f6f5c824240 | 0 | 0 | 0 | 0 | 0 | 0 | 1048576 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097343.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801615719146 | 17801615116493 | 17801616317944 | 17801616317171 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7f6f5f8a6300 | 0x7f6f5c824280 | 0 | 0 | 0 | 0 | 0 | 0 | 1310720 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194602.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801616911956 | 17801616317944 | 17801617623716 | 17801617622789 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7f6f5f8a6180 | 0x7f6f5c8242c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194590.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 1310720 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801618219184 | 17801617623716 | 17801618905008 | 17801618904237 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7f6f5f8a6000 | 0x7f6f5c824300 | 0 | 0 | 1310720 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097345.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801619499802 | 17801618905008 | 17801620085340 | 17801620084317 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7f6f5d207e80 | 0x7f6f5c824340 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097347.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801620677602 | 17801620085340 | 17801621266631 | 17801621265468 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7f6f5d207d00 | 0x7f6f5c824380 | 0 | 0 | 0 | 0 | 0 | 0 | 1441792 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097339.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801621865573 | 17801621266631 | 17801622587443 | 17801622586475 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7f6f5d207b80 | 0x7f6f5c8243c0 | 0 | 0 | 0 | 0 | 0 | 0 | 1835008 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194584.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801623180990 | 17801622587443 | 17801623834335 | 17801623833134 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7f6f5d207a00 | 0x7f6f5c824400 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194596.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 1835008 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801624426409 | 17801623834335 | 17801625107147 | 17801625106002 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7f6f5d207880 | 0x7f6f5c824440 | 0 | 0 | 1835008 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097344.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801625699517 | 17801625107147 | 17801626297398 | 17801626296613 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7f6f5d207700 | 0x7f6f5c824480 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097352.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801626890718 | 17801626297398 | 17801627484770 | 17801627484063 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7f6f5f8a6580 | 0x7f6f5c8244c0 | 0 | 0 | 0 | 0 | 0 | 0 | 1835008 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097339.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801628085588 | 17801627484770 | 17801628670221 | 17801628669294 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7f6f5f8a6400 | 0x7f6f5c824500 | 0 | 0 | 0 | 0 | 0 | 0 | 2359296 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194601.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801629263689 | 17801628670221 | 17801629936793 | 17801629935792 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7f6f5f8a6280 | 0x7f6f5c824540 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194580.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 2359296 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801630530327 | 17801629936793 | 17801631201925 | 17801631200790 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7f6f5f8a6100 | 0x7f6f5c824580 | 0 | 0 | 2359296 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097346.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801631795786 | 17801631201925 | 17801632520497 | 17801632519368 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7f6f5d207f80 | 0x7f6f5c8245c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097346.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801633113213 | 17801632520497 | 17801633690428 | 17801633689308 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7f6f5d207e00 | 0x7f6f5c824600 | 0 | 0 | 0 | 0 | 0 | 0 | 2228224 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097343.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801634291413 | 17801633690428 | 17801634858599 | 17801634857659 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7f6f5d207c80 | 0x7f6f5c824640 | 0 | 0 | 0 | 0 | 0 | 0 | 2883584 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194582.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801635451974 | 17801634858599 | 17801636131571 | 17801636130558 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7f6f5d207b00 | 0x7f6f5c824680 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194599.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 2883584 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801636724343 | 17801636131571 | 17801637412544 | 17801637411416 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7f6f5d207980 | 0x7f6f5c8246c0 | 0 | 0 | 2883584 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097347.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801638005601 | 17801637412544 | 17801638581515 | 17801638580437 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7f6f5d207800 | 0x7f6f5c824700 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097351.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801639175682 | 17801638581515 | 17801639882487 | 17801639881244 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7f6f5d207680 | 0x7f6f5c824740 | 0 | 0 | 0 | 0 | 0 | 0 | 2621440 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097344.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801640483939 | 17801639882487 | 17801641047458 | 17801641046495 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7f6f5f8a6500 | 0x7f6f5c824780 | 0 | 0 | 0 | 0 | 0 | 0 | 3407872 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194583.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801641639681 | 17801641047458 | 17801642314030 | 17801642312924 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7f6f5f8a6380 | 0x7f6f5c8247c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194597.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 3407872 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801642907809 | 17801642314030 | 17801643582362 | 17801643581372 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7f6f5f8a6200 | 0x7f6f5c824800 | 0 | 0 | 3407872 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097356.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801644175697 | 17801643582362 | 17801644769093 | 17801644767963 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7f6f5f8a6080 | 0x7f6f5c824840 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097352.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801645363348 | 17801644769093 | 17801645950224 | 17801645949253 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7f6f5d207f00 | 0x7f6f5c824880 | 0 | 0 | 0 | 0 | 0 | 0 | 3014656 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097351.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801646551588 | 17801645950224 | 17801647139356 | 17801647138133 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7f6f5d207d80 | 0x7f6f5c8248c0 | 0 | 0 | 0 | 0 | 0 | 0 | 3932160 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194587.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801647732139 | 17801647139356 | 17801648422088 | 17801648420922 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7f6f5d207c00 | 0x7f6f5c824900 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194573.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 3932160 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801649014797 | 17801648422088 | 17801649685460 | 17801649684480 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7f6f5d207a80 | 0x7f6f5c824940 | 0 | 0 | 3932160 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097350.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801650279055 | 17801649685460 | 17801650867071 | 17801650865861 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7f6f5d207900 | 0x7f6f5c824980 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097350.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801651460206 | 17801650867071 | 17801652058602 | 17801652057551 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7f6f5d207780 | 0x7f6f5c8249c0 | 0 | 0 | 0 | 0 | 0 | 0 | 3407872 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097351.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801652659256 | 17801652058602 | 17801653245493 | 17801653244562 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7f6f5d207600 | 0x7f6f5c824a00 | 0 | 0 | 0 | 0 | 0 | 0 | 4456448 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194577.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801653838887 | 17801653245493 | 17801654510465 | 17801654509250 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7f6f5f8a6480 | 0x7f6f5c824a40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194588.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 4456448 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801655103845 | 17801654510465 | 17801655787597 | 17801655786418 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7f6f5f8a6300 | 0x7f6f5c824a80 | 0 | 0 | 4456448 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097354.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801656380563 | 17801655787597 | 17801656979769 | 17801656978368 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7f6f5f8a6180 | 0x7f6f5c824ac0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097357.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801657573604 | 17801656979769 | 17801658218020 | 17801658216837 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7f6f5f8a6000 | 0x7f6f5c824b00 | 0 | 0 | 0 | 0 | 0 | 0 | 3801088 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097349.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801658819383 | 17801658215033 | 17801659419037 | 17801659425707 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7f6f5d207e80 | 0x7f6f5c824b40 | 0 | 0 | 0 | 0 | 0 | 0 | 4980736 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194576.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801660016013 | 17801659419037 | 17801660672161 | 17801660674056 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7f6f5d207d00 | 0x7f6f5c824b80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194589.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 4980736 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801661267632 | 17801660672161 | 17801661942726 | 17801661944195 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7f6f5d207b80 | 0x7f6f5c824bc0 | 0 | 0 | 4980736 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097353.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801662539000 | 17801661942726 | 17801663144010 | 17801663145715 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7f6f5d207a00 | 0x7f6f5c824c00 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097358.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801663739020 | 17801663144010 | 17801664316174 | 17801664318236 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7f6f5d207880 | 0x7f6f5c824c40 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097353.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801664919331 | 17801664316174 | 17801665524658 | 17801665526346 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7f6f5d207700 | 0x7f6f5c824c80 | 0 | 0 | 0 | 0 | 0 | 0 | 5505024 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194558.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801666121331 | 17801665524658 | 17801666808983 | 17801666810684 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7f6f5f8a6580 | 0x7f6f5c824cc0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194557.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 5505024 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801667404569 | 17801666808983 | 17801668080028 | 17801668081812 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7f6f5f8a6400 | 0x7f6f5c824d00 | 0 | 0 | 5505024 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097356.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801668675637 | 17801668080028 | 17801669256832 | 17801669258633 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7f6f5f8a6280 | 0x7f6f5c824d40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097357.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801669852938 | 17801669256832 | 17801670452836 | 17801670454603 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7f6f5f8a6100 | 0x7f6f5c824d80 | 0 | 0 | 0 | 0 | 0 | 0 | 4587520 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097356.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801671057358 | 17801670452836 | 17801671640200 | 17801671641733 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7f6f5d207f80 | 0x7f6f5c824dc0 | 0 | 0 | 0 | 0 | 0 | 0 | 6029312 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194579.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801672236869 | 17801671640200 | 17801672906125 | 17801672907812 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7f6f5d207e00 | 0x7f6f5c824e00 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194559.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 6029312 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801673501467 | 17801672906125 | 17801674183729 | 17801674185850 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7f6f5d207c80 | 0x7f6f5c824e40 | 0 | 0 | 6029312 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097358.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801674781035 | 17801674183729 | 17801675351574 | 17801675353261 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7f6f5d207b00 | 0x7f6f5c824e80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097357.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801675948066 | 17801675351574 | 17801676541498 | 17801676543182 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7f6f5d207980 | 0x7f6f5c824ec0 | 0 | 0 | 0 | 0 | 0 | 0 | 4980736 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097348.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801677155396 | 17801676541498 | 17801677747102 | 17801677748902 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7f6f5d207800 | 0x7f6f5c824f00 | 0 | 0 | 0 | 0 | 0 | 0 | 6553600 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194549.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801678344887 | 17801677747102 | 17801679019107 | 17801679020940 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7f6f5d207680 | 0x7f6f5c824f40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194556.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 6553600 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801679614885 | 17801679019107 | 17801680258151 | 17801680259819 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7f6f5f8a6500 | 0x7f6f5c824f80 | 0 | 0 | 6553600 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097357.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801680853234 | 17801680258151 | 17801681431755 | 17801681433599 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7f6f5f8a6380 | 0x7f6f5c824fc0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097354.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801682027915 | 17801681431755 | 17801682636240 | 17801682638119 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7f6f5f8a6200 | 0x7f6f5c825000 | 0 | 0 | 0 | 0 | 0 | 0 | 5373952 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097352.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801683241134 | 17801682636240 | 17801683814324 | 17801683816060 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7f6f5f8a6080 | 0x7f6f5c825040 | 0 | 0 | 0 | 0 | 0 | 0 | 7077888 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194553.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801684410945 | 17801683814324 | 17801685078489 | 17801685080299 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7f6f5d207f00 | 0x7f6f5c825080 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194567.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 7077888 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801685674624 | 17801685078489 | 17801686356413 | 17801686358507 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7f6f5d207d80 | 0x7f6f5c8250c0 | 0 | 0 | 7077888 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097360.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801686951392 | 17801686356413 | 17801687537537 | 17801687539418 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7f6f5d207c00 | 0x7f6f5c825100 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097354.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801688134193 | 17801687537537 | 17801688746342 | 17801688748088 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7f6f5d207a80 | 0x7f6f5c825140 | 0 | 0 | 0 | 0 | 0 | 0 | 5767168 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097358.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801689350773 | 17801688746342 | 17801689939946 | 17801689941808 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7f6f5d207900 | 0x7f6f5c825180 | 0 | 0 | 0 | 0 | 0 | 0 | 7602176 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194572.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801690536603 | 17801689939946 | 17801691210511 | 17801691212406 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7f6f5d207780 | 0x7f6f5c8251c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194569.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 7602176 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801691807241 | 17801691210511 | 17801692476435 | 17801692478085 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7f6f5d207600 | 0x7f6f5c825200 | 0 | 0 | 7602176 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097363.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801693071980 | 17801692476435 | 17801693653719 | 17801693655595 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7f6f5f8a6480 | 0x7f6f5c825240 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097351.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801694250370 | 17801693653719 | 17801694885404 | 17801694887344 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7f6f5f8a6300 | 0x7f6f5c825280 | 0 | 0 | 0 | 0 | 0 | 0 | 6160384 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097357.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801695490759 | 17801694885404 | 17801696071968 | 17801696073525 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7f6f5f8a6180 | 0x7f6f5c8252c0 | 0 | 0 | 0 | 0 | 0 | 0 | 8126464 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194568.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801696668370 | 17801696071968 | 17801697352133 | 17801697353833 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7f6f5f8a6000 | 0x7f6f5c825300 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194561.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 8126464 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801697948348 | 17801697352133 | 17801698603337 | 17801698605082 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7f6f5d207e80 | 0x7f6f5c825340 | 0 | 0 | 8126464 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097362.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801699198997 | 17801698603337 | 17801699772301 | 17801699774283 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7f6f5d207d00 | 0x7f6f5c825380 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097341.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801700368118 | 17801699772301 | 17801700967026 | 17801700968923 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7f6f5d207b80 | 0x7f6f5c8253c0 | 0 | 0 | 0 | 0 | 0 | 0 | 6553600 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097358.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801701570588 | 17801700967026 | 17801702177110 | 17801702179313 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7f6f5d207a00 | 0x7f6f5c825400 | 0 | 0 | 0 | 0 | 0 | 0 | 8650752 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194566.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801702774998 | 17801702177110 | 17801703437754 | 17801703439712 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7f6f5d207880 | 0x7f6f5c825440 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194562.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 8650752 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801704033937 | 17801703437754 | 17801704706879 | 17801704708720 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7f6f5d207700 | 0x7f6f5c825480 | 0 | 0 | 8650752 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097361.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801705302445 | 17801704706879 | 17801705865603 | 17801705867401 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7f6f5f8a6580 | 0x7f6f5c8254c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097342.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801706462956 | 17801705865603 | 17801707080807 | 17801707082601 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7f6f5f8a6400 | 0x7f6f5c825500 | 0 | 0 | 0 | 0 | 0 | 0 | 6946816 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097360.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801707685216 | 17801707080807 | 17801708246572 | 17801708248322 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7f6f5f8a6280 | 0x7f6f5c825540 | 0 | 0 | 0 | 0 | 0 | 0 | 9175040 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194554.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801708842957 | 17801708246572 | 17801709530096 | 17801709531850 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7f6f5f8a6100 | 0x7f6f5c825580 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194582.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 9175040 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801710127235 | 17801709530096 | 17801710778901 | 17801710780999 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7f6f5d207f80 | 0x7f6f5c8255c0 | 0 | 0 | 9175040 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097366.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801711374914 | 17801710778901 | 17801711928185 | 17801711929900 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7f6f5d207e00 | 0x7f6f5c825600 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097336.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801712523896 | 17801711928185 | 17801713133629 | 17801713135560 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7f6f5d207c80 | 0x7f6f5c825640 | 0 | 0 | 0 | 0 | 0 | 0 | 7340032 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097362.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801713737895 | 17801713133629 | 17801714338434 | 17801714340400 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7f6f5d207b00 | 0x7f6f5c825680 | 0 | 0 | 0 | 0 | 0 | 0 | 9699328 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194565.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801714934316 | 17801714338434 | 17801715644358 | 17801715646018 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7f6f5d207980 | 0x7f6f5c8256c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194596.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 9699328 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801716239933 | 17801715644358 | 17801716913163 | 17801716914736 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7f6f5d207800 | 0x7f6f5c825700 | 0 | 0 | 9699328 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097364.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801717508441 | 17801716913163 | 17801718074767 | 17801718085407 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7f6f5d207680 | 0x7f6f5c825740 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097320.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801718672112 | 17801718074767 | 17801719284851 | 17801719286637 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7f6f5f8a6500 | 0x7f6f5c825780 | 0 | 0 | 0 | 0 | 0 | 0 | 8126464 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097362.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801719887742 | 17801719284851 | 17801720446775 | 17801720448528 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7f6f5f8a6380 | 0x7f6f5c8257c0 | 0 | 0 | 0 | 0 | 0 | 0 | 10747904 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194597.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801721042653 | 17801720446775 | 17801721720380 | 17801721721996 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7f6f5f8a6200 | 0x7f6f5c825800 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194593.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 10747904 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801722317612 | 17801721719892 | 17801722998935 | 17801723001355 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7f6f5f8a6080 | 0x7f6f5c825840 | 0 | 0 | 10747904 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097363.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801723595440 | 17801722998935 | 17801724168858 | 17801724170866 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7f6f5d207f00 | 0x7f6f5c825880 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097323.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801724764701 | 17801724168858 | 17801725392701 | 17801725394955 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7f6f5d207d80 | 0x7f6f5c8258c0 | 0 | 0 | 0 | 0 | 0 | 0 | 8912896 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097361.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801725997530 | 17801725392701 | 17801726578304 | 17801726580476 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7f6f5d207c00 | 0x7f6f5c825900 | 0 | 0 | 0 | 0 | 0 | 0 | 11796480 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194605.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801727175251 | 17801726578304 | 17801727851108 | 17801727853294 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7f6f5d207a80 | 0x7f6f5c825940 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194581.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 11796480 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801728447749 | 17801727851108 | 17801729117671 | 17801729119812 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7f6f5d207900 | 0x7f6f5c825980 | 0 | 0 | 11796480 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097350.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801729713337 | 17801729117671 | 17801730317675 | 17801730320042 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7f6f5d207780 | 0x7f6f5c8259c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097331.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801730913827 | 17801730317675 | 17801731552398 | 17801731554671 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7f6f5d207600 | 0x7f6f5c825a00 | 0 | 0 | 0 | 0 | 0 | 0 | 9699328 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097362.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801732156707 | 17801731552398 | 17801732751441 | 17801732753492 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7f6f5f8a6480 | 0x7f6f5c825a40 | 0 | 0 | 0 | 0 | 0 | 0 | 12845056 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194606.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801733348317 | 17801732751441 | 17801734026805 | 17801734028760 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7f6f5f8a6300 | 0x7f6f5c825a80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194594.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 12845056 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801734624205 | 17801734026805 | 17801735294168 | 17801735296369 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7f6f5f8a6180 | 0x7f6f5c825ac0 | 0 | 0 | 12845056 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097345.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801735890264 | 17801735294168 | 17801736488891 | 17801736491059 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7f6f5f8a6000 | 0x7f6f5c825b00 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097337.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801737086374 | 17801736488891 | 17801737754815 | 17801737757347 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7f6f5d207e80 | 0x7f6f5c825b40 | 0 | 0 | 0 | 0 | 0 | 0 | 11272192 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097357.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801738360772 | 17801737754815 | 17801738938818 | 17801738940978 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7f6f5d207d00 | 0x7f6f5c825b80 | 0 | 0 | 0 | 0 | 0 | 0 | 14942208 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194637.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801739536043 | 17801738938818 | 17801740209382 | 17801740211526 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7f6f5d207b80 | 0x7f6f5c825bc0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194630.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 14942208 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801740805361 | 17801740209382 | 17801741476425 | 17801741478484 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7f6f5d207a00 | 0x7f6f5c825c00 | 0 | 0 | 14942208 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097341.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801742073200 | 17801741476425 | 17801742810669 | 17801742812831 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7f6f5d207880 | 0x7f6f5c825c40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097342.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801743407286 | 17801742810669 | 17801744219153 | 17801744285335 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7f6f5d207700 | 0x7f6f5c825c80 | 0 | 0 | 0 | 0 | 0 | 0 | 12845056 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097353.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801744823791 | 17801744219153 | 17801745416916 | 17801745419156 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7f6f5f8a6580 | 0x7f6f5c825cc0 | 0 | 0 | 0 | 0 | 0 | 0 | 17039360 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194640.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801746012272 | 17801745416916 | 17801746833880 | 17801746836041 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7f6f5f8a6400 | 0x7f6f5c825d00 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194641.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 17039360 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801747430746 | 17801746833880 | 17801748067163 | 17801748072080 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7f6f5f8a6280 | 0x7f6f5c825d40 | 0 | 0 | 17039360 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097325.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801748662996 | 17801748067163 | 17801749267166 | 17801749269461 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7f6f5f8a6100 | 0x7f6f5c825d80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097345.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801749863586 | 17801749267166 | 17801750599650 | 17801750665946 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7f6f5d207f80 | 0x7f6f5c825dc0 | 0 | 0 | 0 | 0 | 0 | 0 | 15990784 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097343.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801751204842 | 17801750599650 | 17801751832133 | 17801751834487 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7f6f5d207e00 | 0x7f6f5c825e00 | 0 | 0 | 0 | 0 | 0 | 0 | 21233664 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194630.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801752428982 | 17801751832133 | 17801753101737 | 17801753166933 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7f6f5d207c80 | 0x7f6f5c825e40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194628.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 21233664 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801753698070 | 17801753101737 | 17801754395980 | 17801754461441 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7f6f5d207b00 | 0x7f6f5c825e80 | 0 | 0 | 21233664 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097327.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801754992628 | 17801754395980 | 17801755659504 | 17801755661641 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7f6f5d207980 | 0x7f6f5c825ec0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097350.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801756255956 | 17801755659504 | 17801757075028 | 17801757141234 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7f6f5d207800 | 0x7f6f5c825f00 | 0 | 0 | 0 | 0 | 0 | 0 | 19136512 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097335.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801757680751 | 17801757075028 | 17801758313591 | 17801758315835 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7f6f5d207680 | 0x7f6f5c825f40 | 0 | 0 | 0 | 0 | 0 | 0 | 25427968 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194632.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801758910511 | 17801758313591 | 17801759695515 | 17801759758329 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7f6f5f8a6500 | 0x7f6f5c825f80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194611.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 25427968 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801760291106 | 17801759695515 | 17801760940318 | 17801761003989 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7f6f5f8a6380 | 0x7f6f5c825fc0 | 0 | 0 | 25427968 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097351.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801761536015 | 17801760940318 | 17801762168322 | 17801762232548 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7f6f5f8a6200 | 0x7f6f5c826000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097361.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801762765425 | 17801762168322 | 17801763664326 | 17801763728721 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7f6f5f8a6080 | 0x7f6f5c826040 | 0 | 0 | 0 | 0 | 0 | 0 | 22282240 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097333.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801764268957 | 17801763664326 | 17801764988969 | 17801764990689 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7f6f5d207f00 | 0x7f6f5c826080 | 0 | 0 | 0 | 0 | 0 | 0 | 29622272 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194610.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801765584824 | 17801764988969 | 17801766402253 | 17801766468412 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7f6f5d207d80 | 0x7f6f5c8260c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194599.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 29622272 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801766998279 | 17801766402253 | 17801767675057 | 17801767740750 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7f6f5d207c00 | 0x7f6f5c826100 | 0 | 0 | 29622272 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097343.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801768270217 | 17801767675057 | 17801768934420 | 17801769000019 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7f6f5d207a80 | 0x7f6f5c826140 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097378.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801769530526 | 17801768934420 | 17801770421944 | 17801770489782 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7f6f5d207900 | 0x7f6f5c826180 | 0 | 0 | 0 | 0 | 0 | 0 | 25427968 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097340.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801771027449 | 17801770421944 | 17801771674268 | 17801771677733 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7f6f5d207780 | 0x7f6f5c8261c0 | 0 | 0 | 0 | 0 | 0 | 0 | 33816576 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194608.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801772270368 | 17801771674268 | 17801772980831 | 17801773024449 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7f6f5d207600 | 0x7f6f5c826200 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194610.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 33816576 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801773577105 | 17801772980831 | 17801774312995 | 17801774379626 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7f6f5f8a6480 | 0x7f6f5c826240 | 0 | 0 | 33816576 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097355.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801774909762 | 17801774312995 | 17801775639398 | 17801775705452 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7f6f5f8a6300 | 0x7f6f5c826280 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097317.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801776235409 | 17801775639398 | 17801777172843 | 17801777237174 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7f6f5f8a6180 | 0x7f6f5c8262c0 | 0 | 0 | 0 | 0 | 0 | 0 | 31719424 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097353.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801777778341 | 17801777172843 | 17801778495246 | 17801778561101 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7f6f5f8a6000 | 0x7f6f5c826300 | 0 | 0 | 0 | 0 | 0 | 0 | 42205184 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194594.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801779092898 | 17801778495246 | 17801779888370 | 17801779954486 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7f6f5d207e80 | 0x7f6f5c826340 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194606.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 42205184 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801780483833 | 17801779888370 | 17801781255254 | 17801781321172 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7f6f5d207d00 | 0x7f6f5c826380 | 0 | 0 | 42205184 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097326.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801781851479 | 17801781255254 | 17801782638938 | 17801782705888 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7f6f5d207b80 | 0x7f6f5c8263c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097322.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801783235395 | 17801782638938 | 17801784282782 | 17801784349427 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7f6f5d207a00 | 0x7f6f5c826400 | 0 | 0 | 0 | 0 | 0 | 0 | 38010880 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097376.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801784888654 | 17801784286611 | 17801785640863 | 17801785710463 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7f6f5d207880 | 0x7f6f5c826440 | 0 | 0 | 0 | 0 | 0 | 0 | 50593792 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194616.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801786233560 | 17801785640863 | 17801787073034 | 17801787133498 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7f6f5d207700 | 0x7f6f5c826480 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194622.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 50593792 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801787664545 | 17801787073034 | 17801788513847 | 17801788556452 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7f6f5f8a6580 | 0x7f6f5c8264c0 | 0 | 0 | 50593792 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097331.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801789106389 | 17801788513847 | 17801789960580 | 17801790020726 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7f6f5f8a6400 | 0x7f6f5c826500 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097327.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801790554152 | 17801789960580 | 17801791705235 | 17801791768312 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7f6f5f8a6280 | 0x7f6f5c826540 | 0 | 0 | 0 | 0 | 0 | 0 | 67371008 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097332.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801792307059 | 17801791705235 | 17801793226048 | 17801793287954 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7f6f5f8a6100 | 0x7f6f5c826580 | 0 | 0 | 0 | 0 | 0 | 0 | 67371008 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194557.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801793819091 | 17801793226048 | 17801794784622 | 17801794849316 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7f6f5d207f80 | 0x7f6f5c8265c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194555.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 67371008 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801795377733 | 17801794784622 | 17801796339356 | 17801796400667 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7f6f5d207e00 | 0x7f6f5c826600 | 0 | 0 | 67371008 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097328.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801796931794 | 17801796339356 | 17801797883849 | 17801797946429 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7f6f5d207c80 | 0x7f6f5c826640 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097314.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801798476845 | 17801797883849 | 17801799852666 | 17801799915350 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7f6f5d207b00 | 0x7f6f5c826680 | 0 | 0 | 0 | 0 | 0 | 0 | 134479872 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097325.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801800453796 | 17801799852666 | 17801801805964 | 17801801866371 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7f6f5d207980 | 0x7f6f5c8266c0 | 0 | 0 | 0 | 0 | 0 | 0 | 134479872 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194548.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801802398977 | 17801801805964 | 17801803774941 | 17801803837792 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7f6f5d207800 | 0x7f6f5c826700 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194541.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 134479872 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801804367059 | 17801803774941 | 17801805739278 | 17801805801943 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7f6f5d207680 | 0x7f6f5c826740 | 0 | 0 | 134479872 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097322.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801806332000 | 17801805739278 | 17801807683775 | 17801807751434 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7f6f5f8a6500 | 0x7f6f5c826780 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097312.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801808275501 | 17801807683775 | 17801810471799 | 17801810538585 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7f6f5f8a6380 | 0x7f6f5c8267c0 | 0 | 0 | 0 | 0 | 0 | 0 | 268697600 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097324.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801811078982 | 17801810471799 | 17801813240144 | 17801813302996 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7f6f5f8a6200 | 0x7f6f5c826800 | 0 | 0 | 0 | 0 | 0 | 0 | 268697600 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194543.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801813833723 | 17801813240144 | 17801816051048 | 17801816120056 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7f6f5f8a6080 | 0x7f6f5c826840 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194541.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 268697600 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801816644613 | 17801816051048 | 17801818846913 | 17801818913926 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7f6f5d207f00 | 0x7f6f5c826880 | 0 | 0 | 268697600 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097325.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801819439923 | 17801818846913 | 17801821616217 | 17801821677708 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 234779 | 234779 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7f6f5d207d80 | 0x7f6f5c8268c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097312.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17801822209165 | 17801821616217 | 17801826081216 | 17801826148897 |