66 KiB
66 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | SQ_INSTS_VALU_ADD_F16 | SQ_INSTS_VALU_MUL_F16 | SQ_INSTS_VALU_FMA_F16 | SQ_INSTS_VALU_TRANS_F16 | SQ_INSTS_VALU_ADD_F32 | SQ_INSTS_VALU_MUL_F32 | SQ_INSTS_VALU_FMA_F32 | SQ_INSTS_VALU_TRANS_F32 | TCP_TCC_READ_REQ_sum | TCP_TOTAL_CACHE_ACCESSES_sum | TCP_TCC_WRITE_REQ_sum | TCP_TCC_ATOMIC_WITH_RET_REQ_sum | TCC_EA_RDREQ_32B_sum | TCC_EA_RDREQ_sum | TCC_EA_WRREQ_64B_sum | TCC_EA_WRREQ_sum | SQ_INSTS_VALU_ADD_F64 | SQ_INSTS_VALU_MUL_F64 | SQ_INSTS_VALU_FMA_F64 | SQ_INSTS_VALU_TRANS_F64 | SQ_INSTS_VALU_MFMA_MOPS_F16 | SQ_INSTS_VALU_MFMA_MOPS_BF16 | SQ_INSTS_VALU_MFMA_MOPS_F32 | SQ_INSTS_VALU_MFMA_MOPS_F64 | TCP_TCC_ATOMIC_WITHOUT_RET_REQ_sum | SQ_LDS_IDX_ACTIVE | SQ_LDS_BANK_CONFLICT | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 228689 | 228689 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7fab9ca04280 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 8388608.0000000000 | 4194304.0000000000 | 0.0000000000 | 0.0000000000 | 309.0000000000 | 4128768.0000000000 | 4128768.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695745996020 | 17666284958929 | 17695893731942 | 17695893846323 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 228689 | 228689 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7fab9ca23f80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 8192.0000000000 | 16384.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 8260.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695899546920 | 17695893731942 | 17695899908008 | 17695899915190 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7fab9f92d380 | 0x7fab9ca23fc0 | 0 | 0 | 0 | 0 | 0 | 0 | 262144 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097342.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695900506745 | 17695899908008 | 17695901168501 | 17695901168529 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7fab9f92d200 | 0x7fab9ca24000 | 0 | 0 | 0 | 0 | 0 | 0 | 262144 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194579.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695901769584 | 17695901168501 | 17695902469155 | 17695902467586 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7fab9f92d080 | 0x7fab9ca24040 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194604.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 262144 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695903063681 | 17695902469155 | 17695903728849 | 17695903728244 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7fab9d1cdf00 | 0x7fab9ca24080 | 0 | 0 | 262144 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097343.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695904323509 | 17695903728849 | 17695904921342 | 17695904920284 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7fab9d1cdd80 | 0x7fab9ca240c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097344.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695905514109 | 17695904921342 | 17695906120874 | 17695906120744 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7fab9d1cdc00 | 0x7fab9ca24100 | 0 | 0 | 0 | 0 | 0 | 0 | 655360 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097338.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695906727059 | 17695906120874 | 17695907329527 | 17695907328614 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7fab9d1cda80 | 0x7fab9ca24140 | 0 | 0 | 0 | 0 | 0 | 0 | 786432 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194597.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695907923599 | 17695907329527 | 17695908637062 | 17695908636221 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7fab9d1cd900 | 0x7fab9ca24180 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194585.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 786432 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695909230926 | 17695908637062 | 17695909927955 | 17695909926728 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7fab9d1cd780 | 0x7fab9ca241c0 | 0 | 0 | 786432 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097344.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695910521443 | 17695909927955 | 17695911121408 | 17695911119348 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7fab9d1cd600 | 0x7fab9ca24200 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097339.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695911713204 | 17695911121408 | 17695912285261 | 17695912282969 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7fab9f92d480 | 0x7fab9ca24240 | 0 | 0 | 0 | 0 | 0 | 0 | 1048576 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097346.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695912885794 | 17695912285261 | 17695913474554 | 17695913472579 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7fab9f92d300 | 0x7fab9ca24280 | 0 | 0 | 0 | 0 | 0 | 0 | 1310720 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194604.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695914066235 | 17695913474554 | 17695914776168 | 17695914774067 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7fab9f92d180 | 0x7fab9ca242c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194594.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 1310720 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695915369512 | 17695914776168 | 17695916039381 | 17695916037355 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7fab9f92d000 | 0x7fab9ca24300 | 0 | 0 | 1310720 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097343.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695916632040 | 17695916039381 | 17695917194754 | 17695917192936 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7fab9d1cde80 | 0x7fab9ca24340 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097345.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695917787521 | 17695917194754 | 17695918403887 | 17695918402115 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7fab9d1cdd00 | 0x7fab9ca24380 | 0 | 0 | 0 | 0 | 0 | 0 | 1441792 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097343.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695919004350 | 17695918403887 | 17695919605339 | 17695919603605 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7fab9d1cdb80 | 0x7fab9ca243c0 | 0 | 0 | 0 | 0 | 0 | 0 | 1835008 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194574.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695920197770 | 17695919605339 | 17695920854953 | 17695920853334 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7fab9d1cda00 | 0x7fab9ca24400 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194574.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 1835008 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695921447889 | 17695920854953 | 17695922138327 | 17695922136621 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7fab9d1cd880 | 0x7fab9ca24440 | 0 | 0 | 1835008 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097345.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695922731996 | 17695922138327 | 17695923338020 | 17695923335761 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7fab9d1cd700 | 0x7fab9ca24480 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097351.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695923931096 | 17695923338020 | 17695924543633 | 17695924541821 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7fab9f92d580 | 0x7fab9ca244c0 | 0 | 0 | 0 | 0 | 0 | 0 | 1835008 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097348.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695925143846 | 17695924543633 | 17695925755486 | 17695925753780 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7fab9f92d400 | 0x7fab9ca24500 | 0 | 0 | 0 | 0 | 0 | 0 | 2359296 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194593.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695926349935 | 17695925755486 | 17695927020779 | 17695927019149 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7fab9f92d280 | 0x7fab9ca24540 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194586.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 2359296 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695927614344 | 17695927020779 | 17695928338873 | 17695928336975 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7fab9f92d100 | 0x7fab9ca24580 | 0 | 0 | 2359296 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097345.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695928933650 | 17695928338873 | 17695929576967 | 17695929575224 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7fab9d1cdf80 | 0x7fab9ca245c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097350.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695930171099 | 17695929576967 | 17695930788820 | 17695930787444 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7fab9d1cde00 | 0x7fab9ca24600 | 0 | 0 | 0 | 0 | 0 | 0 | 2228224 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097345.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695931390949 | 17695930788820 | 17695932001473 | 17695931999963 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7fab9d1cdc80 | 0x7fab9ca24640 | 0 | 0 | 0 | 0 | 0 | 0 | 2883584 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194594.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695932594799 | 17695932001473 | 17695933313647 | 17695933312011 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7fab9d1cdb00 | 0x7fab9ca24680 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194580.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 2883584 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695933907106 | 17695933313647 | 17695934621181 | 17695934619378 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7fab9d1cd980 | 0x7fab9ca246c0 | 0 | 0 | 2883584 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097355.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695935215003 | 17695934621181 | 17695935819914 | 17695935818338 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7fab9d1cd800 | 0x7fab9ca24700 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097349.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695936412743 | 17695935819914 | 17695937023767 | 17695937022247 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7fab9d1cd680 | 0x7fab9ca24740 | 0 | 0 | 0 | 0 | 0 | 0 | 2621440 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097344.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695937624182 | 17695937023767 | 17695938234500 | 17695938233077 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7fab9f92d500 | 0x7fab9ca24780 | 0 | 0 | 0 | 0 | 0 | 0 | 3407872 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194594.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695938828502 | 17695938234500 | 17695939518994 | 17695939517185 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7fab9f92d380 | 0x7fab9ca247c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194573.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 3407872 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695940111590 | 17695939518994 | 17695940783967 | 17695940782093 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7fab9f92d200 | 0x7fab9ca24800 | 0 | 0 | 3407872 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097351.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695941377798 | 17695940783967 | 17695941995660 | 17695941993762 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7fab9f92d080 | 0x7fab9ca24840 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097355.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695942589747 | 17695941995660 | 17695943181113 | 17695943179232 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7fab9d1cdf00 | 0x7fab9ca24880 | 0 | 0 | 0 | 0 | 0 | 0 | 3014656 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097345.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695943781927 | 17695943181113 | 17695944392326 | 17695944390392 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7fab9d1cdd80 | 0x7fab9ca248c0 | 0 | 0 | 0 | 0 | 0 | 0 | 3932160 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194590.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695944985367 | 17695944392326 | 17695945644019 | 17695945642170 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7fab9d1cdc00 | 0x7fab9ca24900 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194569.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 3932160 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695946238505 | 17695945644019 | 17695946963234 | 17695946961417 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7fab9d1cda80 | 0x7fab9ca24940 | 0 | 0 | 3932160 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097353.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695947556172 | 17695946963234 | 17695948165166 | 17695948163587 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7fab9d1cd900 | 0x7fab9ca24980 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097356.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695948757152 | 17695948165166 | 17695949354139 | 17695949352317 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7fab9d1cd780 | 0x7fab9ca249c0 | 0 | 0 | 0 | 0 | 0 | 0 | 3407872 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097352.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695949954852 | 17695949354139 | 17695950560232 | 17695950558477 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7fab9d1cd600 | 0x7fab9ca24a00 | 0 | 0 | 0 | 0 | 0 | 0 | 4456448 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194573.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695951153792 | 17695950560232 | 17695951833686 | 17695951832095 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7fab9f92d480 | 0x7fab9ca24a40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194576.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 4456448 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695952428070 | 17695951833686 | 17695953128900 | 17695953127143 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7fab9f92d300 | 0x7fab9ca24a80 | 0 | 0 | 4456448 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097349.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695953722028 | 17695953128900 | 17695954339313 | 17695954337392 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7fab9f92d180 | 0x7fab9ca24ac0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097359.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695954932707 | 17695954339313 | 17695955508285 | 17695955506753 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7fab9f92d000 | 0x7fab9ca24b00 | 0 | 0 | 0 | 0 | 0 | 0 | 3801088 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097352.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695956109387 | 17695955504638 | 17695956705122 | 17695956711552 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7fab9d1cde80 | 0x7fab9ca24b40 | 0 | 0 | 0 | 0 | 0 | 0 | 4980736 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194577.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695957301967 | 17695956705122 | 17695957990246 | 17695957991950 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7fab9d1cdd00 | 0x7fab9ca24b80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194576.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 4980736 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695958587575 | 17695957990246 | 17695959277291 | 17695959279268 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7fab9d1cdb80 | 0x7fab9ca24bc0 | 0 | 0 | 4980736 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097349.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695959873743 | 17695959277291 | 17695960491055 | 17695960492857 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7fab9d1cda00 | 0x7fab9ca24c00 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097360.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695961088572 | 17695960491055 | 17695961685780 | 17695961687877 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7fab9d1cd880 | 0x7fab9ca24c40 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097353.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695962290722 | 17695961685780 | 17695962875384 | 17695962877327 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7fab9d1cd700 | 0x7fab9ca24c80 | 0 | 0 | 0 | 0 | 0 | 0 | 5505024 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194576.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695963473352 | 17695962875384 | 17695964181149 | 17695964182794 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7fab9f92d580 | 0x7fab9ca24cc0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194558.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 5505024 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695964779209 | 17695964181149 | 17695965452833 | 17695965454642 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7fab9f92d400 | 0x7fab9ca24d00 | 0 | 0 | 5505024 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097351.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695966048847 | 17695965452833 | 17695966678438 | 17695966680271 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7fab9f92d280 | 0x7fab9ca24d40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097355.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695967277896 | 17695966678438 | 17695967886442 | 17695967888181 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7fab9f92d100 | 0x7fab9ca24d80 | 0 | 0 | 0 | 0 | 0 | 0 | 4587520 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097354.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695968491946 | 17695967886442 | 17695969084046 | 17695969085941 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7fab9d1cdf80 | 0x7fab9ca24dc0 | 0 | 0 | 0 | 0 | 0 | 0 | 6029312 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194574.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695969681056 | 17695969084046 | 17695970384211 | 17695970385749 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7fab9d1cde00 | 0x7fab9ca24e00 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194566.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 6029312 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695970981464 | 17695970384211 | 17695971672856 | 17695971674596 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7fab9d1cdc80 | 0x7fab9ca24e40 | 0 | 0 | 6029312 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097351.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695972269371 | 17695971672856 | 17695972863580 | 17695972865656 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7fab9d1cdb00 | 0x7fab9ca24e80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097356.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695973460531 | 17695972863580 | 17695974056704 | 17695974058916 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7fab9d1cd980 | 0x7fab9ca24ec0 | 0 | 0 | 0 | 0 | 0 | 0 | 4980736 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097352.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695974673961 | 17695974056704 | 17695975281349 | 17695975283165 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7fab9d1cd800 | 0x7fab9ca24f00 | 0 | 0 | 0 | 0 | 0 | 0 | 6553600 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194548.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695975877730 | 17695975281349 | 17695976567914 | 17695976569783 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7fab9d1cd680 | 0x7fab9ca24f40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194559.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 6553600 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695977162688 | 17695976567914 | 17695977834158 | 17695977836151 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7fab9f92d500 | 0x7fab9ca24f80 | 0 | 0 | 6553600 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097350.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695978430636 | 17695977834158 | 17695979022323 | 17695979024321 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7fab9f92d380 | 0x7fab9ca24fc0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097354.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695979618796 | 17695979022323 | 17695980213207 | 17695980214731 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7fab9f92d200 | 0x7fab9ca25000 | 0 | 0 | 0 | 0 | 0 | 0 | 5373952 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097351.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695980818276 | 17695980213207 | 17695981401531 | 17695981403481 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7fab9f92d080 | 0x7fab9ca25040 | 0 | 0 | 0 | 0 | 0 | 0 | 7077888 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194554.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695981998956 | 17695981401531 | 17695982708576 | 17695982710598 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7fab9d1cdf00 | 0x7fab9ca25080 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194551.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 7077888 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695983305603 | 17695982708576 | 17695984018181 | 17695984019865 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7fab9d1cdd80 | 0x7fab9ca250c0 | 0 | 0 | 7077888 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097358.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695984614420 | 17695984018181 | 17695985203945 | 17695985205816 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7fab9d1cdc00 | 0x7fab9ca25100 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097347.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695985799221 | 17695985203945 | 17695986417869 | 17695986419495 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7fab9d1cda80 | 0x7fab9ca25140 | 0 | 0 | 0 | 0 | 0 | 0 | 5767168 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097353.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695987022520 | 17695986417869 | 17695987626994 | 17695987628805 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7fab9d1cd900 | 0x7fab9ca25180 | 0 | 0 | 0 | 0 | 0 | 0 | 7602176 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194557.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695988224950 | 17695987626994 | 17695988908118 | 17695988910123 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7fab9d1cd780 | 0x7fab9ca251c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194574.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 7602176 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695989504438 | 17695988908118 | 17695990183003 | 17695990185121 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7fab9d1cd600 | 0x7fab9ca25200 | 0 | 0 | 7602176 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097360.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695990779036 | 17695990183003 | 17695991361727 | 17695991363491 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7fab9f92d480 | 0x7fab9ca25240 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097350.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695991958886 | 17695991361727 | 17695992587972 | 17695992589930 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7fab9f92d300 | 0x7fab9ca25280 | 0 | 0 | 0 | 0 | 0 | 0 | 6160384 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097355.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695993192925 | 17695992587972 | 17695993794056 | 17695993795860 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7fab9f92d180 | 0x7fab9ca252c0 | 0 | 0 | 0 | 0 | 0 | 0 | 8126464 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194572.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695994391485 | 17695993794056 | 17695995094061 | 17695995095927 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7fab9f92d000 | 0x7fab9ca25300 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194561.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 8126464 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695995691102 | 17695995094061 | 17695996385266 | 17695996387135 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7fab9d1cde80 | 0x7fab9ca25340 | 0 | 0 | 8126464 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097362.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695996981100 | 17695996385266 | 17695997557590 | 17695997559275 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7fab9d1cdd00 | 0x7fab9ca25380 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097339.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695998155000 | 17695997557590 | 17695998787354 | 17695998789004 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7fab9d1cdb80 | 0x7fab9ca253c0 | 0 | 0 | 0 | 0 | 0 | 0 | 6553600 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097355.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17695999390769 | 17695998787354 | 17695999995359 | 17695999997264 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7fab9d1cda00 | 0x7fab9ca25400 | 0 | 0 | 0 | 0 | 0 | 0 | 8650752 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194563.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696000591609 | 17695999995359 | 17696001265283 | 17696001266922 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7fab9d1cd880 | 0x7fab9ca25440 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194587.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 8650752 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696001861457 | 17696001265283 | 17696002547368 | 17696002549380 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7fab9d1cd700 | 0x7fab9ca25480 | 0 | 0 | 8650752 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097363.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696003144805 | 17696002547368 | 17696003740332 | 17696003742129 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7fab9f92d580 | 0x7fab9ca254c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097344.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696004337824 | 17696003740332 | 17696004973457 | 17696004975268 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7fab9f92d400 | 0x7fab9ca25500 | 0 | 0 | 0 | 0 | 0 | 0 | 6946816 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097357.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696005577233 | 17696004973457 | 17696006231061 | 17696006232697 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7fab9f92d280 | 0x7fab9ca25540 | 0 | 0 | 0 | 0 | 0 | 0 | 9175040 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194560.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696006829592 | 17696006231061 | 17696007508186 | 17696007509855 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7fab9f92d100 | 0x7fab9ca25580 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194598.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 9175040 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696008104360 | 17696007508186 | 17696008772031 | 17696008774053 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7fab9d1cdf80 | 0x7fab9ca255c0 | 0 | 0 | 9175040 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097363.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696009368648 | 17696008772031 | 17696009968035 | 17696009969913 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7fab9d1cde00 | 0x7fab9ca25600 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097334.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696010565478 | 17696009968035 | 17696011210439 | 17696011212242 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7fab9d1cdc80 | 0x7fab9ca25640 | 0 | 0 | 0 | 0 | 0 | 0 | 7340032 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097356.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696011813877 | 17696011210439 | 17696012415564 | 17696012417322 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7fab9d1cdb00 | 0x7fab9ca25680 | 0 | 0 | 0 | 0 | 0 | 0 | 9699328 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194569.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696013012137 | 17696012415564 | 17696013696848 | 17696013698699 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7fab9d1cd980 | 0x7fab9ca256c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194589.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 9699328 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696014294454 | 17696013696848 | 17696014977493 | 17696014979317 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7fab9d1cd800 | 0x7fab9ca25700 | 0 | 0 | 9699328 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097359.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696015573772 | 17696014977493 | 17696016164057 | 17696016165557 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7fab9d1cd680 | 0x7fab9ca25740 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097331.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696016760892 | 17696016164057 | 17696017401342 | 17696017402936 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7fab9f92d500 | 0x7fab9ca25780 | 0 | 0 | 0 | 0 | 0 | 0 | 8126464 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097358.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696018004871 | 17696017401342 | 17696018618146 | 17696018620006 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7fab9f92d380 | 0x7fab9ca257c0 | 0 | 0 | 0 | 0 | 0 | 0 | 10747904 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194599.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696019215381 | 17696018617610 | 17696019904812 | 17696019906893 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7fab9f92d200 | 0x7fab9ca25800 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194590.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 10747904 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696020502268 | 17696019904812 | 17696021180976 | 17696021183201 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7fab9f92d080 | 0x7fab9ca25840 | 0 | 0 | 10747904 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097357.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696021778676 | 17696021180976 | 17696022369779 | 17696022371961 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7fab9d1cdf00 | 0x7fab9ca25880 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097330.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696022967446 | 17696022369779 | 17696023629942 | 17696023632120 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7fab9d1cdd80 | 0x7fab9ca258c0 | 0 | 0 | 0 | 0 | 0 | 0 | 8912896 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097362.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696024235165 | 17696023629942 | 17696024817786 | 17696024819870 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7fab9d1cdc00 | 0x7fab9ca25900 | 0 | 0 | 0 | 0 | 0 | 0 | 11796480 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194606.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696025414385 | 17696024817786 | 17696026104669 | 17696026107048 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7fab9d1cda80 | 0x7fab9ca25940 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194596.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 11796480 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696026701543 | 17696026104669 | 17696027381153 | 17696027383556 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7fab9d1cd900 | 0x7fab9ca25980 | 0 | 0 | 11796480 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097356.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696027977561 | 17696027381153 | 17696028576676 | 17696028578626 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7fab9d1cd780 | 0x7fab9ca259c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097333.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696029171691 | 17696028576676 | 17696029820839 | 17696029822894 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7fab9d1cd600 | 0x7fab9ca25a00 | 0 | 0 | 0 | 0 | 0 | 0 | 9699328 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097365.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696030426979 | 17696029820839 | 17696031005802 | 17696031007454 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7fab9f92d480 | 0x7fab9ca25a40 | 0 | 0 | 0 | 0 | 0 | 0 | 12845056 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194603.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696031601779 | 17696031005802 | 17696032244846 | 17696032246963 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7fab9f92d300 | 0x7fab9ca25a80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194608.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 12845056 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696032841688 | 17696032244846 | 17696033498769 | 17696033500572 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7fab9f92d180 | 0x7fab9ca25ac0 | 0 | 0 | 12845056 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097342.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696034095817 | 17696033498769 | 17696034678292 | 17696034680342 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7fab9f92d000 | 0x7fab9ca25b00 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097329.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696035274417 | 17696034678292 | 17696035971416 | 17696035973159 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7fab9d1cde80 | 0x7fab9ca25b40 | 0 | 0 | 0 | 0 | 0 | 0 | 11272192 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097357.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696036575214 | 17696035971416 | 17696037147099 | 17696037149580 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7fab9d1cdd00 | 0x7fab9ca25b80 | 0 | 0 | 0 | 0 | 0 | 0 | 14942208 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194630.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696037743535 | 17696037147099 | 17696038426142 | 17696038429057 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7fab9d1cdb80 | 0x7fab9ca25bc0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194638.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 14942208 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696039022803 | 17696038426142 | 17696039713666 | 17696039715965 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7fab9d1cda00 | 0x7fab9ca25c00 | 0 | 0 | 14942208 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097328.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696040311740 | 17696039713666 | 17696040927269 | 17696040929525 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7fab9d1cd880 | 0x7fab9ca25c40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097337.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696041524120 | 17696040927269 | 17696042231113 | 17696042298180 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7fab9d1cd700 | 0x7fab9ca25c80 | 0 | 0 | 0 | 0 | 0 | 0 | 12845056 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097342.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696042836557 | 17696042231113 | 17696043450796 | 17696043452921 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7fab9f92d580 | 0x7fab9ca25cc0 | 0 | 0 | 0 | 0 | 0 | 0 | 17039360 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194632.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696044048106 | 17696043450796 | 17696044743279 | 17696044748079 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7fab9f92d400 | 0x7fab9ca25d00 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194643.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 17039360 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696045340904 | 17696044743279 | 17696046018643 | 17696046023227 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7fab9f92d280 | 0x7fab9ca25d40 | 0 | 0 | 17039360 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097346.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696046616132 | 17696046018643 | 17696047252406 | 17696047254736 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7fab9f92d100 | 0x7fab9ca25d80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097343.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696047849071 | 17696047252406 | 17696048586010 | 17696048651751 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7fab9d1cdf80 | 0x7fab9ca25dc0 | 0 | 0 | 0 | 0 | 0 | 0 | 15990784 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097340.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696049191037 | 17696048586010 | 17696049853533 | 17696049856020 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7fab9d1cde00 | 0x7fab9ca25e00 | 0 | 0 | 0 | 0 | 0 | 0 | 21233664 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194655.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696050451725 | 17696049853533 | 17696051126657 | 17696051191997 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7fab9d1cdc80 | 0x7fab9ca25e40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194638.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 21233664 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696051723543 | 17696051126657 | 17696052419780 | 17696052491434 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7fab9d1cdb00 | 0x7fab9ca25e80 | 0 | 0 | 21233664 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097343.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696053016651 | 17696052419780 | 17696053679144 | 17696053681274 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7fab9d1cd980 | 0x7fab9ca25ec0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097351.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696054276019 | 17696053679144 | 17696055107947 | 17696055173647 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7fab9d1cd800 | 0x7fab9ca25f00 | 0 | 0 | 0 | 0 | 0 | 0 | 19136512 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097330.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696055713173 | 17696055107947 | 17696056358831 | 17696056360867 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7fab9d1cd680 | 0x7fab9ca25f40 | 0 | 0 | 0 | 0 | 0 | 0 | 25427968 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194633.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696056954812 | 17696056358831 | 17696057649554 | 17696057716753 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7fab9f92d500 | 0x7fab9ca25f80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194614.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 25427968 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696058247339 | 17696057649554 | 17696058952758 | 17696059019010 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7fab9f92d380 | 0x7fab9ca25fc0 | 0 | 0 | 25427968 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097344.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696059549726 | 17696058952758 | 17696060248281 | 17696060313617 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7fab9f92d200 | 0x7fab9ca26000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097367.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696060846344 | 17696060248281 | 17696061695005 | 17696061761171 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7fab9f92d080 | 0x7fab9ca26040 | 0 | 0 | 0 | 0 | 0 | 0 | 22282240 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097334.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696062301217 | 17696061695005 | 17696062934368 | 17696062936981 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7fab9d1cdf00 | 0x7fab9ca26080 | 0 | 0 | 0 | 0 | 0 | 0 | 29622272 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194622.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696063532756 | 17696062934368 | 17696064261732 | 17696064305167 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7fab9d1cdd80 | 0x7fab9ca260c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194604.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 29622272 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696064858283 | 17696064261732 | 17696065597416 | 17696065660843 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7fab9d1cdc00 | 0x7fab9ca26100 | 0 | 0 | 29622272 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097342.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696066195120 | 17696065597416 | 17696066909099 | 17696066975180 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7fab9d1cda80 | 0x7fab9ca26140 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097376.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696067506117 | 17696066909099 | 17696068396943 | 17696068463283 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7fab9d1cd900 | 0x7fab9ca26180 | 0 | 0 | 0 | 0 | 0 | 0 | 25427968 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097349.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696069003079 | 17696068396943 | 17696069699027 | 17696069700931 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7fab9d1cd780 | 0x7fab9ca261c0 | 0 | 0 | 0 | 0 | 0 | 0 | 33816576 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194611.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696070296256 | 17696069699027 | 17696071032790 | 17696071098286 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7fab9d1cd600 | 0x7fab9ca26200 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194603.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 33816576 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696071629683 | 17696071032790 | 17696072381594 | 17696072448122 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7fab9f92d480 | 0x7fab9ca26240 | 0 | 0 | 33816576 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097349.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696072979109 | 17696072381594 | 17696073723518 | 17696073789159 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7fab9f92d300 | 0x7fab9ca26280 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097322.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696074322005 | 17696073723518 | 17696075252962 | 17696075318680 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7fab9f92d180 | 0x7fab9ca262c0 | 0 | 0 | 0 | 0 | 0 | 0 | 31719424 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097353.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696075858536 | 17696075252962 | 17696076576645 | 17696076643297 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7fab9f92d000 | 0x7fab9ca26300 | 0 | 0 | 0 | 0 | 0 | 0 | 42205184 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194592.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696077174333 | 17696076576645 | 17696077986249 | 17696078052391 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7fab9d1cde80 | 0x7fab9ca26340 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194606.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 42205184 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696078583968 | 17696077986249 | 17696079364973 | 17696079428947 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7fab9d1cdd00 | 0x7fab9ca26380 | 0 | 0 | 42205184 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097327.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696079961403 | 17696079364973 | 17696080771217 | 17696080813882 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7fab9d1cdb80 | 0x7fab9ca263c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097322.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696081368948 | 17696080772911 | 17696082410040 | 17696082481410 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7fab9d1cda00 | 0x7fab9ca26400 | 0 | 0 | 0 | 0 | 0 | 0 | 38010880 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097384.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696083013637 | 17696082410040 | 17696083762366 | 17696083826496 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7fab9d1cd880 | 0x7fab9ca26440 | 0 | 0 | 0 | 0 | 0 | 0 | 50593792 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194621.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696084358003 | 17696083762366 | 17696085212934 | 17696085277790 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7fab9d1cd700 | 0x7fab9ca26480 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194621.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 50593792 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696085808897 | 17696085212934 | 17696086670542 | 17696086734303 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7fab9f92d580 | 0x7fab9ca264c0 | 0 | 0 | 50593792 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097333.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696087265940 | 17696086670542 | 17696088124790 | 17696088166557 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7fab9f92d400 | 0x7fab9ca26500 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097327.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696088719873 | 17696088124790 | 17696089880159 | 17696089944502 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7fab9f92d280 | 0x7fab9ca26540 | 0 | 0 | 0 | 0 | 0 | 0 | 67371008 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097332.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696090484269 | 17696089880159 | 17696091435367 | 17696091498373 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7fab9f92d100 | 0x7fab9ca26580 | 0 | 0 | 0 | 0 | 0 | 0 | 67371008 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194554.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696092031670 | 17696091435367 | 17696092987696 | 17696093049824 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7fab9d1cdf80 | 0x7fab9ca265c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194556.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 67371008 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696093582421 | 17696092987696 | 17696094544984 | 17696094609835 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7fab9d1cde00 | 0x7fab9ca26600 | 0 | 0 | 67371008 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097331.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696095140142 | 17696094544984 | 17696096160833 | 17696096224884 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7fab9d1cdc80 | 0x7fab9ca26640 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097313.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696096756371 | 17696096160833 | 17696098123243 | 17696098188195 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7fab9d1cdb00 | 0x7fab9ca26680 | 0 | 0 | 0 | 0 | 0 | 0 | 134479872 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097326.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696098726891 | 17696098123243 | 17696100108054 | 17696100171635 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7fab9d1cd980 | 0x7fab9ca266c0 | 0 | 0 | 0 | 0 | 0 | 0 | 134479872 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194547.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696100703482 | 17696100108054 | 17696102095585 | 17696102149826 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7fab9d1cd800 | 0x7fab9ca26700 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194545.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 134479872 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696102690562 | 17696102095585 | 17696104090475 | 17696104155305 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7fab9d1cd680 | 0x7fab9ca26740 | 0 | 0 | 134479872 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097329.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696104685722 | 17696104090475 | 17696106062646 | 17696106129306 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7fab9f92d500 | 0x7fab9ca26780 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097313.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696106657812 | 17696106062646 | 17696108856101 | 17696108920345 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7fab9f92d380 | 0x7fab9ca267c0 | 0 | 0 | 0 | 0 | 0 | 0 | 268697600 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097322.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696109466212 | 17696108856101 | 17696111624276 | 17696111694816 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7fab9f92d200 | 0x7fab9ca26800 | 0 | 0 | 0 | 0 | 0 | 0 | 268697600 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194547.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696112221192 | 17696111624276 | 17696114445411 | 17696114515674 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7fab9f92d080 | 0x7fab9ca26840 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194542.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 268697600 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696115042441 | 17696114445411 | 17696117288626 | 17696117353873 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7fab9d1cdf00 | 0x7fab9ca26880 | 0 | 0 | 268697600 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097321.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696117884560 | 17696117288626 | 17696120082241 | 17696120153423 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 228689 | 228689 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7fab9d1cdd80 | 0x7fab9ca268c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097313.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17696120678200 | 17696120082241 | 17696124552345 | 17696124620781 |