66 KiB
66 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | SQ_INSTS_VALU_ADD_F16 | SQ_INSTS_VALU_MUL_F16 | SQ_INSTS_VALU_FMA_F16 | SQ_INSTS_VALU_TRANS_F16 | SQ_INSTS_VALU_ADD_F32 | SQ_INSTS_VALU_MUL_F32 | SQ_INSTS_VALU_FMA_F32 | SQ_INSTS_VALU_TRANS_F32 | TCP_TCC_READ_REQ_sum | TCP_TOTAL_CACHE_ACCESSES_sum | TCP_TCC_WRITE_REQ_sum | TCP_TCC_ATOMIC_WITH_RET_REQ_sum | TCC_EA_RDREQ_32B_sum | TCC_EA_RDREQ_sum | TCC_EA_WRREQ_64B_sum | TCC_EA_WRREQ_sum | SQ_INSTS_VALU_ADD_F64 | SQ_INSTS_VALU_MUL_F64 | SQ_INSTS_VALU_FMA_F64 | SQ_INSTS_VALU_TRANS_F64 | SQ_INSTS_VALU_MFMA_MOPS_F16 | SQ_INSTS_VALU_MFMA_MOPS_BF16 | SQ_INSTS_VALU_MFMA_MOPS_F32 | SQ_INSTS_VALU_MFMA_MOPS_F64 | TCP_TCC_ATOMIC_WITHOUT_RET_REQ_sum | SQ_LDS_IDX_ACTIVE | SQ_LDS_BANK_CONFLICT | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 241894 | 241894 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7f6e9cc04280 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 8388608.0000000000 | 4194304.0000000000 | 0.0000000000 | 0.0000000000 | 310.0000000000 | 4128768.0000000000 | 4128768.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931286038190 | 17901582538237 | 17931431845031 | 17931431958331 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 241894 | 241894 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7f6e9cc23f80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 8192.0000000000 | 16384.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 8262.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931437652391 | 17931431845031 | 17931438008283 | 17931438016542 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7f6e9fb92380 | 0x7f6e9cc23fc0 | 0 | 0 | 0 | 0 | 0 | 0 | 262144 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097343.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931438610067 | 17931438008283 | 17931439296934 | 17931439297600 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7f6e9fb92200 | 0x7f6e9cc24000 | 0 | 0 | 0 | 0 | 0 | 0 | 262144 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194598.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931439896726 | 17931439296934 | 17931440654066 | 17931440654347 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7f6e9fb92080 | 0x7f6e9cc24040 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194586.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 262144 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931441249002 | 17931440654066 | 17931441888957 | 17931441888907 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7f6e9d3fbf00 | 0x7f6e9cc24080 | 0 | 0 | 262144 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097342.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931442483772 | 17931441888957 | 17931443061927 | 17931443061768 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7f6e9d3fbd80 | 0x7f6e9cc240c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097350.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931443654893 | 17931443061927 | 17931444270097 | 17931444270318 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7f6e9d3fbc00 | 0x7f6e9cc24100 | 0 | 0 | 0 | 0 | 0 | 0 | 655360 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097341.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931444878293 | 17931444270097 | 17931445513628 | 17931445513617 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7f6e9d3fba80 | 0x7f6e9cc24140 | 0 | 0 | 0 | 0 | 0 | 0 | 786432 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194601.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931446109953 | 17931445513628 | 17931446796999 | 17931446796706 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7f6e9d3fb900 | 0x7f6e9cc24180 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194592.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 786432 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931447390461 | 17931446796999 | 17931448085010 | 17931448085344 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7f6e9d3fb780 | 0x7f6e9cc241c0 | 0 | 0 | 786432 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097346.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931448679459 | 17931448085010 | 17931449284541 | 17931449283804 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7f6e9d3fb600 | 0x7f6e9cc24200 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097349.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931449878840 | 17931449284541 | 17931450461831 | 17931450460825 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7f6e9fb92480 | 0x7f6e9cc24240 | 0 | 0 | 0 | 0 | 0 | 0 | 1048576 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097346.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931451064630 | 17931450461831 | 17931451643121 | 17931451642216 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7f6e9fb92300 | 0x7f6e9cc24280 | 0 | 0 | 0 | 0 | 0 | 0 | 1310720 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194598.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931452238161 | 17931451643121 | 17931452901692 | 17931452902205 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7f6e9fb92180 | 0x7f6e9cc242c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194591.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 1310720 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931453495930 | 17931452901692 | 17931454162023 | 17931454161224 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7f6e9fb92000 | 0x7f6e9cc24300 | 0 | 0 | 1310720 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097348.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931454757129 | 17931454162023 | 17931455333553 | 17931455332625 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7f6e9d3fbe80 | 0x7f6e9cc24340 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097348.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931455927240 | 17931455333553 | 17931456583484 | 17931456582484 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7f6e9d3fbd00 | 0x7f6e9cc24380 | 0 | 0 | 0 | 0 | 0 | 0 | 1441792 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097343.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931457186039 | 17931456583484 | 17931457769414 | 17931457768915 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7f6e9d3fbb80 | 0x7f6e9cc243c0 | 0 | 0 | 0 | 0 | 0 | 0 | 1835008 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194588.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931458364860 | 17931457769414 | 17931459054866 | 17931459054263 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7f6e9d3fba00 | 0x7f6e9cc24400 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194575.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 1835008 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931459649358 | 17931459054866 | 17931460315677 | 17931460314952 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7f6e9d3fb880 | 0x7f6e9cc24440 | 0 | 0 | 1835008 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097347.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931460910027 | 17931460315677 | 17931461506727 | 17931461506243 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7f6e9d3fb700 | 0x7f6e9cc24480 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097353.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931462101478 | 17931461506727 | 17931462694257 | 17931462693633 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7f6e9fb92580 | 0x7f6e9cc244c0 | 0 | 0 | 0 | 0 | 0 | 0 | 1835008 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097345.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931463295288 | 17931462694257 | 17931463897788 | 17931463897254 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7f6e9fb92400 | 0x7f6e9cc24500 | 0 | 0 | 0 | 0 | 0 | 0 | 2359296 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194603.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931464492269 | 17931463897788 | 17931465197479 | 17931465196962 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7f6e9fb92280 | 0x7f6e9cc24540 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194600.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 2359296 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931465792187 | 17931465197479 | 17931466490450 | 17931466490150 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7f6e9fb92100 | 0x7f6e9cc24580 | 0 | 0 | 2359296 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097339.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931467085385 | 17931466490450 | 17931467694941 | 17931467694110 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7f6e9d3fbf80 | 0x7f6e9cc245c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097356.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931468289745 | 17931467694941 | 17931468887111 | 17931468886380 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7f6e9d3fbe00 | 0x7f6e9cc24600 | 0 | 0 | 0 | 0 | 0 | 0 | 2228224 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097345.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931469488906 | 17931468887111 | 17931470086641 | 17931470086261 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7f6e9d3fbc80 | 0x7f6e9cc24640 | 0 | 0 | 0 | 0 | 0 | 0 | 2883584 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194594.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931470682256 | 17931470086641 | 17931471372412 | 17931471371759 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7f6e9d3fbb00 | 0x7f6e9cc24680 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194599.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 2883584 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931471966224 | 17931471372412 | 17931472621223 | 17931472620428 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7f6e9d3fb980 | 0x7f6e9cc246c0 | 0 | 0 | 2883584 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097351.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931473214744 | 17931472621223 | 17931473825234 | 17931473824429 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7f6e9d3fb800 | 0x7f6e9cc24700 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097358.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931474420014 | 17931473825234 | 17931475014364 | 17931475013719 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7f6e9d3fb680 | 0x7f6e9cc24740 | 0 | 0 | 0 | 0 | 0 | 0 | 2621440 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097349.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931475616154 | 17931475014364 | 17931476214534 | 17931476213720 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7f6e9fb92500 | 0x7f6e9cc24780 | 0 | 0 | 0 | 0 | 0 | 0 | 3407872 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194589.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931476809445 | 17931476214534 | 17931477471985 | 17931477471269 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7f6e9fb92380 | 0x7f6e9cc247c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194599.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 3407872 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931478066654 | 17931477471985 | 17931478786077 | 17931478785096 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7f6e9fb92200 | 0x7f6e9cc24800 | 0 | 0 | 3407872 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097352.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931479380772 | 17931478786077 | 17931479982247 | 17931479981507 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7f6e9fb92080 | 0x7f6e9cc24840 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097355.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931480577002 | 17931479982247 | 17931481180658 | 17931481179897 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7f6e9d3fbf00 | 0x7f6e9cc24880 | 0 | 0 | 0 | 0 | 0 | 0 | 3014656 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097353.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931481783572 | 17931481180658 | 17931482389948 | 17931482389477 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7f6e9d3fbd80 | 0x7f6e9cc248c0 | 0 | 0 | 0 | 0 | 0 | 0 | 3932160 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194587.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931482984303 | 17931482389948 | 17931483666759 | 17931483665896 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7f6e9d3fbc00 | 0x7f6e9cc24900 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194584.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 3932160 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931484260321 | 17931483666759 | 17931484937490 | 17931484936684 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7f6e9d3fba80 | 0x7f6e9cc24940 | 0 | 0 | 3932160 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097349.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931485531900 | 17931484937490 | 17931486110620 | 17931486110215 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7f6e9d3fb900 | 0x7f6e9cc24980 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097360.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931486706081 | 17931486110620 | 17931487349511 | 17931487348905 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7f6e9d3fb780 | 0x7f6e9cc249c0 | 0 | 0 | 0 | 0 | 0 | 0 | 3407872 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097355.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931487951860 | 17931487349511 | 17931488539121 | 17931488538166 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7f6e9d3fb600 | 0x7f6e9cc24a00 | 0 | 0 | 0 | 0 | 0 | 0 | 4456448 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194576.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931489132651 | 17931488539121 | 17931489830013 | 17931489829184 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7f6e9fb92480 | 0x7f6e9cc24a40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194573.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 4456448 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931490425310 | 17931489830013 | 17931491077703 | 17931491077114 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7f6e9fb92300 | 0x7f6e9cc24a80 | 0 | 0 | 4456448 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097359.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931491671899 | 17931491077703 | 17931492247954 | 17931492246995 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7f6e9fb92180 | 0x7f6e9cc24ac0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097360.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931492843600 | 17931492247954 | 17931493456284 | 17931493455485 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7f6e9fb92000 | 0x7f6e9cc24b00 | 0 | 0 | 0 | 0 | 0 | 0 | 3801088 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097354.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931494058810 | 17931493453590 | 17931494682874 | 17931494689224 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7f6e9d3fbe80 | 0x7f6e9cc24b40 | 0 | 0 | 0 | 0 | 0 | 0 | 4980736 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194581.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931495280200 | 17931494682874 | 17931495959518 | 17931495961423 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7f6e9d3fbd00 | 0x7f6e9cc24b80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194567.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 4980736 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931496557148 | 17931495959518 | 17931497225602 | 17931497227582 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7f6e9d3fbb80 | 0x7f6e9cc24bc0 | 0 | 0 | 4980736 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097359.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931497822167 | 17931497225602 | 17931498439046 | 17931498440972 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7f6e9d3fba00 | 0x7f6e9cc24c00 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097360.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931499036607 | 17931498439046 | 17931499676811 | 17931499678731 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7f6e9d3fb880 | 0x7f6e9cc24c40 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097354.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931500282406 | 17931499676811 | 17931500871695 | 17931500873582 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7f6e9d3fb700 | 0x7f6e9cc24c80 | 0 | 0 | 0 | 0 | 0 | 0 | 5505024 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194564.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931501469007 | 17931500871695 | 17931502181619 | 17931502183809 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7f6e9fb92580 | 0x7f6e9cc24cc0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194582.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 5505024 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931502779455 | 17931502181619 | 17931503448824 | 17931503450778 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7f6e9fb92400 | 0x7f6e9cc24d00 | 0 | 0 | 5505024 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097357.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931504045804 | 17931503448824 | 17931504632348 | 17931504634249 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7f6e9fb92280 | 0x7f6e9cc24d40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097354.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931505229384 | 17931504632348 | 17931505819072 | 17931505821200 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7f6e9fb92100 | 0x7f6e9cc24d80 | 0 | 0 | 0 | 0 | 0 | 0 | 4587520 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097354.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931506426265 | 17931505819072 | 17931507024196 | 17931507026030 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7f6e9d3fbf80 | 0x7f6e9cc24dc0 | 0 | 0 | 0 | 0 | 0 | 0 | 6029312 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194578.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931507622745 | 17931507024196 | 17931508323720 | 17931508325528 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7f6e9d3fbe00 | 0x7f6e9cc24e00 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194563.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 6029312 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931508920573 | 17931508323720 | 17931509606605 | 17931509608486 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7f6e9d3fbc80 | 0x7f6e9cc24e40 | 0 | 0 | 6029312 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097358.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931510204242 | 17931509606605 | 17931510819569 | 17931510821676 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7f6e9d3fbb00 | 0x7f6e9cc24e80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097358.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931511418772 | 17931510819569 | 17931512037173 | 17931512038886 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7f6e9d3fb980 | 0x7f6e9cc24ec0 | 0 | 0 | 0 | 0 | 0 | 0 | 4980736 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097355.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931512653431 | 17931512037173 | 17931513258617 | 17931513260716 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7f6e9d3fb800 | 0x7f6e9cc24f00 | 0 | 0 | 0 | 0 | 0 | 0 | 6553600 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194552.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931513855281 | 17931513258617 | 17931514545022 | 17931514546714 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7f6e9d3fb680 | 0x7f6e9cc24f40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194581.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 6553600 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931515141570 | 17931514545022 | 17931515831586 | 17931515833583 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7f6e9fb92500 | 0x7f6e9cc24f80 | 0 | 0 | 6553600 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097358.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931516429018 | 17931515831586 | 17931517042150 | 17931517043903 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7f6e9fb92380 | 0x7f6e9cc24fc0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097344.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931517640008 | 17931517042150 | 17931518263594 | 17931518265393 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7f6e9fb92200 | 0x7f6e9cc25000 | 0 | 0 | 0 | 0 | 0 | 0 | 5373952 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097353.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931518868678 | 17931518263594 | 17931519465199 | 17931519467023 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7f6e9fb92080 | 0x7f6e9cc25040 | 0 | 0 | 0 | 0 | 0 | 0 | 7077888 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194554.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931520062218 | 17931519465199 | 17931520784243 | 17931520786160 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7f6e9d3fbf00 | 0x7f6e9cc25080 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194565.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 7077888 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931521382056 | 17931520784243 | 17931522085367 | 17931522087588 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7f6e9d3fbd80 | 0x7f6e9cc250c0 | 0 | 0 | 7077888 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097358.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931522682734 | 17931522085367 | 17931523270492 | 17931523272329 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7f6e9d3fbc00 | 0x7f6e9cc25100 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097347.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931523866774 | 17931523270492 | 17931524491296 | 17931524493099 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7f6e9d3fba80 | 0x7f6e9cc25140 | 0 | 0 | 0 | 0 | 0 | 0 | 5767168 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097358.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931525096034 | 17931524491296 | 17931525708420 | 17931525710099 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7f6e9d3fb900 | 0x7f6e9cc25180 | 0 | 0 | 0 | 0 | 0 | 0 | 7602176 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194573.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931526306344 | 17931525708420 | 17931526994504 | 17931526996417 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7f6e9d3fb780 | 0x7f6e9cc251c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194553.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 7602176 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931527591412 | 17931526994504 | 17931528246509 | 17931528248406 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7f6e9d3fb600 | 0x7f6e9cc25200 | 0 | 0 | 7602176 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097362.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931528842192 | 17931528246509 | 17931529476753 | 17931529478686 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7f6e9fb92480 | 0x7f6e9cc25240 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097335.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931530074181 | 17931529476753 | 17931530826677 | 17931530828443 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7f6e9fb92300 | 0x7f6e9cc25280 | 0 | 0 | 0 | 0 | 0 | 0 | 6160384 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097358.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931531433128 | 17931530826677 | 17931531999482 | 17931532001354 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7f6e9fb92180 | 0x7f6e9cc252c0 | 0 | 0 | 0 | 0 | 0 | 0 | 8126464 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194567.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931532597259 | 17931531999482 | 17931533262526 | 17931533264443 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7f6e9fb92000 | 0x7f6e9cc25300 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194571.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 8126464 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931533859808 | 17931533262526 | 17931534553410 | 17931534555321 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7f6e9d3fbe80 | 0x7f6e9cc25340 | 0 | 0 | 8126464 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097364.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931535150757 | 17931534553410 | 17931535729414 | 17931535731462 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7f6e9d3fbd00 | 0x7f6e9cc25380 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097346.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931536326058 | 17931535729414 | 17931536952138 | 17931536954092 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7f6e9d3fbb80 | 0x7f6e9cc253c0 | 0 | 0 | 0 | 0 | 0 | 0 | 6553600 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097360.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931537557087 | 17931536952138 | 17931538132943 | 17931538134973 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7f6e9d3fba00 | 0x7f6e9cc25400 | 0 | 0 | 0 | 0 | 0 | 0 | 8650752 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194575.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931538730908 | 17931538132943 | 17931539416147 | 17931539417951 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7f6e9d3fb880 | 0x7f6e9cc25440 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194578.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 8650752 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931540012337 | 17931539416147 | 17931540689271 | 17931540691100 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7f6e9d3fb700 | 0x7f6e9cc25480 | 0 | 0 | 8650752 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097364.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931541285685 | 17931540689271 | 17931541863195 | 17931541865161 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7f6e9fb92580 | 0x7f6e9cc254c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097336.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931542461496 | 17931541863195 | 17931543071999 | 17931543073901 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7f6e9fb92400 | 0x7f6e9cc25500 | 0 | 0 | 0 | 0 | 0 | 0 | 6946816 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097360.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931543676636 | 17931543071999 | 17931544244324 | 17931544246152 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7f6e9fb92280 | 0x7f6e9cc25540 | 0 | 0 | 0 | 0 | 0 | 0 | 9175040 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194559.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931544841427 | 17931544244324 | 17931545518408 | 17931545520351 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7f6e9fb92100 | 0x7f6e9cc25580 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194577.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 9175040 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931546116386 | 17931545518408 | 17931546798412 | 17931546800329 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7f6e9d3fbf80 | 0x7f6e9cc255c0 | 0 | 0 | 9175040 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097362.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931547394984 | 17931546798412 | 17931547992976 | 17931547994750 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7f6e9d3fbe00 | 0x7f6e9cc25600 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097342.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931548590135 | 17931547992976 | 17931549231701 | 17931549233739 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7f6e9d3fbc80 | 0x7f6e9cc25640 | 0 | 0 | 0 | 0 | 0 | 0 | 7340032 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097364.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931549837084 | 17931549231701 | 17931550560345 | 17931550562126 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7f6e9d3fbb00 | 0x7f6e9cc25680 | 0 | 0 | 0 | 0 | 0 | 0 | 9699328 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194573.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931551158042 | 17931550560345 | 17931551839870 | 17931551841815 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7f6e9d3fb980 | 0x7f6e9cc256c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194577.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 9699328 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931552436090 | 17931551839870 | 17931553116994 | 17931553118883 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7f6e9d3fb800 | 0x7f6e9cc25700 | 0 | 0 | 9699328 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097366.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931553713499 | 17931553116994 | 17931554314278 | 17931554316564 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7f6e9d3fb680 | 0x7f6e9cc25740 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097341.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931554912219 | 17931554314278 | 17931555538122 | 17931555540163 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7f6e9fb92500 | 0x7f6e9cc25780 | 0 | 0 | 0 | 0 | 0 | 0 | 8126464 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097365.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931556142889 | 17931555538122 | 17931556724366 | 17931556726204 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7f6e9fb92380 | 0x7f6e9cc257c0 | 0 | 0 | 0 | 0 | 0 | 0 | 10747904 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194607.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931557321530 | 17931556724119 | 17931558004122 | 17931558006153 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7f6e9fb92200 | 0x7f6e9cc25800 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194597.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 10747904 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931558602298 | 17931558004122 | 17931559300765 | 17931559302911 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7f6e9fb92080 | 0x7f6e9cc25840 | 0 | 0 | 10747904 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097361.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931559898526 | 17931559300765 | 17931560506529 | 17931560508851 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7f6e9d3fbf00 | 0x7f6e9cc25880 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097329.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931561105146 | 17931560506529 | 17931561747653 | 17931561749580 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7f6e9d3fbd80 | 0x7f6e9cc258c0 | 0 | 0 | 0 | 0 | 0 | 0 | 8912896 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097367.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931562354445 | 17931561747653 | 17931562940776 | 17931562943191 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7f6e9d3fbc00 | 0x7f6e9cc25900 | 0 | 0 | 0 | 0 | 0 | 0 | 11796480 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194603.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931563538616 | 17931562940776 | 17931564187980 | 17931564189970 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7f6e9d3fba80 | 0x7f6e9cc25940 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194591.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 11796480 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931564785335 | 17931564187980 | 17931565474224 | 17931565476378 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7f6e9d3fb900 | 0x7f6e9cc25980 | 0 | 0 | 11796480 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097357.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931566071644 | 17931565474224 | 17931566694868 | 17931566696898 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7f6e9d3fb780 | 0x7f6e9cc259c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097336.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931567292013 | 17931566694868 | 17931567959991 | 17931567961997 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7f6e9d3fb600 | 0x7f6e9cc25a00 | 0 | 0 | 0 | 0 | 0 | 0 | 9699328 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097368.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931568565802 | 17931567959991 | 17931569174235 | 17931569176507 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7f6e9fb92480 | 0x7f6e9cc25a40 | 0 | 0 | 0 | 0 | 0 | 0 | 12845056 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194602.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931569772022 | 17931569174235 | 17931570474879 | 17931570476895 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7f6e9fb92300 | 0x7f6e9cc25a80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194588.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 12845056 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931571073240 | 17931570474879 | 17931571772323 | 17931571774493 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7f6e9fb92180 | 0x7f6e9cc25ac0 | 0 | 0 | 12845056 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097341.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931572370728 | 17931571772323 | 17931572986887 | 17931572988863 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7f6e9fb92000 | 0x7f6e9cc25b00 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097334.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931573584468 | 17931572986887 | 17931574282410 | 17931574284721 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7f6e9d3fbe80 | 0x7f6e9cc25b40 | 0 | 0 | 0 | 0 | 0 | 0 | 11272192 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097361.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931574889296 | 17931574282410 | 17931575496174 | 17931575498251 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7f6e9d3fbd00 | 0x7f6e9cc25b80 | 0 | 0 | 0 | 0 | 0 | 0 | 14942208 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194650.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931576093206 | 17931575496174 | 17931576775058 | 17931576777109 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7f6e9d3fbb80 | 0x7f6e9cc25bc0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194618.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 14942208 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931577372395 | 17931576775058 | 17931578192502 | 17931578194994 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7f6e9d3fba00 | 0x7f6e9cc25c00 | 0 | 0 | 14942208 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097345.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931578790250 | 17931578192502 | 17931579403066 | 17931579405135 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7f6e9d3fb880 | 0x7f6e9cc25c40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097333.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931580000810 | 17931579403066 | 17931580705950 | 17931580772301 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7f6e9d3fb700 | 0x7f6e9cc25c80 | 0 | 0 | 0 | 0 | 0 | 0 | 12845056 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097359.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931581311688 | 17931580705950 | 17931581915873 | 17931581917973 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7f6e9fb92580 | 0x7f6e9cc25cc0 | 0 | 0 | 0 | 0 | 0 | 0 | 17039360 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194630.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931582514219 | 17931581915873 | 17931583195717 | 17931583199922 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7f6e9fb92400 | 0x7f6e9cc25d00 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194650.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 17039360 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931583793157 | 17931583195717 | 17931584492041 | 17931584495450 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7f6e9fb92280 | 0x7f6e9cc25d40 | 0 | 0 | 17039360 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097332.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931585088735 | 17931584492041 | 17931585731085 | 17931585733129 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7f6e9fb92100 | 0x7f6e9cc25d80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097343.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931586330864 | 17931585731085 | 17931587059409 | 17931587125825 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7f6e9d3fbf80 | 0x7f6e9cc25dc0 | 0 | 0 | 0 | 0 | 0 | 0 | 15990784 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097334.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931587666081 | 17931587059409 | 17931588302132 | 17931588304186 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7f6e9d3fbe00 | 0x7f6e9cc25e00 | 0 | 0 | 0 | 0 | 0 | 0 | 21233664 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194637.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931588900091 | 17931588302132 | 17931589600376 | 17931589604254 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7f6e9d3fbc80 | 0x7f6e9cc25e40 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194638.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 21233664 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931590198359 | 17931589600376 | 17931590891420 | 17931590957780 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7f6e9d3fbb00 | 0x7f6e9cc25e80 | 0 | 0 | 21233664 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097330.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931591488777 | 17931590891420 | 17931592157664 | 17931592159900 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7f6e9d3fb980 | 0x7f6e9cc25ec0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097358.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931592754706 | 17931592157664 | 17931593527108 | 17931593592905 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7f6e9d3fb800 | 0x7f6e9cc25f00 | 0 | 0 | 0 | 0 | 0 | 0 | 19136512 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097336.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931594134402 | 17931593527108 | 17931594792712 | 17931594795115 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7f6e9d3fb680 | 0x7f6e9cc25f40 | 0 | 0 | 0 | 0 | 0 | 0 | 25427968 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194635.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931595390441 | 17931594792712 | 17931596131116 | 17931596172121 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7f6e9fb92500 | 0x7f6e9cc25f80 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194617.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 25427968 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931596730138 | 17931596131116 | 17931597435120 | 17931597499649 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7f6e9fb92380 | 0x7f6e9cc25fc0 | 0 | 0 | 25427968 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097338.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931598032976 | 17931597435120 | 17931598744884 | 17931598749228 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7f6e9fb92200 | 0x7f6e9cc26000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097368.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931599342333 | 17931598744884 | 17931600182488 | 17931600247061 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7f6e9fb92080 | 0x7f6e9cc26040 | 0 | 0 | 0 | 0 | 0 | 0 | 22282240 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097351.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931600787878 | 17931600182488 | 17931601464092 | 17931601465971 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7f6e9d3fbf00 | 0x7f6e9cc26080 | 0 | 0 | 0 | 0 | 0 | 0 | 29622272 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194630.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931602061946 | 17931601464092 | 17931602801376 | 17931602865856 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7f6e9d3fbd80 | 0x7f6e9cc260c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194603.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 29622272 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931603398593 | 17931602801376 | 17931604125700 | 17931604167174 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7f6e9d3fbc00 | 0x7f6e9cc26100 | 0 | 0 | 29622272 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097361.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931604722900 | 17931604125700 | 17931605480264 | 17931605520101 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7f6e9d3fba80 | 0x7f6e9cc26140 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097376.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931606086757 | 17931605480264 | 17931606955148 | 17931606995814 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7f6e9d3fb900 | 0x7f6e9cc26180 | 0 | 0 | 0 | 0 | 0 | 0 | 25427968 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097342.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931607560800 | 17931606955148 | 17931608246192 | 17931608248343 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7f6e9d3fb780 | 0x7f6e9cc261c0 | 0 | 0 | 0 | 0 | 0 | 0 | 33816576 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194615.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931608844459 | 17931608246192 | 17931609611636 | 17931609676138 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7f6e9d3fb600 | 0x7f6e9cc26200 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194579.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 33816576 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931610209875 | 17931609611636 | 17931610958360 | 17931611022265 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7f6e9fb92480 | 0x7f6e9cc26240 | 0 | 0 | 33816576 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097364.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931611557032 | 17931610958360 | 17931612305884 | 17931612371252 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7f6e9fb92300 | 0x7f6e9cc26280 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097317.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931612903549 | 17931612305884 | 17931613820769 | 17931613866315 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7f6e9fb92180 | 0x7f6e9cc262c0 | 0 | 0 | 0 | 0 | 0 | 0 | 31719424 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097362.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931614427051 | 17931613820769 | 17931615158693 | 17931615200042 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7f6e9fb92000 | 0x7f6e9cc26300 | 0 | 0 | 0 | 0 | 0 | 0 | 42205184 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194603.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931615755938 | 17931615158693 | 17931616559977 | 17931616600717 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7f6e9d3fbe80 | 0x7f6e9cc26340 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194608.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 42205184 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931617156584 | 17931616559977 | 17931617946061 | 17931617986613 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7f6e9d3fbd00 | 0x7f6e9cc26380 | 0 | 0 | 42205184 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097325.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931618543039 | 17931617946061 | 17931619305905 | 17931619346270 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7f6e9d3fbb80 | 0x7f6e9cc263c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097324.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931619902566 | 17931619306204 | 17931620967809 | 17931621012118 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7f6e9d3fba00 | 0x7f6e9cc26400 | 0 | 0 | 0 | 0 | 0 | 0 | 38010880 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097361.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931621572975 | 17931620967809 | 17931622320133 | 17931622384395 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7f6e9d3fb880 | 0x7f6e9cc26440 | 0 | 0 | 0 | 0 | 0 | 0 | 50593792 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194613.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931622917472 | 17931622320133 | 17931623768938 | 17931623833069 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7f6e9d3fb700 | 0x7f6e9cc26480 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194628.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 50593792 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931624364546 | 17931623768938 | 17931625206383 | 17931625271104 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7f6e9fb92580 | 0x7f6e9cc264c0 | 0 | 0 | 50593792 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097337.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931625801801 | 17931625206383 | 17931626646708 | 17931626711539 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7f6e9fb92400 | 0x7f6e9cc26500 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097330.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931627244095 | 17931626646708 | 17931628401754 | 17931628442136 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7f6e9fb92280 | 0x7f6e9cc26540 | 0 | 0 | 0 | 0 | 0 | 0 | 67371008 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097334.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931629006942 | 17931628401754 | 17931629968640 | 17931630008287 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7f6e9fb92100 | 0x7f6e9cc26580 | 0 | 0 | 0 | 0 | 0 | 0 | 67371008 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194564.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931630567123 | 17931629968640 | 17931631527365 | 17931631573349 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7f6e9d3fbf80 | 0x7f6e9cc265c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194555.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 67371008 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931632125065 | 17931631527365 | 17931633089450 | 17931633153790 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7f6e9d3fbe00 | 0x7f6e9cc26600 | 0 | 0 | 67371008 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097335.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931633686256 | 17931633089450 | 17931634658096 | 17931634722531 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7f6e9d3fbc80 | 0x7f6e9cc26640 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097318.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931635254798 | 17931634658096 | 17931636619383 | 17931636683862 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7f6e9d3fbb00 | 0x7f6e9cc26680 | 0 | 0 | 0 | 0 | 0 | 0 | 134479872 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097328.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931637225489 | 17931636619383 | 17931638586269 | 17931638651434 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7f6e9d3fb980 | 0x7f6e9cc266c0 | 0 | 0 | 0 | 0 | 0 | 0 | 134479872 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194552.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931639184531 | 17931638586269 | 17931640539396 | 17931640581956 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7f6e9d3fb800 | 0x7f6e9cc26700 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194541.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 134479872 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931641136283 | 17931640539396 | 17931642509323 | 17931642575417 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7f6e9d3fb680 | 0x7f6e9cc26740 | 0 | 0 | 134479872 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097327.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931643105564 | 17931642509323 | 17931644479730 | 17931644544398 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7f6e9fb92500 | 0x7f6e9cc26780 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097316.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931645076035 | 17931644479730 | 17931647283580 | 17931647349139 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7f6e9fb92380 | 0x7f6e9cc267c0 | 0 | 0 | 0 | 0 | 0 | 0 | 268697600 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097324.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931647895496 | 17931647283580 | 17931650068549 | 17931650129161 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7f6e9fb92200 | 0x7f6e9cc26800 | 0 | 0 | 0 | 0 | 0 | 0 | 268697600 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194543.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931650666867 | 17931650068549 | 17931652892399 | 17931652957191 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7f6e9fb92080 | 0x7f6e9cc26840 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 4194304.0000000000 | 8388608.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 4194543.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 268697600 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931653489098 | 17931652892399 | 17931655726169 | 17931655794451 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7f6e9d3fbf00 | 0x7f6e9cc26880 | 0 | 0 | 268697600 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097332.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931656324888 | 17931655726169 | 17931658520898 | 17931658589382 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 241894 | 241894 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7f6e9d3fbd80 | 0x7f6e9cc268c0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 2097152.0000000000 | 2097152.0000000000 | 0.0000000000 | 0.0000000000 | 0.0000000000 | 2097315.0000000000 | 0.0000000000 | 0.0000000000 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0 | 0.0000000000 | 0 | 0 | 17931659117799 | 17931658520898 | 17931662975634 | 17931663048012 |