38 KiB
38 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | SQ_INSTS_LDS | SQ_INST_LEVEL_LDS | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 231235 | 231235 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7fa30bc04280 | 0 | 0 | 0 | 17723322357090 | 17722609008058 | 17723469569786 | 17723469683016 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 231235 | 231235 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7fa30bc23f80 | 0 | 0 | 0 | 17723474867387 | 17723469569786 | 17723474996356 | 17723475001123 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7fa3325bd380 | 0x7fa30bc23fc0 | 0 | 0 | 0 | 17723475036342 | 17723474996356 | 17723475368197 | 17723475370774 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7fa3325bd200 | 0x7fa30bc24000 | 0 | 0 | 0 | 17723475407493 | 17723475368197 | 17723475775878 | 17723475778044 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7fa3325bd080 | 0x7fa30bc24040 | 0 | 0 | 0 | 17723475810163 | 17723475775878 | 17723476171559 | 17723476173814 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7fa330143f00 | 0x7fa30bc24080 | 0 | 0 | 0 | 17723476207393 | 17723476171559 | 17723476476199 | 17723476478446 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7fa330143d80 | 0x7fa30bc240c0 | 0 | 0 | 0 | 17723476511006 | 17723476476199 | 17723476780040 | 17723476782239 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7fa330143c00 | 0x7fa30bc24100 | 0 | 0 | 0 | 17723476825498 | 17723476780040 | 17723477082760 | 17723477084991 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7fa330143a80 | 0x7fa30bc24140 | 0 | 0 | 0 | 17723477117380 | 17723477082760 | 17723477476041 | 17723477478451 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7fa330143900 | 0x7fa30bc24180 | 0 | 0 | 0 | 17723477509481 | 17723477476041 | 17723477866122 | 17723477868322 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7fa330143780 | 0x7fa30bc241c0 | 0 | 0 | 0 | 17723477899311 | 17723477866122 | 17723478193163 | 17723478195453 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7fa330143600 | 0x7fa30bc24200 | 0 | 0 | 0 | 17723478228143 | 17723478193163 | 17723478507083 | 17723478509176 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7fa3325bd480 | 0x7fa30bc24240 | 0 | 0 | 0 | 17723478548905 | 17723478507083 | 17723478810284 | 17723478812598 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7fa3325bd300 | 0x7fa30bc24280 | 0 | 0 | 0 | 17723478845807 | 17723478810284 | 17723479219245 | 17723479220748 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7fa3325bd180 | 0x7fa30bc242c0 | 0 | 0 | 0 | 17723479252647 | 17723479219245 | 17723479585805 | 17723479587518 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7fa3325bd000 | 0x7fa30bc24300 | 0 | 0 | 0 | 17723479618918 | 17723479585805 | 17723479863246 | 17723479864801 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7fa330143e80 | 0x7fa30bc24340 | 0 | 0 | 0 | 17723479896111 | 17723479863246 | 17723480141007 | 17723480142644 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7fa330143d00 | 0x7fa30bc24380 | 0 | 0 | 0 | 17723480181553 | 17723480141007 | 17723480417487 | 17723480419127 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7fa330143b80 | 0x7fa30bc243c0 | 0 | 0 | 0 | 17723480451757 | 17723480417487 | 17723480780368 | 17723480781928 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7fa330143a00 | 0x7fa30bc24400 | 0 | 0 | 0 | 17723480812718 | 17723480780368 | 17723481144849 | 17723481146319 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7fa330143880 | 0x7fa30bc24440 | 0 | 0 | 0 | 17723481176988 | 17723481144849 | 17723481428049 | 17723481429812 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7fa330143700 | 0x7fa30bc24480 | 0 | 0 | 0 | 17723481460871 | 17723481428049 | 17723481705490 | 17723481707055 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7fa3325bd580 | 0x7fa30bc244c0 | 0 | 0 | 0 | 17723481745974 | 17723481705490 | 17723481982130 | 17723481983828 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7fa3325bd400 | 0x7fa30bc24500 | 0 | 0 | 0 | 17723482014977 | 17723481982130 | 17723482354611 | 17723482356409 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7fa3325bd280 | 0x7fa30bc24540 | 0 | 0 | 0 | 17723482388088 | 17723482354611 | 17723482725172 | 17723482726969 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7fa3325bd100 | 0x7fa30bc24580 | 0 | 0 | 0 | 17723482758599 | 17723482725172 | 17723483003412 | 17723483005032 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7fa330143f80 | 0x7fa30bc245c0 | 0 | 0 | 0 | 17723483036082 | 17723483003412 | 17723483280053 | 17723483281576 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7fa330143e00 | 0x7fa30bc24600 | 0 | 0 | 0 | 17723483319545 | 17723483280053 | 17723483557173 | 17723483558869 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7fa330143c80 | 0x7fa30bc24640 | 0 | 0 | 0 | 17723483589958 | 17723483557173 | 17723483920534 | 17723483922120 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7fa330143b00 | 0x7fa30bc24680 | 0 | 0 | 0 | 17723483953719 | 17723483920534 | 17723484284535 | 17723484286200 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7fa330143980 | 0x7fa30bc246c0 | 0 | 0 | 0 | 17723484318270 | 17723484284535 | 17723484566295 | 17723484567923 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7fa330143800 | 0x7fa30bc24700 | 0 | 0 | 0 | 17723484599153 | 17723484566295 | 17723484844376 | 17723484845936 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7fa330143680 | 0x7fa30bc24740 | 0 | 0 | 0 | 17723484883755 | 17723484844376 | 17723485127097 | 17723485128699 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7fa3325bd500 | 0x7fa30bc24780 | 0 | 0 | 0 | 17723485159699 | 17723485127097 | 17723485492857 | 17723485494470 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7fa3325bd380 | 0x7fa30bc247c0 | 0 | 0 | 0 | 17723485526729 | 17723485492857 | 17723485858618 | 17723485860251 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7fa3325bd200 | 0x7fa30bc24800 | 0 | 0 | 0 | 17723485891680 | 17723485858618 | 17723486132539 | 17723486134314 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7fa3325bd080 | 0x7fa30bc24840 | 0 | 0 | 0 | 17723486166723 | 17723486132539 | 17723486413499 | 17723486415147 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7fa330143f00 | 0x7fa30bc24880 | 0 | 0 | 0 | 17723486453816 | 17723486413499 | 17723486691580 | 17723486693160 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7fa330143d80 | 0x7fa30bc248c0 | 0 | 0 | 0 | 17723486724059 | 17723486691580 | 17723487057020 | 17723487058561 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7fa330143c00 | 0x7fa30bc24900 | 0 | 0 | 0 | 17723487090280 | 17723487057020 | 17723487434461 | 17723487436231 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7fa330143a80 | 0x7fa30bc24940 | 0 | 0 | 0 | 17723487467301 | 17723487434461 | 17723487714782 | 17723487716364 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7fa330143900 | 0x7fa30bc24980 | 0 | 0 | 0 | 17723487748204 | 17723487714782 | 17723487992702 | 17723487994297 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7fa330143780 | 0x7fa30bc249c0 | 0 | 0 | 0 | 17723488032306 | 17723487992702 | 17723488268223 | 17723488269820 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7fa330143600 | 0x7fa30bc24a00 | 0 | 0 | 0 | 17723488300800 | 17723488268223 | 17723488633824 | 17723488635541 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7fa3325bd480 | 0x7fa30bc24a40 | 0 | 0 | 0 | 17723488667260 | 17723488633824 | 17723488998784 | 17723489000372 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7fa3325bd300 | 0x7fa30bc24a80 | 0 | 0 | 0 | 17723489031461 | 17723488998784 | 17723489276865 | 17723489278485 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7fa3325bd180 | 0x7fa30bc24ac0 | 0 | 0 | 0 | 17723489310664 | 17723489276865 | 17723489552865 | 17723489554548 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7fa3325bd000 | 0x7fa30bc24b00 | 0 | 0 | 0 | 17723489593327 | 17723489552865 | 17723489831266 | 17723489832831 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7fa330143e80 | 0x7fa30bc24b40 | 0 | 0 | 0 | 17723489863550 | 17723489831266 | 17723490197507 | 17723490199202 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7fa330143d00 | 0x7fa30bc24b80 | 0 | 0 | 0 | 17723490231021 | 17723490197507 | 17723490571427 | 17723490573113 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7fa330143b80 | 0x7fa30bc24bc0 | 0 | 0 | 0 | 17723490604152 | 17723490571427 | 17723490855428 | 17723490856985 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7fa330143a00 | 0x7fa30bc24c00 | 0 | 0 | 0 | 17723490888775 | 17723490855428 | 17723491133349 | 17723491135068 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7fa330143880 | 0x7fa30bc24c40 | 0 | 0 | 0 | 17723491173448 | 17723491133349 | 17723491413509 | 17723491415061 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7fa330143700 | 0x7fa30bc24c80 | 0 | 0 | 0 | 17723491445501 | 17723491413509 | 17723491776870 | 17723491778422 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7fa3325bd580 | 0x7fa30bc24cc0 | 0 | 0 | 0 | 17723491809652 | 17723491776870 | 17723492145991 | 17723492147683 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7fa3325bd400 | 0x7fa30bc24d00 | 0 | 0 | 0 | 17723492179482 | 17723492145991 | 17723492423431 | 17723492424956 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7fa3325bd280 | 0x7fa30bc24d40 | 0 | 0 | 0 | 17723492455985 | 17723492423431 | 17723492706632 | 17723492708079 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7fa3325bd100 | 0x7fa30bc24d80 | 0 | 0 | 0 | 17723492746368 | 17723492706632 | 17723492985192 | 17723492986772 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7fa330143f80 | 0x7fa30bc24dc0 | 0 | 0 | 0 | 17723493018541 | 17723492985192 | 17723493354953 | 17723493356433 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7fa330143e00 | 0x7fa30bc24e00 | 0 | 0 | 0 | 17723493387642 | 17723493354953 | 17723493717994 | 17723493719444 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7fa330143c80 | 0x7fa30bc24e40 | 0 | 0 | 0 | 17723493751023 | 17723493717994 | 17723494000074 | 17723494001727 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7fa330143b00 | 0x7fa30bc24e80 | 0 | 0 | 0 | 17723494033066 | 17723494000074 | 17723494304395 | 17723494305929 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7fa330143980 | 0x7fa30bc24ec0 | 0 | 0 | 0 | 17723494345288 | 17723494304395 | 17723494583116 | 17723494584752 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7fa330143800 | 0x7fa30bc24f00 | 0 | 0 | 0 | 17723494615551 | 17723494583116 | 17723494947596 | 17723494949113 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7fa330143680 | 0x7fa30bc24f40 | 0 | 0 | 0 | 17723494980792 | 17723494947596 | 17723495309837 | 17723495311374 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7fa3325bd500 | 0x7fa30bc24f80 | 0 | 0 | 0 | 17723495342033 | 17723495309837 | 17723495586638 | 17723495588277 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7fa3325bd380 | 0x7fa30bc24fc0 | 0 | 0 | 0 | 17723495619406 | 17723495586638 | 17723495877358 | 17723495878910 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7fa3325bd200 | 0x7fa30bc25000 | 0 | 0 | 0 | 17723495917429 | 17723495877358 | 17723496164879 | 17723496166573 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7fa3325bd080 | 0x7fa30bc25040 | 0 | 0 | 0 | 17723496198942 | 17723496164879 | 17723496535599 | 17723496537213 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7fa330143f00 | 0x7fa30bc25080 | 0 | 0 | 0 | 17723496569423 | 17723496535599 | 17723496901360 | 17723496903094 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7fa330143d80 | 0x7fa30bc250c0 | 0 | 0 | 0 | 17723496934053 | 17723496901360 | 17723497181201 | 17723497182877 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7fa330143c00 | 0x7fa30bc25100 | 0 | 0 | 0 | 17723497213446 | 17723497181201 | 17723497477841 | 17723497479350 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7fa330143a80 | 0x7fa30bc25140 | 0 | 0 | 0 | 17723497529899 | 17723497477841 | 17723497756882 | 17723497758793 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7fa330143900 | 0x7fa30bc25180 | 0 | 0 | 0 | 17723497789842 | 17723497756882 | 17723498129843 | 17723498131783 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7fa330143780 | 0x7fa30bc251c0 | 0 | 0 | 0 | 17723498163333 | 17723498129843 | 17723498498963 | 17723498500484 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7fa330143600 | 0x7fa30bc25200 | 0 | 0 | 0 | 17723498532183 | 17723498498963 | 17723498779124 | 17723498780677 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7fa3325bd480 | 0x7fa30bc25240 | 0 | 0 | 0 | 17723498811806 | 17723498779124 | 17723499082645 | 17723499084139 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7fa3325bd300 | 0x7fa30bc25280 | 0 | 0 | 0 | 17723499123338 | 17723499082645 | 17723499368405 | 17723499369982 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7fa3325bd180 | 0x7fa30bc252c0 | 0 | 0 | 0 | 17723499401771 | 17723499368405 | 17723499735606 | 17723499737263 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7fa3325bd000 | 0x7fa30bc25300 | 0 | 0 | 0 | 17723499768102 | 17723499735606 | 17723500099287 | 17723500100794 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7fa330143e80 | 0x7fa30bc25340 | 0 | 0 | 0 | 17723500132313 | 17723500099287 | 17723500379607 | 17723500381167 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7fa330143d00 | 0x7fa30bc25380 | 0 | 0 | 0 | 17723500412226 | 17723500379607 | 17723500693208 | 17723500694659 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7fa330143b80 | 0x7fa30bc253c0 | 0 | 0 | 0 | 17723500733328 | 17723500693208 | 17723500975128 | 17723500976692 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7fa330143a00 | 0x7fa30bc25400 | 0 | 0 | 0 | 17723501007901 | 17723500975128 | 17723501339769 | 17723501341483 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7fa330143880 | 0x7fa30bc25440 | 0 | 0 | 0 | 17723501372432 | 17723501339769 | 17723501702650 | 17723501704204 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7fa330143700 | 0x7fa30bc25480 | 0 | 0 | 0 | 17723501736183 | 17723501702650 | 17723501981210 | 17723501982856 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7fa3325bd580 | 0x7fa30bc254c0 | 0 | 0 | 0 | 17723502014076 | 17723501981210 | 17723502303611 | 17723502305498 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7fa3325bd400 | 0x7fa30bc25500 | 0 | 0 | 0 | 17723502344357 | 17723502303611 | 17723502590812 | 17723502592391 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7fa3325bd280 | 0x7fa30bc25540 | 0 | 0 | 0 | 17723502623440 | 17723502590812 | 17723502953212 | 17723502954782 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7fa3325bd100 | 0x7fa30bc25580 | 0 | 0 | 0 | 17723502986561 | 17723502953212 | 17723503315453 | 17723503317063 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7fa330143f80 | 0x7fa30bc255c0 | 0 | 0 | 0 | 17723503347782 | 17723503315453 | 17723503593534 | 17723503595156 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7fa330143e00 | 0x7fa30bc25600 | 0 | 0 | 0 | 17723503626505 | 17723503593534 | 17723503918174 | 17723503919668 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7fa330143c80 | 0x7fa30bc25640 | 0 | 0 | 0 | 17723503958067 | 17723503918174 | 17723504207295 | 17723504208931 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7fa330143b00 | 0x7fa30bc25680 | 0 | 0 | 0 | 17723504240080 | 17723504207295 | 17723504572416 | 17723504573992 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7fa330143980 | 0x7fa30bc256c0 | 0 | 0 | 0 | 17723504605271 | 17723504572416 | 17723504935136 | 17723504936663 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7fa330143800 | 0x7fa30bc25700 | 0 | 0 | 0 | 17723504968222 | 17723504935136 | 17723505213537 | 17723505215096 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7fa330143680 | 0x7fa30bc25740 | 0 | 0 | 0 | 17723505246665 | 17723505213537 | 17723505545858 | 17723505547467 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7fa3325bd500 | 0x7fa30bc25780 | 0 | 0 | 0 | 17723505586476 | 17723505545858 | 17723505825058 | 17723505826690 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7fa3325bd380 | 0x7fa30bc257c0 | 0 | 0 | 0 | 17723505858300 | 17723505825058 | 17723506190179 | 17723506192021 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7fa3325bd200 | 0x7fa30bc25800 | 0 | 0 | 0 | 17723506224700 | 17723506190179 | 17723506558660 | 17723506560152 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7fa3325bd080 | 0x7fa30bc25840 | 0 | 0 | 0 | 17723506590691 | 17723506558660 | 17723506841700 | 17723506843275 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7fa330143f00 | 0x7fa30bc25880 | 0 | 0 | 0 | 17723506875984 | 17723506841700 | 17723507178981 | 17723507180666 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7fa330143d80 | 0x7fa30bc258c0 | 0 | 0 | 0 | 17723507219726 | 17723507178981 | 17723507457061 | 17723507458620 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7fa330143c00 | 0x7fa30bc25900 | 0 | 0 | 0 | 17723507488699 | 17723507457061 | 17723507820262 | 17723507821920 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7fa330143a80 | 0x7fa30bc25940 | 0 | 0 | 0 | 17723507853190 | 17723507820262 | 17723508183623 | 17723508185201 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7fa330143900 | 0x7fa30bc25980 | 0 | 0 | 0 | 17723508216001 | 17723508183623 | 17723508474183 | 17723508475804 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7fa330143780 | 0x7fa30bc259c0 | 0 | 0 | 0 | 17723508506823 | 17723508474183 | 17723508832104 | 17723508833745 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7fa330143600 | 0x7fa30bc25a00 | 0 | 0 | 0 | 17723508872394 | 17723508832104 | 17723509112585 | 17723509114198 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7fa3325bd480 | 0x7fa30bc25a40 | 0 | 0 | 0 | 17723509145087 | 17723509112585 | 17723509475625 | 17723509477169 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7fa3325bd300 | 0x7fa30bc25a80 | 0 | 0 | 0 | 17723509508978 | 17723509475625 | 17723509838986 | 17723509840620 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7fa3325bd180 | 0x7fa30bc25ac0 | 0 | 0 | 0 | 17723509871879 | 17723509838986 | 17723510132587 | 17723510134343 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7fa3325bd000 | 0x7fa30bc25b00 | 0 | 0 | 0 | 17723510165782 | 17723510132587 | 17723510500907 | 17723510502483 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7fa330143e80 | 0x7fa30bc25b40 | 0 | 0 | 0 | 17723510541872 | 17723510500907 | 17723510787948 | 17723510789506 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7fa330143d00 | 0x7fa30bc25b80 | 0 | 0 | 0 | 17723510820035 | 17723510787948 | 17723511157709 | 17723511159337 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7fa330143b80 | 0x7fa30bc25bc0 | 0 | 0 | 0 | 17723511190916 | 17723511157709 | 17723511520750 | 17723511522438 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7fa330143a00 | 0x7fa30bc25c00 | 0 | 0 | 0 | 17723511552477 | 17723511520750 | 17723511834830 | 17723511836510 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7fa330143880 | 0x7fa30bc25c40 | 0 | 0 | 0 | 17723511867659 | 17723511834830 | 17723512224911 | 17723512247579 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7fa330143700 | 0x7fa30bc25c80 | 0 | 0 | 0 | 17723512267349 | 17723512224911 | 17723512529072 | 17723512530752 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7fa3325bd580 | 0x7fa30bc25cc0 | 0 | 0 | 0 | 17723512561471 | 17723512529072 | 17723512894032 | 17723512895773 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7fa3325bd400 | 0x7fa30bc25d00 | 0 | 0 | 0 | 17723512927052 | 17723512894032 | 17723513260113 | 17723513261764 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7fa3325bd280 | 0x7fa30bc25d40 | 0 | 0 | 0 | 17723513292603 | 17723513260113 | 17723513578834 | 17723513580416 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7fa3325bd100 | 0x7fa30bc25d80 | 0 | 0 | 0 | 17723513612445 | 17723513578834 | 17723513996754 | 17723514014885 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7fa330143f80 | 0x7fa30bc25dc0 | 0 | 0 | 0 | 17723514037094 | 17723513996754 | 17723514327635 | 17723514329327 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7fa330143e00 | 0x7fa30bc25e00 | 0 | 0 | 0 | 17723514360666 | 17723514327635 | 17723514712596 | 17723514737427 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7fa330143c80 | 0x7fa30bc25e40 | 0 | 0 | 0 | 17723514749167 | 17723514712596 | 17723515104917 | 17723515128257 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7fa330143b00 | 0x7fa30bc25e80 | 0 | 0 | 0 | 17723515139607 | 17723515104917 | 17723515469237 | 17723515470928 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7fa330143980 | 0x7fa30bc25ec0 | 0 | 0 | 0 | 17723515502548 | 17723515469237 | 17723515939158 | 17723515960216 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7fa330143800 | 0x7fa30bc25f00 | 0 | 0 | 0 | 17723515979016 | 17723515939158 | 17723516284439 | 17723516285988 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7fa330143680 | 0x7fa30bc25f40 | 0 | 0 | 0 | 17723516317097 | 17723516284439 | 17723516677880 | 17723516694728 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7fa3325bd500 | 0x7fa30bc25f80 | 0 | 0 | 0 | 17723516712227 | 17723516677880 | 17723517074521 | 17723517092738 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7fa3325bd380 | 0x7fa30bc25fc0 | 0 | 0 | 0 | 17723517108048 | 17723517074521 | 17723517453721 | 17723517455489 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7fa3325bd200 | 0x7fa30bc26000 | 0 | 0 | 0 | 17723517487638 | 17723517453721 | 17723517973882 | 17723517992095 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7fa3325bd080 | 0x7fa30bc26040 | 0 | 0 | 0 | 17723518015095 | 17723517973882 | 17723518338683 | 17723518340267 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7fa330143f00 | 0x7fa30bc26080 | 0 | 0 | 0 | 17723518372916 | 17723518338683 | 17723518754844 | 17723518776096 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7fa330143d80 | 0x7fa30bc260c0 | 0 | 0 | 0 | 17723518786935 | 17723518754844 | 17723519188925 | 17723519210225 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7fa330143c00 | 0x7fa30bc26100 | 0 | 0 | 0 | 17723519221924 | 17723519188925 | 17723519596766 | 17723519614555 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7fa330143a80 | 0x7fa30bc26140 | 0 | 0 | 0 | 17723519629874 | 17723519596766 | 17723520173727 | 17723520191360 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7fa330143900 | 0x7fa30bc26180 | 0 | 0 | 0 | 17723520214019 | 17723520173727 | 17723520549568 | 17723520551121 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7fa330143780 | 0x7fa30bc261c0 | 0 | 0 | 0 | 17723520581930 | 17723520549568 | 17723520993569 | 17723521010489 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7fa330143600 | 0x7fa30bc26200 | 0 | 0 | 0 | 17723521027159 | 17723520993569 | 17723521428929 | 17723521447398 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7fa3325bd480 | 0x7fa30bc26240 | 0 | 0 | 0 | 17723521462288 | 17723521428929 | 17723521857090 | 17723521874308 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7fa3325bd300 | 0x7fa30bc26280 | 0 | 0 | 0 | 17723521890497 | 17723521857090 | 17723522498052 | 17723522520681 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7fa3325bd180 | 0x7fa30bc262c0 | 0 | 0 | 0 | 17723522540151 | 17723522498052 | 17723522923172 | 17723522946671 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7fa3325bd000 | 0x7fa30bc26300 | 0 | 0 | 0 | 17723522958331 | 17723522923172 | 17723523418213 | 17723523438889 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7fa330143e80 | 0x7fa30bc26340 | 0 | 0 | 0 | 17723523450448 | 17723523418213 | 17723523913574 | 17723523930656 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7fa330143d00 | 0x7fa30bc26380 | 0 | 0 | 0 | 17723523946096 | 17723523913574 | 17723524401735 | 17723524420524 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7fa330143b80 | 0x7fa30bc263c0 | 0 | 0 | 0 | 17723524435424 | 17723524401735 | 17723525148937 | 17723525166405 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7fa330143a00 | 0x7fa30bc26400 | 0 | 0 | 0 | 17723525190375 | 17723525148937 | 17723525608618 | 17723525624834 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7fa330143880 | 0x7fa30bc26440 | 0 | 0 | 0 | 17723525641693 | 17723525608618 | 17723526147179 | 17723526171700 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7fa330143700 | 0x7fa30bc26480 | 0 | 0 | 0 | 17723526183740 | 17723526147179 | 17723526698220 | 17723526716207 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7fa3325bd580 | 0x7fa30bc264c0 | 0 | 0 | 0 | 17723526730686 | 17723526698220 | 17723527236621 | 17723527253733 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7fa3325bd400 | 0x7fa30bc26500 | 0 | 0 | 0 | 17723527270013 | 17723527236621 | 17723528083183 | 17723528100402 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7fa3325bd280 | 0x7fa30bc26540 | 0 | 0 | 0 | 17723528124241 | 17723528083183 | 17723528718224 | 17723528735396 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7fa3325bd100 | 0x7fa30bc26580 | 0 | 0 | 0 | 17723528751216 | 17723528718224 | 17723529370385 | 17723529387690 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7fa330143f80 | 0x7fa30bc265c0 | 0 | 0 | 0 | 17723529403549 | 17723529370385 | 17723530025427 | 17723530042183 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7fa330143e00 | 0x7fa30bc26600 | 0 | 0 | 0 | 17723530058163 | 17723530025427 | 17723530666868 | 17723530687707 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7fa330143c80 | 0x7fa30bc26640 | 0 | 0 | 0 | 17723530699667 | 17723530666868 | 17723531727190 | 17723531745660 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7fa330143b00 | 0x7fa30bc26680 | 0 | 0 | 0 | 17723531767190 | 17723531727091 | 17723532785813 | 17723532834153 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7fa330143980 | 0x7fa30bc266c0 | 0 | 0 | 0 | 17723532845733 | 17723532785813 | 17723533910454 | 17723533975274 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7fa330143800 | 0x7fa30bc26700 | 0 | 0 | 0 | 17723533987714 | 17723533910454 | 17723535049017 | 17723535116886 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7fa330143680 | 0x7fa30bc26740 | 0 | 0 | 0 | 17723535129265 | 17723535049017 | 17723536167899 | 17723536233958 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7fa3325bd500 | 0x7fa30bc26780 | 0 | 0 | 0 | 17723536245908 | 17723536167899 | 17723538119102 | 17723538189509 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7fa3325bd380 | 0x7fa30bc267c0 | 0 | 0 | 0 | 17723538209718 | 17723538119102 | 17723540046466 | 17723540119101 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7fa3325bd200 | 0x7fa30bc26800 | 0 | 0 | 0 | 17723540130700 | 17723540046466 | 17723542043909 | 17723542124041 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7fa3325bd080 | 0x7fa30bc26840 | 0 | 0 | 0 | 17723542136650 | 17723542043909 | 17723544032073 | 17723544101401 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7fa330143f00 | 0x7fa30bc26880 | 0 | 0 | 0 | 17723544113960 | 17723544032073 | 17723545969036 | 17723546036092 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 231235 | 231235 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7fa330143d80 | 0x7fa30bc268c0 | 0 | 0 | 0 | 17723546048142 | 17723545969036 | 17723549595763 | 17723549672401 |