39 KiB
39 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBuffer.kd | 0 | 0 | 0 | 868283 | 868288 | 33554432 | 256 | 0 | 0 | 8 | 32 | 6464 | 0x0 | 0x7f5a48204180 | 12075279053950779 | 12075279053995252 | 12075279054317649 | 12075279054425581 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 868283 | 868288 | 32768 | 256 | 0 | 0 | 24 | 24 | 12480 | 0x0 | 0x7f5a48235100 | 12075279069097283 | 12075279069200263 | 12075279069206983 | 12075279069213048 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 4 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 12928 | 0x7f5b53d76900 | 0x7f5a48235140 | 12075279069257901 | 12075279069270663 | 12075279069401861 | 12075279069405856 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 6 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 36 | 24 | 13632 | 0x7f5b53d76800 | 0x7f5a48235180 | 12075279069449257 | 12075279069462821 | 12075279069708258 | 12075279069804848 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 8 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 14080 | 0x7f5b53d76700 | 0x7f5a482351c0 | 12075279069832469 | 12075279069843777 | 12075279070090815 | 12075279070189262 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 10 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14528 | 0x7f5b53d76600 | 0x7f5a48235200 | 12075279070216092 | 12075279070227773 | 12075279070353052 | 12075279070356743 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 12 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14976 | 0x7f5b53d76500 | 0x7f5a48235240 | 12075279070384525 | 12075279070395772 | 12075279070521211 | 12075279070524825 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 14 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 15424 | 0x7f5b53d76400 | 0x7f5a48235280 | 12075279070581621 | 12075279070598810 | 12075279070722489 | 12075279070725869 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 16 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16128 | 0x7f5b53d76300 | 0x7f5a482352c0 | 12075279070754442 | 12075279070767448 | 12075279071013686 | 12075279071110694 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 18 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16832 | 0x7f5b53d76a00 | 0x7f5a48235300 | 12075279071133787 | 12075279071146005 | 12075279071392562 | 12075279071489167 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 20 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 17536 | 0x7f5b53d76900 | 0x7f5a48235340 | 12075279071516218 | 12075279071527441 | 12075279071652080 | 12075279071655767 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 22 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18240 | 0x7f5b53d76800 | 0x7f5a48235380 | 12075279071686885 | 12075279071698959 | 12075279071823918 | 12075279071827466 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 24 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18944 | 0x7f5b53d76700 | 0x7f5a482353c0 | 12075279071871478 | 12075279071883277 | 12075279072007756 | 12075279072013982 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 26 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 19904 | 0x7f5b53d76600 | 0x7f5a48235400 | 12075279072044429 | 12075279072055916 | 12075279072309993 | 12075279072381876 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 28 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 20608 | 0x7f5b53d76500 | 0x7f5a48235440 | 12075279072404719 | 12075279072416392 | 12075279072661030 | 12075279072728129 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 30 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 21312 | 0x7f5b53d76400 | 0x7f5a48235480 | 12075279072750461 | 12075279072762309 | 12075279072887108 | 12075279072890431 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 32 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22016 | 0x7f5b53d76300 | 0x7f5a482354c0 | 12075279072918593 | 12075279072929827 | 12075279073054626 | 12075279073058123 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 34 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22720 | 0x7f5b53d76a00 | 0x7f5a48235500 | 12075279073095853 | 12075279073107266 | 12075279073231744 | 12075279073235092 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 36 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 23680 | 0x7f5b53d76900 | 0x7f5a48235540 | 12075279073262122 | 12075279073276864 | 12075279073564381 | 12075279073630266 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 38 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 24384 | 0x7f5b53d76800 | 0x7f5a48235580 | 12075279073651565 | 12075279073665500 | 12075279073916218 | 12075279073982070 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 40 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25088 | 0x7f5b53d76700 | 0x7f5a482355c0 | 12075279074008909 | 12075279074021497 | 12075279074146455 | 12075279074149681 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 42 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25792 | 0x7f5b53d76600 | 0x7f5a48235600 | 12075279074177913 | 12075279074189495 | 12075279074315094 | 12075279074318424 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 44 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 26496 | 0x7f5b53d76500 | 0x7f5a48235640 | 12075279074356145 | 12075279074368853 | 12075279074493332 | 12075279074496736 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 46 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 27712 | 0x7f5b53d76400 | 0x7f5a48235680 | 12075279074523996 | 12075279074535572 | 12075279074779889 | 12075279074846135 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 48 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 28416 | 0x7f5b53d76300 | 0x7f5a482356c0 | 12075279074867485 | 12075279074879248 | 12075279075127726 | 12075279075223977 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 50 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 29120 | 0x7f5b53d76a00 | 0x7f5a48235700 | 12075279075245327 | 12075279075256365 | 12075279075381004 | 12075279075384596 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 52 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30080 | 0x7f5b53d76900 | 0x7f5a48235740 | 12075279075411405 | 12075279075423083 | 12075279075548042 | 12075279075551546 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 54 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30784 | 0x7f5b53d76800 | 0x7f5a48235780 | 12075279075588755 | 12075279075606281 | 12075279075730920 | 12075279075734446 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 56 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32000 | 0x7f5b53d76700 | 0x7f5a482357c0 | 12075279075760995 | 12075279075773320 | 12075279076020357 | 12075279076092491 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 58 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32960 | 0x7f5b53d76600 | 0x7f5a48235800 | 12075279076116676 | 12075279076127876 | 12075279076373634 | 12075279076451508 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 60 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 33920 | 0x7f5b53d76500 | 0x7f5a48235840 | 12075279076473549 | 12075279076484993 | 12075279076609792 | 12075279076613429 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 62 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 34880 | 0x7f5b53d76400 | 0x7f5a48235880 | 12075279076641701 | 12075279076653151 | 12075279076779230 | 12075279076782723 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 64 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 35840 | 0x7f5b53d76300 | 0x7f5a482358c0 | 12075279076818850 | 12075279076831709 | 12075279076956508 | 12075279076959482 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 66 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 37312 | 0x7f5b53d76a00 | 0x7f5a48235900 | 12075279076986031 | 12075279076998748 | 12075279077246905 | 12075279077307869 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 68 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 38272 | 0x7f5b53d76900 | 0x7f5a48235940 | 12075279077330261 | 12075279077343865 | 12075279077588982 | 12075279077644575 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 70 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 39232 | 0x7f5b53d76800 | 0x7f5a48235980 | 12075279077667197 | 12075279077679381 | 12075279077804020 | 12075279077807648 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 72 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 40192 | 0x7f5b53d76700 | 0x7f5a482359c0 | 12075279077834428 | 12075279077847540 | 12075279077973138 | 12075279077976371 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 74 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 41152 | 0x7f5b53d76600 | 0x7f5a48235a00 | 12075279078018079 | 12075279078029938 | 12075279078154097 | 12075279078157418 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 76 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 42624 | 0x7f5b53d76500 | 0x7f5a48235a40 | 12075279078182945 | 12075279078197456 | 12075279078446414 | 12075279078475980 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 78 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 43584 | 0x7f5b53d76400 | 0x7f5a48235a80 | 12075279078498041 | 12075279078510413 | 12075279078758251 | 12075279078782239 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 80 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 44544 | 0x7f5b53d76300 | 0x7f5a48235ac0 | 12075279078803198 | 12075279078816170 | 12075279078940649 | 12075279078943819 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 82 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 45760 | 0x7f5b53d76a00 | 0x7f5a48235b00 | 12075279078969837 | 12075279078982729 | 12075279079108647 | 12075279079112012 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 84 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 46720 | 0x7f5b53d76900 | 0x7f5a48235b40 | 12075279079154240 | 12075279079168007 | 12075279079293126 | 12075279079296444 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 86 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 48448 | 0x7f5b53d76800 | 0x7f5a48235b80 | 12075279079322984 | 12075279079335685 | 12075279079591363 | 12075279079610838 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 88 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 49408 | 0x7f5b53d76700 | 0x7f5a48235bc0 | 12075279079633200 | 12075279079646242 | 12075279079890080 | 12075279079909694 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 90 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 50368 | 0x7f5b53d76600 | 0x7f5a48235c00 | 12075279079929731 | 12075279079941599 | 12075279080065918 | 12075279080069420 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 92 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 51584 | 0x7f5b53d76500 | 0x7f5a48235c40 | 12075279080098454 | 12075279080109918 | 12075279080236157 | 12075279080239316 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 94 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 52544 | 0x7f5b53d76400 | 0x7f5a48235c80 | 12075279080276565 | 12075279080288156 | 12075279080413115 | 12075279080416385 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 96 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 54272 | 0x7f5b53d76300 | 0x7f5a48235cc0 | 12075279080443646 | 12075279080457594 | 12075279080710872 | 12075279080738023 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 98 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 55488 | 0x7f5b53d76a00 | 0x7f5a48235d00 | 12075279080760134 | 12075279080772791 | 12075279081016469 | 12075279081044212 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 100 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 56704 | 0x7f5b53d76900 | 0x7f5a48235d40 | 12075279081068838 | 12075279081082388 | 12075279081207347 | 12075279081210631 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 102 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 58176 | 0x7f5b53d76800 | 0x7f5a48235d80 | 12075279081236629 | 12075279081248947 | 12075279081377265 | 12075279081380467 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 104 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 59392 | 0x7f5b53d76700 | 0x7f5a48235dc0 | 12075279081416484 | 12075279081429585 | 12075279081554224 | 12075279081557566 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 106 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 61376 | 0x7f5b53d76600 | 0x7f5a48235e00 | 12075279081585207 | 12075279081599343 | 12075279081855981 | 12075279081878702 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 108 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 62592 | 0x7f5b53d76500 | 0x7f5a48235e40 | 12075279081900273 | 12075279081912780 | 12075279082197258 | 12075279082231308 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 110 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 63808 | 0x7f5b53d76400 | 0x7f5a48235e80 | 12075279082254431 | 12075279082267017 | 12075279082392456 | 12075279082396084 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 112 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 65280 | 0x7f5b53d76300 | 0x7f5a48235ec0 | 12075279082422343 | 12075279082435815 | 12075279082563494 | 12075279082567041 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 114 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 66496 | 0x7f5b53d76a00 | 0x7f5a48235f00 | 12075279082604521 | 12075279082617093 | 12075279082741892 | 12075279082745222 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 116 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 68480 | 0x7f5b53d76900 | 0x7f5a48235f40 | 12075279082770870 | 12075279082784612 | 12075279083039009 | 12075279083062121 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 118 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 69696 | 0x7f5b53d76800 | 0x7f5a48235f80 | 12075279083084653 | 12075279083097569 | 12075279083342526 | 12075279083368350 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 120 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 70912 | 0x7f5b53d76700 | 0x7f5a48235fc0 | 12075279083389810 | 12075279083400926 | 12075279083525885 | 12075279083529059 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 122 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 72384 | 0x7f5b53d76600 | 0x7f5a48236000 | 12075279083555438 | 12075279083568604 | 12075279083703963 | 12075279083707390 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 124 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 73600 | 0x7f5b53d76500 | 0x7f5a48236040 | 12075279083743427 | 12075279083755962 | 12075279083880121 | 12075279083883427 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 126 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 75840 | 0x7f5b53d76400 | 0x7f5a48236080 | 12075279083909776 | 12075279083923001 | 12075279084174198 | 12075279084200256 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 128 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 77056 | 0x7f5b53d76300 | 0x7f5a482360c0 | 12075279084223008 | 12075279084236758 | 12075279084480275 | 12075279084502418 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 130 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 78272 | 0x7f5b53d76a00 | 0x7f5a48236100 | 12075279084526943 | 12075279084539635 | 12075279084663794 | 12075279084667154 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 132 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 80000 | 0x7f5b53d76900 | 0x7f5a48236140 | 12075279084693202 | 12075279084705873 | 12075279084847952 | 12075279084851536 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 134 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 81216 | 0x7f5b53d76800 | 0x7f5a48236180 | 12075279084887002 | 12075279084899631 | 12075279085025070 | 12075279085028996 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 136 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 83456 | 0x7f5b53d76700 | 0x7f5a482361c0 | 12075279085055636 | 12075279085068910 | 12075279085322667 | 12075279085341256 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 138 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 84928 | 0x7f5b53d76600 | 0x7f5a48236200 | 12075279085361694 | 12075279085374507 | 12075279085617704 | 12075279085643638 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 140 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 86400 | 0x7f5b53d76500 | 0x7f5a48236240 | 12075279085664146 | 12075279085676744 | 12075279085801703 | 12075279085805068 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 142 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 88128 | 0x7f5b53d76400 | 0x7f5a48236280 | 12075279085833801 | 12075279085845862 | 12075279085994341 | 12075279085997856 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 144 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 89600 | 0x7f5b53d76300 | 0x7f5a482362c0 | 12075279086054692 | 12075279086068580 | 12075279086194339 | 12075279086197818 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 146 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 92096 | 0x7f5b53d76a00 | 0x7f5a48236300 | 12075279086224728 | 12075279086237698 | 12075279086496736 | 12075279086515338 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 148 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 93568 | 0x7f5b53d76900 | 0x7f5a48236340 | 12075279086537960 | 12075279086551295 | 12075279086795453 | 12075279086814674 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 150 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 95040 | 0x7f5b53d76800 | 0x7f5a48236380 | 12075279086836094 | 12075279086848732 | 12075279086973691 | 12075279086977146 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 152 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 96768 | 0x7f5b53d76700 | 0x7f5a482363c0 | 12075279087007282 | 12075279087019931 | 12075279087177209 | 12075279087180574 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 154 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 98240 | 0x7f5b53d76600 | 0x7f5a48236400 | 12075279087217402 | 12075279087230649 | 12075279087355928 | 12075279087359396 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 156 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 100736 | 0x7f5b53d76500 | 0x7f5a48236440 | 12075279087385575 | 12075279087398647 | 12075279087655765 | 12075279087681996 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 158 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 102208 | 0x7f5b53d76400 | 0x7f5a48236480 | 12075279087702013 | 12075279087714484 | 12075279087962642 | 12075279087984919 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 160 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 103680 | 0x7f5b53d76300 | 0x7f5a482364c0 | 12075279088013712 | 12075279088026161 | 12075279088151600 | 12075279088155345 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 162 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 105664 | 0x7f5b53d76a00 | 0x7f5a48236500 | 12075279088182977 | 12075279088195919 | 12075279088360398 | 12075279088363783 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 164 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 107136 | 0x7f5b53d76900 | 0x7f5a48236540 | 12075279088399850 | 12075279088412397 | 12075279088537836 | 12075279088541222 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 166 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 109888 | 0x7f5b53d76800 | 0x7f5a48236580 | 12075279088567982 | 12075279088579596 | 12075279088834473 | 12075279088860125 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 168 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 111360 | 0x7f5b53d76700 | 0x7f5a482365c0 | 12075279088881344 | 12075279088894313 | 12075279089145670 | 12075279089179648 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 170 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 112832 | 0x7f5b53d76600 | 0x7f5a48236600 | 12075279089202892 | 12075279089217830 | 12075279089342788 | 12075279089346228 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 172 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 114816 | 0x7f5b53d76500 | 0x7f5a48236640 | 12075279089373429 | 12075279089385668 | 12075279089558466 | 12075279089561728 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 174 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 116288 | 0x7f5b53d76400 | 0x7f5a48236680 | 12075279089599749 | 12075279089613026 | 12075279089738784 | 12075279089742194 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 176 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 119040 | 0x7f5b53d76300 | 0x7f5a482366c0 | 12075279089768964 | 12075279089781504 | 12075279090036062 | 12075279090059513 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 178 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 120768 | 0x7f5b53d76a00 | 0x7f5a48236700 | 12075279090080312 | 12075279090092861 | 12075279090340379 | 12075279090366113 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 180 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 122496 | 0x7f5b53d76900 | 0x7f5a48236740 | 12075279090389547 | 12075279090402138 | 12075279090528697 | 12075279090532091 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 182 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 124736 | 0x7f5b53d76800 | 0x7f5a48236780 | 12075279090558360 | 12075279090570616 | 12075279090752375 | 12075279090755767 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 184 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 126464 | 0x7f5b53d76700 | 0x7f5a482367c0 | 12075279090792055 | 12075279090805014 | 12075279090930773 | 12075279090933948 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 186 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 127936 | 0x7f5b53d76600 | 0x7f5a48236800 | 12075279090961038 | 12075279090973173 | 12075279091236370 | 12075279091262899 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 188 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 129664 | 0x7f5b53d76500 | 0x7f5a48236840 | 12075279091284680 | 12075279091297169 | 12075279091544207 | 12075279091566674 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 190 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 131392 | 0x7f5b53d76400 | 0x7f5a48236880 | 12075279091592692 | 12075279091605166 | 12075279091730445 | 12075279091733824 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 192 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 133632 | 0x7f5b53d76300 | 0x7f5a482368c0 | 12075279091758891 | 12075279091771405 | 12075279091961643 | 12075279091964964 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 194 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 135360 | 0x7f5b53d76a00 | 0x7f5a48236900 | 12075279092006211 | 12075279092018922 | 12075279092145961 | 12075279092149517 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 196 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 136832 | 0x7f5b53d76900 | 0x7f5a48236940 | 12075279092177379 | 12075279092190921 | 12075279092504358 | 12075279092527058 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 198 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 138560 | 0x7f5b53d76800 | 0x7f5a48236980 | 12075279092548198 | 12075279092560997 | 12075279092811715 | 12075279092838788 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 200 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 140288 | 0x7f5b53d76700 | 0x7f5a482369c0 | 12075279092858915 | 12075279092871874 | 12075279092996833 | 12075279093004486 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 202 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 142784 | 0x7f5b53d76600 | 0x7f5a48236a00 | 12075279093030223 | 12075279093041312 | 12075279093250910 | 12075279093277523 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 204 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 144768 | 0x7f5b53d76500 | 0x7f5a48236a40 | 12075279093311797 | 12075279093324350 | 12075279093453309 | 12075279093456656 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 206 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 145728 | 0x7f5b53d76400 | 0x7f5a48236a80 | 12075279093483706 | 12075279093495228 | 12075279093801465 | 12075279093824539 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 208 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 147712 | 0x7f5b53d76300 | 0x7f5a48236ac0 | 12075279093845959 | 12075279093858745 | 12075279094108662 | 12075279094138533 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 210 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 149696 | 0x7f5b53d76a00 | 0x7f5a48236b00 | 12075279094159812 | 12075279094172022 | 12075279094299860 | 12075279094303299 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 212 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 152192 | 0x7f5b53d76900 | 0x7f5a48236b40 | 12075279094330449 | 12075279094342580 | 12075279094568818 | 12075279094595151 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 214 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 154176 | 0x7f5b53d76800 | 0x7f5a48236b80 | 12075279094626139 | 12075279094638577 | 12075279094764816 | 12075279094768493 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 216 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 155648 | 0x7f5b53d76700 | 0x7f5a48236bc0 | 12075279094795063 | 12075279094808015 | 12075279095136652 | 12075279095160021 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 218 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 157632 | 0x7f5b53d76600 | 0x7f5a48236c00 | 12075279095182372 | 12075279095194892 | 12075279095441609 | 12075279095464457 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 220 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 159616 | 0x7f5b53d76500 | 0x7f5a48236c40 | 12075279095488702 | 12075279095501609 | 12075279095630087 | 12075279095633541 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 222 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 162368 | 0x7f5b53d76400 | 0x7f5a48236c80 | 12075279095660000 | 12075279095672487 | 12075279095915365 | 12075279095941814 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 224 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 164608 | 0x7f5b53d76300 | 0x7f5a48236cc0 | 12075279095972831 | 12075279095985764 | 12075279096115203 | 12075279096118893 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 226 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 166336 | 0x7f5b53d76a00 | 0x7f5a48236d00 | 12075279096145392 | 12075279096156322 | 12075279096556798 | 12075279096581973 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 228 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 168576 | 0x7f5b53d76900 | 0x7f5a48236d40 | 12075279096603874 | 12075279096616638 | 12075279096874395 | 12075279096900996 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 230 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 170816 | 0x7f5b53d76800 | 0x7f5a48236d80 | 12075279096921494 | 12075279096934715 | 12075279097065274 | 12075279097068868 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 232 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 174080 | 0x7f5b53d76700 | 0x7f5a48236dc0 | 12075279097096068 | 12075279097108313 | 12075279097385590 | 12075279097411615 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 234 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 176576 | 0x7f5b53d76600 | 0x7f5a48236e00 | 12075279097444916 | 12075279097458550 | 12075279097593748 | 12075279097597290 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 236 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 177792 | 0x7f5b53d76500 | 0x7f5a48236e40 | 12075279097624210 | 12075279097636788 | 12075279098058704 | 12075279098083022 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 238 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 180288 | 0x7f5b53d76400 | 0x7f5a48236e80 | 12075279098105143 | 12075279098116463 | 12075279098381741 | 12075279098408226 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 240 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 182784 | 0x7f5b53d76300 | 0x7f5a48236ec0 | 12075279098431039 | 12075279098441740 | 12075279098576139 | 12075279098579455 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 242 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 186304 | 0x7f5b53d76a00 | 0x7f5a48236f00 | 12075279098606114 | 12075279098618538 | 12075279098933255 | 12075279098961605 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 244 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 189312 | 0x7f5b53d76900 | 0x7f5a48236f40 | 12075279098992532 | 12075279099005415 | 12075279099156773 | 12075279099160755 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 246 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 190784 | 0x7f5b53d76800 | 0x7f5a48236f80 | 12075279099187605 | 12075279099199973 | 12075279099715488 | 12075279099738528 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 248 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 193792 | 0x7f5b53d76700 | 0x7f5a48236fc0 | 12075279099760549 | 12075279099772767 | 12075279100071164 | 12075279100098427 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 250 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 196800 | 0x7f5b53d76600 | 0x7f5a48237000 | 12075279100122963 | 12075279100135484 | 12075279100289562 | 12075279100293059 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 252 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 201088 | 0x7f5b53d76500 | 0x7f5a48237040 | 12075279100319748 | 12075279100332122 | 12075279100716918 | 12075279100743095 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 254 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 204608 | 0x7f5b53d76400 | 0x7f5a48237080 | 12075279100776627 | 12075279100789397 | 12075279100964756 | 12075279100968434 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 256 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 206080 | 0x7f5b53d76300 | 0x7f5a482370c0 | 12075279100994572 | 12075279101007155 | 12075279101615949 | 12075279101642977 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 258 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 209600 | 0x7f5b53d76a00 | 0x7f5a48237100 | 12075279101666290 | 12075279101678829 | 12075279102007306 | 12075279102035166 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 260 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 213120 | 0x7f5b53d76900 | 0x7f5a48237140 | 12075279102057437 | 12075279102069385 | 12075279102247623 | 12075279102251307 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 262 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 218176 | 0x7f5b53d76800 | 0x7f5a48237180 | 12075279102278007 | 12075279102290023 | 12075279102745059 | 12075279102771374 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 264 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 222208 | 0x7f5b53d76700 | 0x7f5a482371c0 | 12075279102805677 | 12075279102818818 | 12075279103017376 | 12075279103045553 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 266 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 223936 | 0x7f5b53d76600 | 0x7f5a48237200 | 12075279103066392 | 12075279103078655 | 12075279103780408 | 12075279103810535 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 268 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 227968 | 0x7f5b53d76500 | 0x7f5a48237240 | 12075279103833918 | 12075279103845048 | 12075279104216564 | 12075279104243960 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 270 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 232000 | 0x7f5b53d76400 | 0x7f5a48237280 | 12075279104267804 | 12075279104280564 | 12075279104483122 | 12075279104505356 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 272 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 237824 | 0x7f5b53d76300 | 0x7f5a482372c0 | 12075279104526415 | 12075279104538801 | 12075279105063756 | 12075279105091495 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 274 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 242368 | 0x7f5b53d76a00 | 0x7f5a48237300 | 12075279105122212 | 12075279105135755 | 12075279105359753 | 12075279105386894 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 276 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 243584 | 0x7f5b53d76900 | 0x7f5a48237340 | 12075279105407773 | 12075279105420553 | 12075279106216865 | 12075279106244317 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 278 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 248128 | 0x7f5b53d76800 | 0x7f5a48237380 | 12075279106267109 | 12075279106279744 | 12075279106722300 | 12075279106748684 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 280 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 252672 | 0x7f5b53d76700 | 0x7f5a482373c0 | 12075279106772188 | 12075279106784859 | 12075279107009657 | 12075279107036288 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 282 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 259264 | 0x7f5b53d76600 | 0x7f5a48237400 | 12075279107059101 | 12075279107070457 | 12075279107665491 | 12075279107691857 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 284 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 264832 | 0x7f5b53d76500 | 0x7f5a48237440 | 12075279107723616 | 12075279107735570 | 12075279108003408 | 12075279108031558 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 286 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 266304 | 0x7f5b53d76400 | 0x7f5a48237480 | 12075279108053298 | 12075279108065487 | 12075279109048677 | 12075279109076179 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 288 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 28 | 24 | 271872 | 0x7f5b53d76300 | 0x7f5a482374c0 | 12075279109097809 | 12075279109110277 | 12075279109625952 | 12075279109652349 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 290 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 277440 | 0x7f5b53d76a00 | 0x7f5a48237500 | 12075279109676234 | 12075279109688991 | 12075279109959069 | 12075279109985298 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 292 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 12 | 24 | 279936 | 0x7f5b53d76900 | 0x7f5a48237540 | 12075279110012088 | 12075279110024668 | 12075279110761301 | 12075279110794692 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 294 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 286528 | 0x7f5b53d76800 | 0x7f5a48237580 | 12075279110827994 | 12075279110840500 | 12075279111154577 | 12075279111187241 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 296 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 288000 | 0x7f5b53d76700 | 0x7f5a482375c0 | 12075279111209112 | 12075279111222256 | 12075279112391845 | 12075279112419421 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 298 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 32 | 24 | 294592 | 0x7f5b53d76600 | 0x7f5a48237600 | 12075279112440791 | 12075279112453124 | 12075279113062719 | 12075279113090899 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 300 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 301184 | 0x7f5b53d76500 | 0x7f5a48237640 | 12075279113112850 | 12075279113125118 | 12075279113445115 | 12075279113472899 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 302 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 12 | 24 | 304960 | 0x7f5b53d76400 | 0x7f5a48237680 | 12075279113495100 | 12075279113507834 | 12075279114383986 | 12075279114413466 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 304 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 24 | 24 | 313600 | 0x7f5b53d76300 | 0x7f5a482376c0 | 12075279114444794 | 12075279114458065 | 12075279114868141 | 12075279114895622 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 306 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 314816 | 0x7f5b53d76a00 | 0x7f5a48237700 | 12075279114919747 | 12075279114932140 | 12075279116481085 | 12075279116554444 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 308 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 317568 | 0x7f5b53d76900 | 0x7f5a48237740 | 12075279116579090 | 12075279116593185 | 12075279117385498 | 12075279117460588 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 310 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 12 | 24 | 320320 | 0x7f5b53d76800 | 0x7f5a48237780 | 12075279117484202 | 12075279117497176 | 12075279117910613 | 12075279117980995 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 312 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 12 | 24 | 324096 | 0x7f5b53d76700 | 0x7f5a482377c0 | 12075279118007144 | 12075279118019892 | 12075279119177162 | 12075279119249372 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 314 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 12 | 24 | 328896 | 0x7f5b53d76600 | 0x7f5a48237800 | 12075279119280971 | 12075279119294281 | 12075279120079075 | 12075279120150146 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 316 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 330112 | 0x7f5b53d76500 | 0x7f5a48237840 | 12075279120171756 | 12075279120183234 | 12075279123232648 | 12075279123303625 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 318 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 332864 | 0x7f5b53d76400 | 0x7f5a48237880 | 12075279123327590 | 12075279123339048 | 12075279124878075 | 12075279124950034 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 320 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 12 | 24 | 335616 | 0x7f5b53d76300 | 0x7f5a482378c0 | 12075279124971274 | 12075279124984474 | 12075279125773267 | 12075279125848203 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 322 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 12 | 24 | 339392 | 0x7f5b53d76a00 | 0x7f5a48237900 | 12075279125871537 | 12075279125885106 | 12075279128166207 | 12075279128240008 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 324 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 12 | 24 | 344192 | 0x7f5b53d76900 | 0x7f5a48237940 | 12075279128277547 | 12075279128291006 | 12075279129826034 | 12075279129897357 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 326 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 345408 | 0x7f5b53d76800 | 0x7f5a48237980 | 12075279129919889 | 12075279129933233 | 12075279135986942 | 12075279136061130 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 328 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 20 | 24 | 348160 | 0x7f5b53d76700 | 0x7f5a482379c0 | 12075279136084564 | 12075279136096381 | 12075279139136356 | 12075279139210452 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 330 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 12 | 24 | 350912 | 0x7f5b53d76600 | 0x7f5a48237a00 | 12075279139232704 | 12075279139244035 | 12075279140782262 | 12075279140854868 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 332 | 868283 | 868288 | 4194304 | 256 | 0 | 0 | 12 | 24 | 0 | 0x7f5b53d76500 | 0x7f5a48237a40 | 12075279140877279 | 12075279140888662 | 12075279145415344 | 12075279145490882 |