39 KiB
39 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBuffer.kd | 0 | 0 | 0 | 891557 | 891562 | 33554432 | 256 | 0 | 0 | 8 | 32 | 6464 | 0x0 | 0x7fbba9204180 | 12075755395432052 | 12075755395473365 | 12075755395797202 | 12075755395906163 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 891557 | 891562 | 32768 | 256 | 0 | 0 | 24 | 24 | 12480 | 0x0 | 0x7fbba9235100 | 12075755411537444 | 12075755411649045 | 12075755411655605 | 12075755411661073 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 4 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 12928 | 0x7fbcb4f48900 | 0x7fbba9235140 | 12075755411717368 | 12075755411733204 | 12075755411873363 | 12075755411876484 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 6 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 36 | 24 | 13632 | 0x7fbcb4f48800 | 0x7fbba9235180 | 12075755411928380 | 12075755411940402 | 12075755412188240 | 12075755412288509 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 8 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 14080 | 0x7fbcb4f48700 | 0x7fbba92351c0 | 12075755412323855 | 12075755412335918 | 12075755412582956 | 12075755412680608 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 10 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14528 | 0x7fbcb4f48600 | 0x7fbba9235200 | 12075755412716194 | 12075755412728875 | 12075755412854473 | 12075755412857346 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 12 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 14976 | 0x7fbcb4f48500 | 0x7fbba9235240 | 12075755412894586 | 12075755412907913 | 12075755413033192 | 12075755413036239 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 14 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 15424 | 0x7fbcb4f48400 | 0x7fbba9235280 | 12075755413100068 | 12075755413112711 | 12075755413237350 | 12075755413239767 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 16 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16128 | 0x7fbcb4f48300 | 0x7fbba92352c0 | 12075755413276005 | 12075755413288549 | 12075755413533667 | 12075755413631365 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 18 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 16832 | 0x7fbcb4f48a00 | 0x7fbba9235300 | 12075755413661371 | 12075755413673345 | 12075755413921343 | 12075755414020268 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 20 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 17536 | 0x7fbcb4f48900 | 0x7fbba9235340 | 12075755414051846 | 12075755414064061 | 12075755414189340 | 12075755414192498 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 22 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18240 | 0x7fbcb4f48800 | 0x7fbba9235380 | 12075755414228425 | 12075755414240540 | 12075755414366139 | 12075755414369046 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 24 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 18944 | 0x7fbcb4f48700 | 0x7fbba92353c0 | 12075755414415112 | 12075755414426778 | 12075755414551417 | 12075755414554170 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 26 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 19904 | 0x7fbcb4f48600 | 0x7fbba9235400 | 12075755414588424 | 12075755414601176 | 12075755414845334 | 12075755414918788 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 28 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 20608 | 0x7fbcb4f48500 | 0x7fbba9235440 | 12075755414949865 | 12075755414962133 | 12075755415207570 | 12075755415278636 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 30 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 21312 | 0x7fbcb4f48400 | 0x7fbba9235480 | 12075755415309724 | 12075755415322449 | 12075755415447088 | 12075755415449724 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 32 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22016 | 0x7fbcb4f48300 | 0x7fbba92354c0 | 12075755415485391 | 12075755415497327 | 12075755415622446 | 12075755415625220 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 34 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 22720 | 0x7fbcb4f48a00 | 0x7fbba9235500 | 12075755415670805 | 12075755415684206 | 12075755415808524 | 12075755415811276 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 36 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 23680 | 0x7fbcb4f48900 | 0x7fbba9235540 | 12075755415845550 | 12075755415860044 | 12075755416108041 | 12075755416178449 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 38 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 24384 | 0x7fbcb4f48800 | 0x7fbba9235580 | 12075755416213303 | 12075755416227720 | 12075755416473478 | 12075755416541363 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 40 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25088 | 0x7fbcb4f48700 | 0x7fbba92355c0 | 12075755416572260 | 12075755416585797 | 12075755416710276 | 12075755416712872 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 42 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 25792 | 0x7fbcb4f48600 | 0x7fbba9235600 | 12075755416747176 | 12075755416758435 | 12075755416884354 | 12075755416887116 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 44 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 26496 | 0x7fbcb4f48500 | 0x7fbba9235640 | 12075755416932470 | 12075755416944833 | 12075755417069472 | 12075755417072250 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 46 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 27712 | 0x7fbcb4f48400 | 0x7fbba9235680 | 12075755417108487 | 12075755417124191 | 12075755417368989 | 12075755417436777 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 48 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 28416 | 0x7fbcb4f48300 | 0x7fbba92356c0 | 12075755417469107 | 12075755417480988 | 12075755417724506 | 12075755417821582 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 50 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 29120 | 0x7fbcb4f48a00 | 0x7fbba9235700 | 12075755417850676 | 12075755417862904 | 12075755417986583 | 12075755417989424 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 52 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30080 | 0x7fbcb4f48900 | 0x7fbba9235740 | 12075755418030861 | 12075755418042262 | 12075755418167221 | 12075755418170170 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 54 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 30784 | 0x7fbcb4f48800 | 0x7fbba9235780 | 12075755418216055 | 12075755418228341 | 12075755418353139 | 12075755418356036 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 56 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32000 | 0x7fbcb4f48700 | 0x7fbba92357c0 | 12075755418389107 | 12075755418401299 | 12075755418685136 | 12075755418782699 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 58 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 32960 | 0x7fbcb4f48600 | 0x7fbba9235800 | 12075755418810781 | 12075755418824175 | 12075755419069612 | 12075755419149370 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 60 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 33920 | 0x7fbcb4f48500 | 0x7fbba9235840 | 12075755419178725 | 12075755419190731 | 12075755419315850 | 12075755419318785 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 62 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 34880 | 0x7fbcb4f48400 | 0x7fbba9235880 | 12075755419353399 | 12075755419368649 | 12075755419493768 | 12075755419496665 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 64 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 35840 | 0x7fbcb4f48300 | 0x7fbba92358c0 | 12075755419541028 | 12075755419553768 | 12075755419679046 | 12075755419681549 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 66 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 37312 | 0x7fbcb4f48a00 | 0x7fbba9235900 | 12075755419714781 | 12075755419726566 | 12075755419980803 | 12075755420035417 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 68 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 38272 | 0x7fbcb4f48900 | 0x7fbba9235940 | 12075755420064020 | 12075755420075203 | 12075755420321920 | 12075755420401086 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 70 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 39232 | 0x7fbcb4f48800 | 0x7fbba9235980 | 12075755420429780 | 12075755420441279 | 12075755420565918 | 12075755420568868 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 72 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 40192 | 0x7fbcb4f48700 | 0x7fbba92359c0 | 12075755420605055 | 12075755420616797 | 12075755420742076 | 12075755420744605 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 74 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 41152 | 0x7fbcb4f48600 | 0x7fbba9235a00 | 12075755420787895 | 12075755420800475 | 12075755420925274 | 12075755420927765 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 76 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 42624 | 0x7fbcb4f48500 | 0x7fbba9235a40 | 12075755420962409 | 12075755420975994 | 12075755421223991 | 12075755421283406 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 78 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 43584 | 0x7fbcb4f48400 | 0x7fbba9235a80 | 12075755421310306 | 12075755421322550 | 12075755421566228 | 12075755421591989 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 80 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 44544 | 0x7fbcb4f48300 | 0x7fbba9235ac0 | 12075755421620633 | 12075755421632947 | 12075755421757906 | 12075755421760643 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 82 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 45760 | 0x7fbcb4f48a00 | 0x7fbba9235b00 | 12075755421794476 | 12075755421806546 | 12075755421931664 | 12075755421934336 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 84 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 46720 | 0x7fbcb4f48900 | 0x7fbba9235b40 | 12075755421979329 | 12075755421991184 | 12075755422116143 | 12075755422119109 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 86 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 48448 | 0x7fbcb4f48800 | 0x7fbba9235b80 | 12075755422154856 | 12075755422167502 | 12075755422418860 | 12075755422443893 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 88 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 49408 | 0x7fbcb4f48700 | 0x7fbba9235bc0 | 12075755422476563 | 12075755422488779 | 12075755422733256 | 12075755422756764 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 90 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 50368 | 0x7fbcb4f48600 | 0x7fbba9235c00 | 12075755422787712 | 12075755422799496 | 12075755422924135 | 12075755422926770 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 92 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 51584 | 0x7fbcb4f48500 | 0x7fbba9235c40 | 12075755422961615 | 12075755422973414 | 12075755423099973 | 12075755423103018 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 94 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 52544 | 0x7fbcb4f48400 | 0x7fbba9235c80 | 12075755423148322 | 12075755423162212 | 12075755423287171 | 12075755423290105 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 96 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 54272 | 0x7fbcb4f48300 | 0x7fbba9235cc0 | 12075755423324018 | 12075755423335651 | 12075755423592128 | 12075755423615801 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 98 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 55488 | 0x7fbcb4f48a00 | 0x7fbba9235d00 | 12075755423645546 | 12075755423658367 | 12075755423903805 | 12075755423926508 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 100 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 56704 | 0x7fbcb4f48900 | 0x7fbba9235d40 | 12075755423955151 | 12075755423968764 | 12075755424094363 | 12075755424097045 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 102 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 58176 | 0x7fbcb4f48800 | 0x7fbba9235d80 | 12075755424133613 | 12075755424146523 | 12075755424273881 | 12075755424276569 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 104 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 59392 | 0x7fbcb4f48700 | 0x7fbba9235dc0 | 12075755424321001 | 12075755424332601 | 12075755424457720 | 12075755424460300 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 106 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 61376 | 0x7fbcb4f48600 | 0x7fbba9235e00 | 12075755424494724 | 12075755424506679 | 12075755424758837 | 12075755424783551 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 108 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 62592 | 0x7fbcb4f48500 | 0x7fbba9235e40 | 12075755424812765 | 12075755424824596 | 12075755425072114 | 12075755425105269 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 110 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 63808 | 0x7fbcb4f48400 | 0x7fbba9235e80 | 12075755425133181 | 12075755425144433 | 12075755425269552 | 12075755425272560 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 112 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 65280 | 0x7fbcb4f48300 | 0x7fbba9235ec0 | 12075755425305120 | 12075755425317871 | 12075755425446990 | 12075755425449599 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 114 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 66496 | 0x7fbcb4f48a00 | 0x7fbba9235f00 | 12075755425493610 | 12075755425505549 | 12075755425630508 | 12075755425633120 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 116 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 68480 | 0x7fbcb4f48900 | 0x7fbba9235f40 | 12075755425666321 | 12075755425680268 | 12075755425933545 | 12075755425957432 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 118 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 69696 | 0x7fbcb4f48800 | 0x7fbba9235f80 | 12075755425987438 | 12075755426000744 | 12075755426280742 | 12075755426311500 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 120 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 70912 | 0x7fbcb4f48700 | 0x7fbba9235fc0 | 12075755426338931 | 12075755426350181 | 12075755426475300 | 12075755426478300 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 122 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 72384 | 0x7fbcb4f48600 | 0x7fbba9236000 | 12075755426511723 | 12075755426523779 | 12075755426659458 | 12075755426662162 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 124 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 73600 | 0x7fbcb4f48500 | 0x7fbba9236040 | 12075755426706284 | 12075755426718017 | 12075755426842656 | 12075755426845293 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 126 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 75840 | 0x7fbcb4f48400 | 0x7fbba9236080 | 12075755426878795 | 12075755426890976 | 12075755427148733 | 12075755427173002 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 128 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 77056 | 0x7fbcb4f48300 | 0x7fbba92360c0 | 12075755427201615 | 12075755427212893 | 12075755427457690 | 12075755427480733 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 130 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 78272 | 0x7fbcb4f48a00 | 0x7fbba9236100 | 12075755427509076 | 12075755427522650 | 12075755427647288 | 12075755427649948 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 132 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 80000 | 0x7fbcb4f48900 | 0x7fbba9236140 | 12075755427686135 | 12075755427698648 | 12075755427840406 | 12075755427843107 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 134 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 81216 | 0x7fbcb4f48800 | 0x7fbba9236180 | 12075755427885506 | 12075755427898326 | 12075755428024405 | 12075755428027159 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 136 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 83456 | 0x7fbcb4f48700 | 0x7fbba92361c0 | 12075755428062935 | 12075755428075284 | 12075755428337522 | 12075755428364606 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 138 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 84928 | 0x7fbcb4f48600 | 0x7fbba9236200 | 12075755428393880 | 12075755428406801 | 12075755428654478 | 12075755428677668 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 140 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 86400 | 0x7fbcb4f48500 | 0x7fbba9236240 | 12075755428706291 | 12075755428719598 | 12075755428845677 | 12075755428848746 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 142 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 88128 | 0x7fbcb4f48400 | 0x7fbba9236280 | 12075755428881326 | 12075755428893036 | 12075755429042475 | 12075755429045812 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 144 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 89600 | 0x7fbcb4f48300 | 0x7fbba92362c0 | 12075755429109400 | 12075755429123914 | 12075755429249033 | 12075755429252005 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 146 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 92096 | 0x7fbcb4f48a00 | 0x7fbba9236300 | 12075755429284636 | 12075755429296552 | 12075755429561350 | 12075755429581187 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 148 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 93568 | 0x7fbcb4f48900 | 0x7fbba9236340 | 12075755429612575 | 12075755429624389 | 12075755429869187 | 12075755429892896 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 150 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 95040 | 0x7fbcb4f48800 | 0x7fbba9236380 | 12075755429921109 | 12075755429932706 | 12075755430058785 | 12075755430062241 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 152 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 96768 | 0x7fbcb4f48700 | 0x7fbba92363c0 | 12075755430095803 | 12075755430107904 | 12075755430265663 | 12075755430268264 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 154 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 98240 | 0x7fbcb4f48600 | 0x7fbba9236400 | 12075755430312917 | 12075755430324382 | 12075755430449661 | 12075755430452446 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 156 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 100736 | 0x7fbcb4f48500 | 0x7fbba9236440 | 12075755430485438 | 12075755430497980 | 12075755430760858 | 12075755430781718 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 158 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 102208 | 0x7fbcb4f48400 | 0x7fbba9236480 | 12075755430811193 | 12075755430823257 | 12075755431070775 | 12075755431095852 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 160 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 103680 | 0x7fbcb4f48300 | 0x7fbba92364c0 | 12075755431122151 | 12075755431134454 | 12075755431259733 | 12075755431262422 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 162 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 105664 | 0x7fbcb4f48a00 | 0x7fbba9236500 | 12075755431298048 | 12075755431310772 | 12075755431475731 | 12075755431478694 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 164 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 107136 | 0x7fbcb4f48900 | 0x7fbba9236540 | 12075755431523076 | 12075755431534290 | 12075755431659569 | 12075755431662185 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 166 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 109888 | 0x7fbcb4f48800 | 0x7fbba9236580 | 12075755431695637 | 12075755431708048 | 12075755431963246 | 12075755431983532 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 168 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 111360 | 0x7fbcb4f48700 | 0x7fbba92365c0 | 12075755432017485 | 12075755432029325 | 12075755432275563 | 12075755432299569 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 170 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 112832 | 0x7fbcb4f48600 | 0x7fbba9236600 | 12075755432327942 | 12075755432342282 | 12075755432467401 | 12075755432470076 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 172 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 114816 | 0x7fbcb4f48500 | 0x7fbba9236640 | 12075755432505181 | 12075755432516521 | 12075755432689799 | 12075755432692439 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 174 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 116288 | 0x7fbcb4f48400 | 0x7fbba9236680 | 12075755432735429 | 12075755432749638 | 12075755432875877 | 12075755432878515 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 176 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 119040 | 0x7fbcb4f48300 | 0x7fbba92366c0 | 12075755432910434 | 12075755432922277 | 12075755433177794 | 12075755433207176 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 178 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 120768 | 0x7fbcb4f48a00 | 0x7fbba9236700 | 12075755433241319 | 12075755433253313 | 12075755433500671 | 12075755433524025 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 180 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 122496 | 0x7fbcb4f48900 | 0x7fbba9236740 | 12075755433553600 | 12075755433567390 | 12075755433692349 | 12075755433695113 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 182 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 124736 | 0x7fbcb4f48800 | 0x7fbba9236780 | 12075755433727683 | 12075755433739869 | 12075755433922587 | 12075755433925601 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 184 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 126464 | 0x7fbcb4f48700 | 0x7fbba92367c0 | 12075755433967559 | 12075755433979546 | 12075755434105465 | 12075755434108842 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 186 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 127936 | 0x7fbcb4f48600 | 0x7fbba9236800 | 12075755434141442 | 12075755434152825 | 12075755434416182 | 12075755434440007 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 188 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 129664 | 0x7fbcb4f48500 | 0x7fbba9236840 | 12075755434470423 | 12075755434482581 | 12075755434728499 | 12075755434752067 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 190 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 131392 | 0x7fbcb4f48400 | 0x7fbba9236880 | 12075755434779899 | 12075755434791058 | 12075755434916977 | 12075755434919638 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 192 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 133632 | 0x7fbcb4f48300 | 0x7fbba92368c0 | 12075755434953872 | 12075755434965137 | 12075755435156975 | 12075755435160115 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 194 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 135360 | 0x7fbcb4f48a00 | 0x7fbba9236900 | 12075755435202023 | 12075755435214894 | 12075755435340973 | 12075755435343676 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 196 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 136832 | 0x7fbcb4f48900 | 0x7fbba9236940 | 12075755435376297 | 12075755435389292 | 12075755435702729 | 12075755435730916 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 198 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 138560 | 0x7fbcb4f48800 | 0x7fbba9236980 | 12075755435760150 | 12075755435772169 | 12075755436017286 | 12075755436047565 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 200 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 140288 | 0x7fbcb4f48700 | 0x7fbba92369c0 | 12075755436077150 | 12075755436089926 | 12075755436216004 | 12075755436218833 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 202 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 142784 | 0x7fbcb4f48600 | 0x7fbba9236a00 | 12075755436251774 | 12075755436263364 | 12075755436473282 | 12075755436500496 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 204 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 144768 | 0x7fbcb4f48500 | 0x7fbba9236a40 | 12075755436536724 | 12075755436548801 | 12075755436675840 | 12075755436678607 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 206 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 145728 | 0x7fbcb4f48400 | 0x7fbba9236a80 | 12075755436711559 | 12075755436724319 | 12075755437060956 | 12075755437089531 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 208 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 147712 | 0x7fbcb4f48300 | 0x7fbba9236ac0 | 12075755437123905 | 12075755437135355 | 12075755437383353 | 12075755437410888 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 210 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 149696 | 0x7fbcb4f48a00 | 0x7fbba9236b00 | 12075755437441174 | 12075755437455192 | 12075755437583511 | 12075755437586575 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 212 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 152192 | 0x7fbcb4f48900 | 0x7fbba9236b40 | 12075755437617031 | 12075755437627990 | 12075755437855348 | 12075755437878387 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 214 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 154176 | 0x7fbcb4f48800 | 0x7fbba9236b80 | 12075755437915446 | 12075755437928628 | 12075755438055666 | 12075755438058722 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 216 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 155648 | 0x7fbcb4f48700 | 0x7fbba9236bc0 | 12075755438092174 | 12075755438104306 | 12075755438432783 | 12075755438458836 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 218 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 157632 | 0x7fbcb4f48600 | 0x7fbba9236c00 | 12075755438489383 | 12075755438501422 | 12075755438750699 | 12075755438778269 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 220 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 159616 | 0x7fbcb4f48500 | 0x7fbba9236c40 | 12075755438806281 | 12075755438818059 | 12075755438946698 | 12075755438949548 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 222 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 162368 | 0x7fbcb4f48400 | 0x7fbba9236c80 | 12075755438983771 | 12075755438995017 | 12075755439238535 | 12075755439263050 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 224 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 164608 | 0x7fbcb4f48300 | 0x7fbba9236cc0 | 12075755439302033 | 12075755439314534 | 12075755439443493 | 12075755439446591 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 226 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 166336 | 0x7fbcb4f48a00 | 0x7fbba9236d00 | 12075755439479392 | 12075755439491492 | 12075755439866689 | 12075755439889755 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 228 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 168576 | 0x7fbcb4f48900 | 0x7fbba9236d40 | 12075755439919851 | 12075755439932448 | 12075755440185565 | 12075755440210692 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 230 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 170816 | 0x7fbcb4f48800 | 0x7fbba9236d80 | 12075755440240337 | 12075755440252765 | 12075755440381883 | 12075755440385025 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 232 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 174080 | 0x7fbcb4f48700 | 0x7fbba9236dc0 | 12075755440417596 | 12075755440429723 | 12075755440708120 | 12075755440730858 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 234 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 176576 | 0x7fbcb4f48600 | 0x7fbba9236e00 | 12075755440769009 | 12075755440782200 | 12075755440917878 | 12075755440920711 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 236 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 177792 | 0x7fbcb4f48500 | 0x7fbba9236e40 | 12075755440952270 | 12075755440965718 | 12075755441412593 | 12075755441436970 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 238 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 180288 | 0x7fbcb4f48400 | 0x7fbba9236e80 | 12075755441471535 | 12075755441484273 | 12075755441740110 | 12075755441763898 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 240 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 182784 | 0x7fbcb4f48300 | 0x7fbba9236ec0 | 12075755441793072 | 12075755441806669 | 12075755441941548 | 12075755441944444 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 242 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 186304 | 0x7fbcb4f48a00 | 0x7fbba9236f00 | 12075755441976163 | 12075755441987308 | 12075755442302025 | 12075755442326975 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 244 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 189312 | 0x7fbcb4f48900 | 0x7fbba9236f40 | 12075755442366237 | 12075755442378344 | 12075755442529862 | 12075755442532767 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 246 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 190784 | 0x7fbcb4f48800 | 0x7fbba9236f80 | 12075755442565838 | 12075755442578022 | 12075755443094337 | 12075755443124036 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 248 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 193792 | 0x7fbcb4f48700 | 0x7fbba9236fc0 | 12075755443154292 | 12075755443166016 | 12075755443466173 | 12075755443493823 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 250 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 196800 | 0x7fbcb4f48600 | 0x7fbba9237000 | 12075755443522176 | 12075755443534653 | 12075755443688091 | 12075755443690929 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 252 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 201088 | 0x7fbcb4f48500 | 0x7fbba9237040 | 12075755443725514 | 12075755443737051 | 12075755444121367 | 12075755444150343 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 254 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 204608 | 0x7fbcb4f48400 | 0x7fbba9237080 | 12075755444189837 | 12075755444202966 | 12075755444379604 | 12075755444382715 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 256 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 206080 | 0x7fbcb4f48300 | 0x7fbba92370c0 | 12075755444414835 | 12075755444429044 | 12075755445038478 | 12075755445067097 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 258 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 209600 | 0x7fbcb4f48a00 | 0x7fbba9237100 | 12075755445098245 | 12075755445109197 | 12075755445464874 | 12075755445492377 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 260 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 213120 | 0x7fbcb4f48900 | 0x7fbba9237140 | 12075755445520850 | 12075755445532873 | 12075755445711271 | 12075755445714470 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 262 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 218176 | 0x7fbcb4f48800 | 0x7fbba9237180 | 12075755445747542 | 12075755445758951 | 12075755446214146 | 12075755446243133 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 264 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 222208 | 0x7fbcb4f48700 | 0x7fbba92371c0 | 12075755446282816 | 12075755446294945 | 12075755446495584 | 12075755446522422 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 266 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 223936 | 0x7fbcb4f48600 | 0x7fbba9237200 | 12075755446549592 | 12075755446561343 | 12075755447264056 | 12075755447293855 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 268 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 227968 | 0x7fbcb4f48500 | 0x7fbba9237240 | 12075755447328069 | 12075755447340055 | 12075755447738291 | 12075755447765321 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 270 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 232000 | 0x7fbcb4f48400 | 0x7fbba9237280 | 12075755447794786 | 12075755447806131 | 12075755448007729 | 12075755448037076 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 272 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 237824 | 0x7fbcb4f48300 | 0x7fbba92372c0 | 12075755448064397 | 12075755448078128 | 12075755448603883 | 12075755448630790 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 274 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 242368 | 0x7fbcb4f48a00 | 0x7fbba9237300 | 12075755448670864 | 12075755448683402 | 12075755448906920 | 12075755448933633 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 276 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 243584 | 0x7fbcb4f48900 | 0x7fbba9237340 | 12075755448960272 | 12075755448973799 | 12075755449771551 | 12075755449802618 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 278 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 248128 | 0x7fbcb4f48800 | 0x7fbba9237380 | 12075755449833225 | 12075755449845951 | 12075755450263867 | 12075755450292388 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 280 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 252672 | 0x7fbcb4f48700 | 0x7fbba92373c0 | 12075755450321282 | 12075755450335546 | 12075755450560984 | 12075755450587747 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 282 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 259264 | 0x7fbcb4f48600 | 0x7fbba9237400 | 12075755450617602 | 12075755450630583 | 12075755451226897 | 12075755451255297 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 284 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 264832 | 0x7fbcb4f48500 | 0x7fbba9237440 | 12075755451295001 | 12075755451308976 | 12075755451577614 | 12075755451600529 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 286 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 266304 | 0x7fbcb4f48400 | 0x7fbba9237480 | 12075755451631236 | 12075755451644973 | 12075755452629443 | 12075755452658335 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 288 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 28 | 24 | 271872 | 0x7fbcb4f48300 | 0x7fbba92374c0 | 12075755452689082 | 12075755452701283 | 12075755453216798 | 12075755453246217 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 290 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 277440 | 0x7fbcb4f48a00 | 0x7fbba9237500 | 12075755453275632 | 12075755453290237 | 12075755453562074 | 12075755453588984 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 292 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 12 | 24 | 279936 | 0x7fbcb4f48900 | 0x7fbba9237540 | 12075755453617858 | 12075755453630874 | 12075755454368466 | 12075755454396776 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 294 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 286528 | 0x7fbcb4f48800 | 0x7fbba9237580 | 12075755454435367 | 12075755454447826 | 12075755454763502 | 12075755454790467 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 296 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 288000 | 0x7fbcb4f48700 | 0x7fbba92375c0 | 12075755454818900 | 12075755454832622 | 12075755456004930 | 12075755456037585 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 298 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 32 | 24 | 294592 | 0x7fbcb4f48600 | 0x7fbba9237600 | 12075755456068753 | 12075755456081730 | 12075755456692604 | 12075755456720344 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 300 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 301184 | 0x7fbcb4f48500 | 0x7fbba9237640 | 12075755456749618 | 12075755456762523 | 12075755457080600 | 12075755457110219 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 302 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 12 | 24 | 304960 | 0x7fbcb4f48400 | 0x7fbba9237680 | 12075755457140214 | 12075755457152919 | 12075755458029870 | 12075755458060465 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 304 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 24 | 24 | 313600 | 0x7fbcb4f48300 | 0x7fbba92376c0 | 12075755458097874 | 12075755458112302 | 12075755458520139 | 12075755458552699 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 306 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 314816 | 0x7fbcb4f48a00 | 0x7fbba9237700 | 12075755458582845 | 12075755458597257 | 12075755460146684 | 12075755460219878 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 308 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 317568 | 0x7fbcb4f48900 | 0x7fbba9237740 | 12075755460248401 | 12075755460262043 | 12075755461056436 | 12075755461128136 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 310 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 12 | 24 | 320320 | 0x7fbcb4f48800 | 0x7fbba9237780 | 12075755461157931 | 12075755461170035 | 12075755461583951 | 12075755461656778 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 312 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 12 | 24 | 324096 | 0x7fbcb4f48700 | 0x7fbba92377c0 | 12075755461686313 | 12075755461698510 | 12075755462857060 | 12075755462930415 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 314 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 12 | 24 | 328896 | 0x7fbcb4f48600 | 0x7fbba9237800 | 12075755462970890 | 12075755462984259 | 12075755463769693 | 12075755463844354 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 316 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 330112 | 0x7fbcb4f48500 | 0x7fbba9237840 | 12075755463873107 | 12075755463886012 | 12075755466940545 | 12075755467014635 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 318 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 332864 | 0x7fbcb4f48400 | 0x7fbba9237880 | 12075755467048929 | 12075755467062304 | 12075755468604851 | 12075755468678658 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 320 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 12 | 24 | 335616 | 0x7fbcb4f48300 | 0x7fbba92378c0 | 12075755468708443 | 12075755468722450 | 12075755469511723 | 12075755469584982 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 322 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 12 | 24 | 339392 | 0x7fbcb4f48a00 | 0x7fbba9237900 | 12075755469616210 | 12075755469629802 | 12075755471910903 | 12075755471984261 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 324 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 12 | 24 | 344192 | 0x7fbcb4f48900 | 0x7fbba9237940 | 12075755472034615 | 12075755472048021 | 12075755473583528 | 12075755473657140 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 326 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 345408 | 0x7fbcb4f48800 | 0x7fbba9237980 | 12075755473690242 | 12075755473704647 | 12075755479760275 | 12075755479833929 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 328 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 20 | 24 | 348160 | 0x7fbcb4f48700 | 0x7fbba92379c0 | 12075755479865047 | 12075755479879154 | 12075755482921528 | 12075755482996898 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 330 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 12 | 24 | 350912 | 0x7fbcb4f48600 | 0x7fbba9237a00 | 12075755483036702 | 12075755483050487 | 12075755484589994 | 12075755484663736 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 332 | 891557 | 891562 | 4194304 | 256 | 0 | 0 | 12 | 24 | 0 | 0x7fbcb4f48500 | 0x7fbba9237a40 | 12075755484691457 | 12075755484704873 | 12075755489231074 | 12075755489304590 |