48 KiB
48 KiB
| 1 | Index | KernelName | gpu-id | queue-id | queue-index | pid | tid | grd | wgr | lds | scr | vgpr | sgpr | fbar | sig | obj | GRBM_COUNT | GRBM_GUI_ACTIVE | CPC_ME1_BUSY_FOR_PACKET_DECODE | SQ_CYCLES | SQ_WAVES | SQ_WAVE_CYCLES | SQ_BUSY_CYCLES | SQ_LEVEL_WAVES | SQ_ACCUM_PREV_HIRES | DispatchNs | BeginNs | EndNs | CompleteNs |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 2 | 0 | __amd_rocclr_fillBufferAligned.kd | 0 | 0 | 0 | 206513 | 206513 | 33554432 | 256 | 0 | 0 | 4 | 32 | 4160 | 0x0 | 0x7fd82ca04280 | 381343 | 381343 | 8981 | 3050752 | 524288 | 239919456 | 2962542 | 0 | 975899640 | 17336850338375 | 17336133839148 | 17336997386761 | 17336997497271 |
| 3 | 1 | void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd] | 0 | 0 | 2 | 206513 | 206513 | 32768 | 256 | 0 | 0 | 12 | 24 | 13888 | 0x0 | 0x7fd82ca23f80 | 34251 | 34251 | 30792 | 274016 | 512 | 1814325 | 172534 | 0 | 7270928 | 17337002664734 | 17336997386761 | 17337002807885 | 17337002812960 |
| 4 | 2 | void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd] | 0 | 0 | 5 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 14336 | 0x7fd82f967380 | 0x7fd82ca23fc0 | 164673 | 164673 | 13486 | 1317392 | 65536 | 85192702 | 1215418 | 0 | 342501352 | 17337002856539 | 17337002807885 | 17337003204845 | 17337003207389 |
| 5 | 3 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 8 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15040 | 0x7fd82f967200 | 0x7fd82ca24000 | 308785 | 308785 | 22884 | 2470288 | 65536 | 217509407 | 2369781 | 0 | 871766408 | 17337003253058 | 17337003204845 | 17337003632366 | 17337003634908 |
| 6 | 4 | void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd] | 0 | 0 | 11 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 15488 | 0x7fd82f967080 | 0x7fd82ca24040 | 311307 | 311307 | 25154 | 2490464 | 65536 | 227703054 | 2382205 | 0 | 912542188 | 17337003675557 | 17337003632366 | 17337004062926 | 17337004065557 |
| 7 | 5 | void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd] | 0 | 0 | 14 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 15936 | 0x7fd82d309f00 | 0x7fd82ca24080 | 166189 | 166189 | 14006 | 1329520 | 65536 | 75482357 | 1223205 | 0 | 303663096 | 17337004107216 | 17337004062926 | 17337004394126 | 17337004396638 |
| 8 | 6 | void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd] | 0 | 0 | 17 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 16384 | 0x7fd82d309d80 | 0x7fd82ca240c0 | 164244 | 164244 | 14355 | 1313960 | 65536 | 83814164 | 1210572 | 0 | 336989396 | 17337004437537 | 17337004394126 | 17337004720047 | 17337004722629 |
| 9 | 7 | void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd] | 0 | 0 | 20 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 17088 | 0x7fd82d309c00 | 0x7fd82ca24100 | 163520 | 163520 | 15321 | 1308168 | 65536 | 108952179 | 1209222 | 0 | 437540372 | 17337004776258 | 17337004720047 | 17337005044847 | 17337005047161 |
| 10 | 8 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 23 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 17792 | 0x7fd82d309a80 | 0x7fd82ca24140 | 309752 | 309752 | 24321 | 2478024 | 65536 | 227731809 | 2373550 | 0 | 912656608 | 17337005086740 | 17337005044847 | 17337005472687 | 17337005475289 |
| 11 | 9 | void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd] | 0 | 0 | 26 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 18496 | 0x7fd82d309900 | 0x7fd82ca24180 | 306900 | 306900 | 21785 | 2455208 | 65536 | 212289745 | 2352134 | 0 | 850889160 | 17337005514718 | 17337005472687 | 17337005890128 | 17337005892378 |
| 12 | 10 | void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd] | 0 | 0 | 29 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19200 | 0x7fd82d309780 | 0x7fd82ca241c0 | 164269 | 164269 | 15314 | 1314160 | 65536 | 105018464 | 1213337 | 0 | 421797992 | 17337005932167 | 17337005890128 | 17337006228528 | 17337006230819 |
| 13 | 11 | void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd] | 0 | 0 | 32 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 19904 | 0x7fd82d309600 | 0x7fd82ca24200 | 164104 | 164104 | 15077 | 1312840 | 65536 | 90873259 | 1211255 | 0 | 365221340 | 17337006271498 | 17337006228528 | 17337006563248 | 17337006565680 |
| 14 | 12 | void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd] | 0 | 0 | 35 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 20608 | 0x7fd82f967480 | 0x7fd82ca24240 | 164520 | 164520 | 15196 | 1316168 | 65536 | 100796642 | 1214231 | 0 | 404912164 | 17337006615269 | 17337006563248 | 17337006889808 | 17337006892272 |
| 15 | 13 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 38 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 21312 | 0x7fd82f967300 | 0x7fd82ca24280 | 310572 | 310572 | 23177 | 2484584 | 65536 | 217756929 | 2379786 | 0 | 872756976 | 17337006936191 | 17337006889808 | 17337007323569 | 17337007325310 |
| 16 | 14 | void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd] | 0 | 0 | 41 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22016 | 0x7fd82f967180 | 0x7fd82ca242c0 | 311338 | 311338 | 23397 | 2490712 | 65536 | 225610696 | 2385262 | 0 | 904172836 | 17337007367859 | 17337007323569 | 17337007713649 | 17337007715570 |
| 17 | 15 | void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd] | 0 | 0 | 44 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 22720 | 0x7fd82f967000 | 0x7fd82ca24300 | 164824 | 164824 | 14470 | 1318600 | 65536 | 88551311 | 1215038 | 0 | 355937616 | 17337007756569 | 17337007713649 | 17337008015089 | 17337008017032 |
| 18 | 16 | void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd] | 0 | 0 | 47 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 23424 | 0x7fd82d309e80 | 0x7fd82ca24340 | 164576 | 164576 | 14456 | 1316616 | 65536 | 95864719 | 1213023 | 0 | 385188380 | 17337008058321 | 17337008015089 | 17337008314610 | 17337008316524 |
| 19 | 17 | void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd] | 0 | 0 | 50 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 24128 | 0x7fd82d309d00 | 0x7fd82ca24380 | 164278 | 164278 | 14142 | 1314232 | 65536 | 89726775 | 1212882 | 0 | 360630392 | 17337008363863 | 17337008314610 | 17337008613970 | 17337008615696 |
| 20 | 18 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 53 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 24832 | 0x7fd82d309b80 | 0x7fd82ca243c0 | 309116 | 309116 | 24656 | 2472936 | 65536 | 226573889 | 2368668 | 0 | 908026860 | 17337008661725 | 17337008613970 | 17337009011890 | 17337009013715 |
| 21 | 19 | void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd] | 0 | 0 | 56 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 25536 | 0x7fd82d309a00 | 0x7fd82ca24400 | 308246 | 308246 | 22807 | 2465976 | 65536 | 224042857 | 2363576 | 0 | 897904076 | 17337009055454 | 17337009011890 | 17337009398931 | 17337009400765 |
| 22 | 20 | void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd] | 0 | 0 | 59 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26240 | 0x7fd82d309880 | 0x7fd82ca24440 | 163240 | 163240 | 15157 | 1305928 | 65536 | 101391458 | 1207403 | 0 | 407295460 | 17337009441914 | 17337009398931 | 17337009696051 | 17337009698007 |
| 23 | 21 | void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd] | 0 | 0 | 62 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 26944 | 0x7fd82d309700 | 0x7fd82ca24480 | 162458 | 162458 | 14721 | 1299672 | 65536 | 95523238 | 1201395 | 0 | 383818856 | 17337009741446 | 17337009696051 | 17337009997651 | 17337009999679 |
| 24 | 22 | void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd] | 0 | 0 | 65 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 27648 | 0x7fd82f967580 | 0x7fd82ca244c0 | 163289 | 163289 | 14913 | 1306320 | 65536 | 101838004 | 1203685 | 0 | 409082792 | 17337010047668 | 17337009997651 | 17337010314291 | 17337010316311 |
| 25 | 23 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 68 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 28608 | 0x7fd82f967400 | 0x7fd82ca24500 | 308847 | 308847 | 23365 | 2470784 | 65536 | 223628497 | 2367976 | 0 | 896243272 | 17337010358800 | 17337010314291 | 17337010705492 | 17337010707231 |
| 26 | 24 | void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd] | 0 | 0 | 71 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 29312 | 0x7fd82f967280 | 0x7fd82ca24540 | 309134 | 309134 | 22315 | 2473080 | 65536 | 223991998 | 2372474 | 0 | 897696388 | 17337010751860 | 17337010705492 | 17337011102292 | 17337011104310 |
| 27 | 25 | void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd] | 0 | 0 | 74 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 30016 | 0x7fd82f967100 | 0x7fd82ca24580 | 162481 | 162481 | 14923 | 1299856 | 65536 | 101433849 | 1201007 | 0 | 407473732 | 17337011145349 | 17337011102292 | 17337011399892 | 17337011401662 |
| 28 | 26 | void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd] | 0 | 0 | 77 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 30976 | 0x7fd82d309f80 | 0x7fd82ca245c0 | 162364 | 162364 | 14787 | 1298920 | 65536 | 94301783 | 1197865 | 0 | 378938568 | 17337011444921 | 17337011399892 | 17337011699413 | 17337011701184 |
| 29 | 27 | void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd] | 0 | 0 | 80 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 31680 | 0x7fd82d309e00 | 0x7fd82ca24600 | 162903 | 162903 | 15161 | 1303232 | 65536 | 95583588 | 1201745 | 0 | 384057584 | 17337011749123 | 17337011699413 | 17337012000693 | 17337012002647 |
| 30 | 28 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 83 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 32640 | 0x7fd82d309c80 | 0x7fd82ca24640 | 304758 | 304758 | 22975 | 2438072 | 65536 | 218470212 | 2330304 | 0 | 875613384 | 17337012043175 | 17337012000693 | 17337012388693 | 17337012390606 |
| 31 | 29 | void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd] | 0 | 0 | 86 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 33600 | 0x7fd82d309b00 | 0x7fd82ca24680 | 307214 | 307214 | 22811 | 2457720 | 65536 | 222942854 | 2352816 | 0 | 893500140 | 17337012432615 | 17337012388693 | 17337012776533 | 17337012778546 |
| 32 | 30 | void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd] | 0 | 0 | 89 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 34560 | 0x7fd82d309980 | 0x7fd82ca246c0 | 163599 | 163599 | 14540 | 1308800 | 65536 | 93650497 | 1204070 | 0 | 376328484 | 17337012819785 | 17337012776533 | 17337013076534 | 17337013078458 |
| 33 | 31 | void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd] | 0 | 0 | 92 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 35520 | 0x7fd82d309800 | 0x7fd82ca24700 | 165400 | 165400 | 15150 | 1323208 | 65536 | 99056661 | 1218468 | 0 | 397953272 | 17337013119127 | 17337013076534 | 17337013378134 | 17337013379960 |
| 34 | 32 | void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd] | 0 | 0 | 95 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 36224 | 0x7fd82d309680 | 0x7fd82ca24740 | 162429 | 162429 | 14829 | 1299440 | 65536 | 105085246 | 1200527 | 0 | 422065152 | 17337013427909 | 17337013378134 | 17337013683894 | 17337013685742 |
| 35 | 33 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 98 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 37184 | 0x7fd82f967500 | 0x7fd82ca24780 | 305822 | 305822 | 23051 | 2446584 | 65536 | 227440963 | 2346688 | 0 | 911495768 | 17337013730861 | 17337013683894 | 17337014073975 | 17337014080352 |
| 36 | 34 | void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd] | 0 | 0 | 101 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 38144 | 0x7fd82f967380 | 0x7fd82ca247c0 | 304925 | 304925 | 22036 | 2439408 | 65536 | 211104352 | 2336457 | 0 | 846146860 | 17337014117191 | 17337014073975 | 17337014464855 | 17337014466702 |
| 37 | 35 | void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd] | 0 | 0 | 104 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 39104 | 0x7fd82f967200 | 0x7fd82ca24800 | 163498 | 163498 | 14976 | 1307992 | 65536 | 94031257 | 1205277 | 0 | 377856236 | 17337014508080 | 17337014464855 | 17337014769015 | 17337014770874 |
| 38 | 36 | void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd] | 0 | 0 | 107 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 40320 | 0x7fd82f967080 | 0x7fd82ca24840 | 163570 | 163570 | 14363 | 1308568 | 65536 | 82656895 | 1198605 | 0 | 332356092 | 17337014812582 | 17337014769015 | 17337015072215 | 17337015073985 |
| 39 | 37 | void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd] | 0 | 0 | 110 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 41280 | 0x7fd82d309f00 | 0x7fd82ca24880 | 162196 | 162196 | 14205 | 1297576 | 65536 | 91554096 | 1193631 | 0 | 367943356 | 17337015122274 | 17337015072215 | 17337015378616 | 17337015380447 |
| 40 | 38 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 113 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 42240 | 0x7fd82d309d80 | 0x7fd82ca248c0 | 306818 | 306818 | 24499 | 2454552 | 65536 | 226323797 | 2352739 | 0 | 907024980 | 17337015425716 | 17337015378616 | 17337015783576 | 17337015785437 |
| 41 | 39 | void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd] | 0 | 0 | 116 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 43200 | 0x7fd82d309c00 | 0x7fd82ca24900 | 303894 | 303894 | 21607 | 2431160 | 65536 | 217817045 | 2329512 | 0 | 873001080 | 17337015827216 | 17337015783576 | 17337016175576 | 17337016177336 |
| 42 | 40 | void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd] | 0 | 0 | 119 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 44160 | 0x7fd82d309a80 | 0x7fd82ca24940 | 163644 | 163644 | 14535 | 1309160 | 65536 | 91093357 | 1196528 | 0 | 366097244 | 17337016217685 | 17337016175576 | 17337016476377 | 17337016478218 |
| 43 | 41 | void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd] | 0 | 0 | 122 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 45376 | 0x7fd82d309900 | 0x7fd82ca24980 | 162483 | 162483 | 14937 | 1299872 | 65536 | 90736956 | 1199952 | 0 | 364677228 | 17337016519377 | 17337016476377 | 17337016776857 | 17337016778660 |
| 44 | 42 | void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd] | 0 | 0 | 125 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 46336 | 0x7fd82d309780 | 0x7fd82ca249c0 | 162029 | 162029 | 14648 | 1296240 | 65536 | 88772993 | 1192710 | 0 | 356820400 | 17337016828149 | 17337016776857 | 17337017085337 | 17337017087172 |
| 45 | 43 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 128 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 47552 | 0x7fd82d309600 | 0x7fd82ca24a00 | 302848 | 302848 | 23076 | 2422792 | 65536 | 222551257 | 2320331 | 0 | 891934188 | 17337017132541 | 17337017085337 | 17337017477017 | 17337017478842 |
| 46 | 44 | void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd] | 0 | 0 | 131 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 48512 | 0x7fd82f967480 | 0x7fd82ca24a40 | 301478 | 301478 | 20554 | 2411832 | 65536 | 207595801 | 2308082 | 0 | 832114616 | 17337017520511 | 17337017477017 | 17337017863578 | 17337017865441 |
| 47 | 45 | void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd] | 0 | 0 | 134 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 49472 | 0x7fd82f967300 | 0x7fd82ca24a80 | 161906 | 161906 | 14840 | 1295256 | 65536 | 86438911 | 1193758 | 0 | 347488548 | 17337017907000 | 17337017863578 | 17337018163898 | 17337018165734 |
| 48 | 46 | void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd] | 0 | 0 | 137 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 50688 | 0x7fd82f967180 | 0x7fd82ca24ac0 | 163770 | 163770 | 15848 | 1310168 | 65536 | 98222095 | 1204581 | 0 | 394622888 | 17337018207692 | 17337018163898 | 17337018472858 | 17337018474645 |
| 49 | 47 | void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd] | 0 | 0 | 140 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 51648 | 0x7fd82f967000 | 0x7fd82ca24b00 | 162290 | 162290 | 15343 | 1298328 | 65536 | 97504070 | 1193016 | 0 | 391751740 | 17337018523874 | 17337018472858 | 17337018780539 | 17337018782367 |
| 50 | 48 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 143 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 52864 | 0x7fd82d309e80 | 0x7fd82ca24b40 | 303572 | 303572 | 22978 | 2428584 | 65536 | 222801793 | 2327173 | 0 | 892936216 | 17337018824896 | 17337018780539 | 17337019166939 | 17337019168997 |
| 51 | 49 | void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd] | 0 | 0 | 146 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 54080 | 0x7fd82d309d00 | 0x7fd82ca24b80 | 302048 | 302048 | 20714 | 2416392 | 65536 | 211905892 | 2309905 | 0 | 849352620 | 17337019211426 | 17337019166939 | 17337019563579 | 17337019565546 |
| 52 | 50 | void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd] | 0 | 0 | 149 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 55296 | 0x7fd82d309b80 | 0x7fd82ca24bc0 | 162694 | 162694 | 14864 | 1301560 | 65536 | 93110556 | 1201660 | 0 | 374165440 | 17337019605945 | 17337019563579 | 17337019863739 | 17337019865518 |
| 53 | 51 | void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd] | 0 | 0 | 152 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 56768 | 0x7fd82d309a00 | 0x7fd82ca24c00 | 162734 | 162734 | 15656 | 1301880 | 65536 | 100638172 | 1201013 | 0 | 404290100 | 17337019906657 | 17337019863739 | 17337020166780 | 17337020168620 |
| 54 | 52 | void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd] | 0 | 0 | 155 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 57728 | 0x7fd82d309880 | 0x7fd82ca24c40 | 161192 | 161192 | 13912 | 1289544 | 65536 | 90769078 | 1189399 | 0 | 364803884 | 17337020216729 | 17337020166780 | 17337020474300 | 17337020476162 |
| 55 | 53 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 158 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 58944 | 0x7fd82d309700 | 0x7fd82ca24c80 | 304772 | 304772 | 23725 | 2438184 | 65536 | 224605906 | 2335262 | 0 | 900155968 | 17337020521971 | 17337020474300 | 17337020870140 | 17337020871872 |
| 56 | 54 | void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd] | 0 | 0 | 161 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 60160 | 0x7fd82f967580 | 0x7fd82ca24cc0 | 302277 | 302277 | 21377 | 2418224 | 65536 | 215369431 | 2317854 | 0 | 863205988 | 17337020913421 | 17337020870140 | 17337021261501 | 17337021263391 |
| 57 | 55 | void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd] | 0 | 0 | 164 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 61376 | 0x7fd82f967400 | 0x7fd82ca24d00 | 163044 | 163044 | 15300 | 1304360 | 65536 | 91620512 | 1201898 | 0 | 368219072 | 17337021305530 | 17337021261501 | 17337021561501 | 17337021563353 |
| 58 | 56 | void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd] | 0 | 0 | 167 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 62848 | 0x7fd82f967280 | 0x7fd82ca24d40 | 168501 | 168501 | 16629 | 1348016 | 65536 | 104915370 | 1248118 | 0 | 421397448 | 17337021603672 | 17337021561501 | 17337021873501 | 17337021875295 |
| 59 | 57 | void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd] | 0 | 0 | 170 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 63808 | 0x7fd82f967100 | 0x7fd82ca24d80 | 161910 | 161910 | 14501 | 1295288 | 65536 | 95085129 | 1196353 | 0 | 382067476 | 17337021924554 | 17337021873501 | 17337022178781 | 17337022180897 |
| 60 | 58 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 173 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 65024 | 0x7fd82d309f80 | 0x7fd82ca24dc0 | 300615 | 300615 | 22535 | 2404928 | 65536 | 219423034 | 2302767 | 0 | 879424272 | 17337022223296 | 17337022178781 | 17337022568222 | 17337022570037 |
| 61 | 59 | void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd] | 0 | 0 | 176 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 66240 | 0x7fd82d309e00 | 0x7fd82ca24e00 | 299591 | 299591 | 21081 | 2396736 | 65536 | 215335696 | 2294718 | 0 | 863079256 | 17337022611916 | 17337022568222 | 17337022955742 | 17337022957567 |
| 62 | 60 | void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd] | 0 | 0 | 179 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 67456 | 0x7fd82d309c80 | 0x7fd82ca24e40 | 162435 | 162435 | 14847 | 1299488 | 65536 | 88112052 | 1196839 | 0 | 354174672 | 17337022998706 | 17337022955742 | 17337023253982 | 17337023255879 |
| 63 | 61 | void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd] | 0 | 0 | 182 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 68928 | 0x7fd82d309b00 | 0x7fd82ca24e80 | 177389 | 177389 | 16675 | 1419120 | 65536 | 103855694 | 1312200 | 0 | 417164344 | 17337023298788 | 17337023253982 | 17337023564703 | 17337023566601 |
| 64 | 62 | void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd] | 0 | 0 | 185 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 70144 | 0x7fd82d309980 | 0x7fd82ca24ec0 | 160960 | 160960 | 14526 | 1287688 | 65536 | 89956241 | 1184798 | 0 | 361557568 | 17337023615049 | 17337023564703 | 17337023877503 | 17337023879282 |
| 65 | 63 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 188 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 71616 | 0x7fd82d309800 | 0x7fd82ca24f00 | 303489 | 303489 | 22943 | 2427920 | 65536 | 224323210 | 2327885 | 0 | 899025200 | 17337023921091 | 17337023877503 | 17337024270943 | 17337024272732 |
| 66 | 64 | void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd] | 0 | 0 | 191 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 72832 | 0x7fd82d309680 | 0x7fd82ca24f40 | 304010 | 304010 | 22821 | 2432088 | 65536 | 216945199 | 2325342 | 0 | 869510128 | 17337024316211 | 17337024270943 | 17337024660224 | 17337024662232 |
| 67 | 65 | void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd] | 0 | 0 | 194 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 74048 | 0x7fd82f967500 | 0x7fd82ca24f80 | 161081 | 161081 | 15457 | 1288656 | 65536 | 91084203 | 1185479 | 0 | 366073832 | 17337024703381 | 17337024660224 | 17337024957504 | 17337024959484 |
| 68 | 66 | void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd] | 0 | 0 | 197 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 75776 | 0x7fd82f967380 | 0x7fd82ca24fc0 | 182132 | 182132 | 17107 | 1457064 | 65536 | 112964296 | 1351736 | 0 | 453605464 | 17337024999973 | 17337024957504 | 17337025272224 | 17337025273976 |
| 69 | 67 | void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd] | 0 | 0 | 200 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 76992 | 0x7fd82f967200 | 0x7fd82ca25000 | 161346 | 161346 | 15091 | 1290776 | 65536 | 90042045 | 1188506 | 0 | 361898820 | 17337025333834 | 17337025272224 | 17337025572384 | 17337025574108 |
| 70 | 68 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 203 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 78464 | 0x7fd82f967080 | 0x7fd82ca25040 | 302364 | 302364 | 22961 | 2418920 | 65536 | 222340419 | 2317721 | 0 | 891099128 | 17337025616927 | 17337025572384 | 17337025962785 | 17337025964507 |
| 71 | 69 | void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd] | 0 | 0 | 206 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 79936 | 0x7fd82d309f00 | 0x7fd82ca25080 | 303882 | 303882 | 23962 | 2431064 | 65536 | 223674652 | 2328281 | 0 | 896424828 | 17337026007156 | 17337025962785 | 17337026372865 | 17337026374887 |
| 72 | 70 | void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd] | 0 | 0 | 209 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 81408 | 0x7fd82d309d80 | 0x7fd82ca250c0 | 163329 | 163329 | 16054 | 1306640 | 65536 | 91707059 | 1199606 | 0 | 368559584 | 17337026415735 | 17337026372865 | 17337026674945 | 17337026676909 |
| 73 | 71 | void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd] | 0 | 0 | 212 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 83136 | 0x7fd82d309c00 | 0x7fd82ca25100 | 192550 | 192550 | 19049 | 1540408 | 65536 | 120286082 | 1430340 | 0 | 482890056 | 17337026718337 | 17337026674945 | 17337026996386 | 17337026998140 |
| 74 | 72 | void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd] | 0 | 0 | 215 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 84352 | 0x7fd82d309a80 | 0x7fd82ca25140 | 161985 | 161985 | 14850 | 1295888 | 65536 | 91224294 | 1195907 | 0 | 366637640 | 17337027047229 | 17337026996386 | 17337027305506 | 17337027307282 |
| 75 | 73 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 218 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 85824 | 0x7fd82d309900 | 0x7fd82ca25180 | 303646 | 303646 | 23693 | 2429176 | 65536 | 222142521 | 2325982 | 0 | 890304288 | 17337027353161 | 17337027305506 | 17337027697666 | 17337027699651 |
| 76 | 74 | void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd] | 0 | 0 | 221 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 87296 | 0x7fd82d309780 | 0x7fd82ca251c0 | 299061 | 299061 | 21865 | 2392496 | 65536 | 212949440 | 2292344 | 0 | 853527488 | 17337027741570 | 17337027697666 | 17337028082466 | 17337028084231 |
| 77 | 75 | void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd] | 0 | 0 | 224 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 88768 | 0x7fd82d309600 | 0x7fd82ca25200 | 162098 | 162098 | 15440 | 1296792 | 65536 | 95754401 | 1193585 | 0 | 384746440 | 17337028125630 | 17337028082466 | 17337028382947 | 17337028384713 |
| 78 | 76 | void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd] | 0 | 0 | 227 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 90752 | 0x7fd82f967480 | 0x7fd82ca25240 | 199963 | 199963 | 17941 | 1599712 | 65536 | 136381314 | 1498163 | 0 | 547267880 | 17337028424482 | 17337028382947 | 17337028714627 | 17337028716504 |
| 79 | 77 | void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd] | 0 | 0 | 230 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 91968 | 0x7fd82f967300 | 0x7fd82ca25280 | 161712 | 161712 | 15684 | 1293704 | 65536 | 93172581 | 1188627 | 0 | 374420488 | 17337028764493 | 17337028714627 | 17337029022307 | 17337029024056 |
| 80 | 78 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 233 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 93440 | 0x7fd82f967180 | 0x7fd82ca252c0 | 302068 | 302068 | 22448 | 2416552 | 65536 | 218247413 | 2313291 | 0 | 874721316 | 17337029069825 | 17337029022307 | 17337029414308 | 17337029416046 |
| 81 | 79 | void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd] | 0 | 0 | 236 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 94912 | 0x7fd82f967000 | 0x7fd82ca25300 | 298620 | 298620 | 20927 | 2388968 | 65536 | 206933402 | 2283268 | 0 | 829469632 | 17337029457735 | 17337029414308 | 17337029800068 | 17337029801806 |
| 82 | 80 | void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd] | 0 | 0 | 239 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 96384 | 0x7fd82d309e80 | 0x7fd82ca25340 | 162202 | 162202 | 15799 | 1297624 | 65536 | 99209684 | 1195000 | 0 | 398569312 | 17337029842395 | 17337029800068 | 17337030101988 | 17337030103778 |
| 83 | 81 | void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd] | 0 | 0 | 242 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 98368 | 0x7fd82d309d00 | 0x7fd82ca25380 | 210720 | 210720 | 18562 | 1685768 | 65536 | 125454908 | 1573296 | 0 | 503566024 | 17337030146047 | 17337030101988 | 17337030438308 | 17337030440199 |
| 84 | 82 | void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd] | 0 | 0 | 245 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 99584 | 0x7fd82d309b80 | 0x7fd82ca253c0 | 161332 | 161332 | 14735 | 1290664 | 65536 | 92411698 | 1190133 | 0 | 371376612 | 17337030488837 | 17337030438308 | 17337030745509 | 17337030747391 |
| 85 | 83 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 248 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 101312 | 0x7fd82d309a00 | 0x7fd82ca25400 | 299832 | 299832 | 22685 | 2398664 | 65536 | 216791270 | 2293449 | 0 | 868903240 | 17337030788230 | 17337030745509 | 17337031143749 | 17337031145500 |
| 86 | 84 | void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd] | 0 | 0 | 251 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 102784 | 0x7fd82d309880 | 0x7fd82ca25440 | 299482 | 299482 | 20135 | 2395864 | 65536 | 198570511 | 2289874 | 0 | 796016096 | 17337031187119 | 17337031143749 | 17337031530949 | 17337031532750 |
| 87 | 85 | void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd] | 0 | 0 | 254 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 104256 | 0x7fd82d309700 | 0x7fd82ca25480 | 162795 | 162795 | 15949 | 1302368 | 65536 | 99872383 | 1199561 | 0 | 401229416 | 17337031573989 | 17337031530949 | 17337031832710 | 17337031834472 |
| 88 | 86 | void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd] | 0 | 0 | 257 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 106240 | 0x7fd82f967580 | 0x7fd82ca254c0 | 218292 | 218292 | 19127 | 1746344 | 65536 | 146570341 | 1638670 | 0 | 588026604 | 17337031875861 | 17337031832710 | 17337032169510 | 17337032171363 |
| 89 | 87 | void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd] | 0 | 0 | 260 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 107712 | 0x7fd82f967400 | 0x7fd82ca25500 | 160426 | 160426 | 14979 | 1283416 | 65536 | 93530345 | 1183952 | 0 | 375857048 | 17337032219602 | 17337032169510 | 17337032478470 | 17337032480305 |
| 90 | 88 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 263 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 109440 | 0x7fd82f967280 | 0x7fd82ca25540 | 297329 | 297329 | 21579 | 2378640 | 65536 | 216206085 | 2276612 | 0 | 866559432 | 17337032526413 | 17337032478470 | 17337032885191 | 17337032887014 |
| 91 | 89 | void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd] | 0 | 0 | 266 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 111168 | 0x7fd82f967100 | 0x7fd82ca25580 | 300111 | 300111 | 22158 | 2400896 | 65536 | 213278096 | 2297541 | 0 | 854845932 | 17337032929153 | 17337032885191 | 17337033280551 | 17337033282333 |
| 92 | 90 | void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd] | 0 | 0 | 269 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 112896 | 0x7fd82d309f80 | 0x7fd82ca255c0 | 162161 | 162161 | 15328 | 1297296 | 65536 | 100116606 | 1195615 | 0 | 402200944 | 17337033323722 | 17337033280551 | 17337033590791 | 17337033592435 |
| 93 | 91 | void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd] | 0 | 0 | 272 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 115136 | 0x7fd82d309e00 | 0x7fd82ca25600 | 229728 | 229728 | 19605 | 1837832 | 65536 | 154369399 | 1727662 | 0 | 619219308 | 17337033634024 | 17337033590791 | 17337033938151 | 17337033940056 |
| 94 | 92 | void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd] | 0 | 0 | 275 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 116608 | 0x7fd82d309c80 | 0x7fd82ca25640 | 160689 | 160689 | 15185 | 1285520 | 65536 | 95826579 | 1185088 | 0 | 385037424 | 17337033988585 | 17337033938151 | 17337034252872 | 17337034254758 |
| 95 | 93 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 278 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 118336 | 0x7fd82d309b00 | 0x7fd82ca25680 | 296520 | 296520 | 21534 | 2372168 | 65536 | 212329594 | 2272483 | 0 | 851057124 | 17337034297357 | 17337034252872 | 17337034641032 | 17337034642937 |
| 96 | 94 | void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd] | 0 | 0 | 281 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 16 | 24 | 120064 | 0x7fd82d309980 | 0x7fd82ca256c0 | 297461 | 297461 | 20149 | 2379696 | 65536 | 205350983 | 2272226 | 0 | 823141268 | 17337034684526 | 17337034641032 | 17337035026952 | 17337035028717 |
| 97 | 95 | void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd] | 0 | 0 | 284 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 121792 | 0x7fd82d309800 | 0x7fd82ca25700 | 163779 | 163779 | 15837 | 1310240 | 65536 | 102993514 | 1210209 | 0 | 413708592 | 17337035070656 | 17337035026952 | 17337035328873 | 17337035330769 |
| 98 | 96 | void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd] | 0 | 0 | 287 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 124032 | 0x7fd82d309680 | 0x7fd82ca25740 | 240493 | 240493 | 20044 | 1923952 | 65536 | 145199972 | 1811956 | 0 | 582553392 | 17337035372168 | 17337035328873 | 17337035683913 | 17337035685910 |
| 99 | 97 | void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd] | 0 | 0 | 290 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 125504 | 0x7fd82f967500 | 0x7fd82ca25780 | 160778 | 160778 | 15502 | 1286232 | 65536 | 94007087 | 1184855 | 0 | 377763316 | 17337035734339 | 17337035683913 | 17337035987433 | 17337035989192 |
| 100 | 98 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 293 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 127488 | 0x7fd82f967380 | 0x7fd82ca257c0 | 298738 | 298738 | 21219 | 2389912 | 65536 | 212170970 | 2280238 | 0 | 850415716 | 17337036034181 | 17337035987433 | 17337036381514 | 17337036383392 |
| 101 | 99 | void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd] | 0 | 0 | 296 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 129216 | 0x7fd82f967200 | 0x7fd82ca25800 | 298224 | 298224 | 20826 | 2385800 | 65536 | 204868864 | 2277808 | 0 | 821212684 | 17337036424940 | 17337036381514 | 17337036773514 | 17337036775361 |
| 102 | 100 | void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd] | 0 | 0 | 299 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 130944 | 0x7fd82f967080 | 0x7fd82ca25840 | 172244 | 172244 | 16884 | 1377960 | 65536 | 98761040 | 1273275 | 0 | 396797224 | 17337036815910 | 17337036773514 | 17337037082474 | 17337037084473 |
| 103 | 101 | void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd] | 0 | 0 | 302 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 133440 | 0x7fd82d309f00 | 0x7fd82ca25880 | 259098 | 259098 | 21641 | 2072792 | 65536 | 175838423 | 1959099 | 0 | 705105368 | 17337037126152 | 17337037082474 | 17337037446154 | 17337037447924 |
| 104 | 102 | void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd] | 0 | 0 | 305 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 134912 | 0x7fd82d309d80 | 0x7fd82ca258c0 | 161876 | 161876 | 15984 | 1295016 | 65536 | 98032199 | 1192694 | 0 | 393861844 | 17337037496742 | 17337037446154 | 17337037754155 | 17337037755945 |
| 105 | 103 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 308 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 136896 | 0x7fd82d309c00 | 0x7fd82ca25900 | 296556 | 296556 | 19378 | 2372456 | 65536 | 195577089 | 2263607 | 0 | 784053672 | 17337037796794 | 17337037754155 | 17337038148075 | 17337038150015 |
| 106 | 104 | void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd] | 0 | 0 | 311 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 138880 | 0x7fd82d309a80 | 0x7fd82ca25940 | 296880 | 296880 | 21199 | 2375048 | 65536 | 212994959 | 2274603 | 0 | 853722248 | 17337038193834 | 17337038148075 | 17337038541995 | 17337038543785 |
| 107 | 105 | void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd] | 0 | 0 | 314 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 140864 | 0x7fd82d309900 | 0x7fd82ca25980 | 177442 | 177442 | 16434 | 1419544 | 65536 | 113628579 | 1316889 | 0 | 456256068 | 17337038583963 | 17337038541995 | 17337038854796 | 17337038856656 |
| 108 | 106 | void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd] | 0 | 0 | 317 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 143616 | 0x7fd82d309780 | 0x7fd82ca259c0 | 279168 | 279168 | 21900 | 2233352 | 65536 | 194272020 | 2128629 | 0 | 778837168 | 17337038898125 | 17337038854796 | 17337039232716 | 17337039234646 |
| 109 | 107 | void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd] | 0 | 0 | 320 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 145344 | 0x7fd82d309600 | 0x7fd82ca25a00 | 161504 | 161504 | 15904 | 1292040 | 65536 | 98921559 | 1189540 | 0 | 397428332 | 17337039284065 | 17337039232716 | 17337039541836 | 17337039543658 |
| 110 | 108 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 323 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 147584 | 0x7fd82f967480 | 0x7fd82ca25a40 | 296217 | 296217 | 21112 | 2369744 | 65536 | 208925383 | 2266798 | 0 | 837445108 | 17337039585727 | 17337039541836 | 17337039931757 | 17337039933558 |
| 111 | 109 | void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd] | 0 | 0 | 326 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 149568 | 0x7fd82f967300 | 0x7fd82ca25a80 | 296482 | 296482 | 20791 | 2371864 | 65536 | 202118037 | 2263273 | 0 | 810213816 | 17337039975607 | 17337039931757 | 17337040321037 | 17337040322777 |
| 112 | 110 | void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd] | 0 | 0 | 329 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 151552 | 0x7fd82f967180 | 0x7fd82ca25ac0 | 186729 | 186729 | 17690 | 1493840 | 65536 | 114633448 | 1387157 | 0 | 460294272 | 17337040363716 | 17337040321037 | 17337040645357 | 17337040647149 |
| 113 | 111 | void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd] | 0 | 0 | 332 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 154304 | 0x7fd82f967000 | 0x7fd82ca25b00 | 298546 | 298546 | 23505 | 2388376 | 65536 | 213281956 | 2282208 | 0 | 854875548 | 17337040688328 | 17337040645357 | 17337041037357 | 17337041039128 |
| 114 | 112 | void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd] | 0 | 0 | 335 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 156288 | 0x7fd82d309e80 | 0x7fd82ca25b40 | 171087 | 171087 | 16057 | 1368704 | 65536 | 106385284 | 1267172 | 0 | 427289536 | 17337041087747 | 17337041037357 | 17337041345678 | 17337041347570 |
| 115 | 113 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 338 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 158784 | 0x7fd82d309d00 | 0x7fd82ca25b80 | 297534 | 297534 | 19626 | 2380280 | 65536 | 179565447 | 2257136 | 0 | 720012352 | 17337041388669 | 17337041345678 | 17337041736878 | 17337041738720 |
| 116 | 114 | void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd] | 0 | 0 | 341 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 161024 | 0x7fd82d309b80 | 0x7fd82ca25bc0 | 296467 | 296467 | 19699 | 2371744 | 65536 | 190973641 | 2254681 | 0 | 765645740 | 17337041780859 | 17337041736878 | 17337042125998 | 17337042128080 |
| 117 | 115 | void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd] | 0 | 0 | 344 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 163264 | 0x7fd82d309a00 | 0x7fd82ca25c00 | 206082 | 206082 | 18276 | 1648664 | 65536 | 128364125 | 1541605 | 0 | 515212684 | 17337042169238 | 17337042125998 | 17337042459599 | 17337042461351 |
| 118 | 116 | void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd] | 0 | 0 | 347 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 166528 | 0x7fd82d309880 | 0x7fd82ca25c40 | 339502 | 339502 | 25581 | 2716024 | 65536 | 249324343 | 2609588 | 0 | 999052644 | 17337042502230 | 17337042459599 | 17337042873039 | 17337042895879 |
| 119 | 117 | void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd] | 0 | 0 | 350 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 168512 | 0x7fd82d309700 | 0x7fd82ca25c80 | 184338 | 184338 | 17247 | 1474712 | 65536 | 109973636 | 1365308 | 0 | 441643172 | 17337042924208 | 17337042873039 | 17337043199439 | 17337043201231 |
| 120 | 118 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 353 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 171264 | 0x7fd82f967580 | 0x7fd82ca25cc0 | 295804 | 295804 | 19790 | 2366440 | 65536 | 193474938 | 2252639 | 0 | 775659176 | 17337043241130 | 17337043199439 | 17337043590160 | 17337043592011 |
| 121 | 119 | void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd] | 0 | 0 | 356 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 173760 | 0x7fd82f967400 | 0x7fd82ca25d00 | 300036 | 300036 | 21253 | 2400296 | 65536 | 160848147 | 2260601 | 0 | 645141000 | 17337043633880 | 17337043590160 | 17337043982960 | 17337043984760 |
| 122 | 120 | void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd] | 0 | 0 | 359 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 176256 | 0x7fd82f967280 | 0x7fd82ca25d40 | 224412 | 224412 | 19280 | 1795304 | 65536 | 151945219 | 1689248 | 0 | 609535260 | 17337044025729 | 17337043982960 | 17337044326320 | 17337044328101 |
| 123 | 121 | void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd] | 0 | 0 | 362 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 179776 | 0x7fd82f967100 | 0x7fd82ca25d80 | 380221 | 380221 | 27373 | 3041776 | 65536 | 275738631 | 2933195 | 0 | 1104712716 | 17337044369710 | 17337044326320 | 17337044765521 | 17337044788499 |
| 124 | 122 | void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd] | 0 | 0 | 365 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 182272 | 0x7fd82d309f80 | 0x7fd82ca25dc0 | 210188 | 210188 | 18565 | 1681512 | 65536 | 138892718 | 1577681 | 0 | 557323716 | 17337044817348 | 17337044765521 | 17337045107761 | 17337045109520 |
| 125 | 123 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 368 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 185536 | 0x7fd82d309e00 | 0x7fd82ca25e00 | 306416 | 306416 | 21806 | 2451336 | 65536 | 194360870 | 2333074 | 0 | 779213444 | 17337045150639 | 17337045107761 | 17337045509681 | 17337045527369 |
| 126 | 124 | void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd] | 0 | 0 | 371 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 188544 | 0x7fd82d309c80 | 0x7fd82ca25e40 | 308703 | 308703 | 23728 | 2469632 | 65536 | 176856772 | 2327592 | 0 | 709184912 | 17337045551979 | 17337045509681 | 17337045923762 | 17337045940788 |
| 127 | 125 | void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd] | 0 | 0 | 374 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 191552 | 0x7fd82d309b00 | 0x7fd82ca25e80 | 265751 | 265751 | 21485 | 2126016 | 65536 | 181467858 | 2017703 | 0 | 727626412 | 17337045966388 | 17337045923762 | 17337046305362 | 17337046307449 |
| 128 | 126 | void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd] | 0 | 0 | 377 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 195840 | 0x7fd82d309980 | 0x7fd82ca25ec0 | 460661 | 460661 | 31378 | 3685296 | 65536 | 345444180 | 3575583 | 0 | 1383537328 | 17337046348568 | 17337046305362 | 17337046802642 | 17337046849304 |
| 129 | 127 | void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd] | 0 | 0 | 380 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 198592 | 0x7fd82d309800 | 0x7fd82ca25f00 | 244443 | 244443 | 20672 | 1955552 | 65536 | 150767904 | 1845393 | 0 | 604825892 | 17337046869244 | 17337046802642 | 17337047186963 | 17337047188815 |
| 130 | 128 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 383 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 202368 | 0x7fd82d309680 | 0x7fd82ca25f40 | 333855 | 333855 | 23187 | 2670848 | 65536 | 209231940 | 2559686 | 0 | 838706072 | 17337047230284 | 17337047186963 | 17337047603763 | 17337047646553 |
| 131 | 129 | void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd] | 0 | 0 | 386 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 205888 | 0x7fd82f967500 | 0x7fd82ca25f80 | 332359 | 332359 | 23473 | 2658880 | 65536 | 212872480 | 2533945 | 0 | 853264440 | 17337047658103 | 17337047603763 | 17337048039763 | 17337048081922 |
| 132 | 130 | void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd] | 0 | 0 | 389 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 209408 | 0x7fd82f967380 | 0x7fd82ca25fc0 | 307001 | 307001 | 23442 | 2456016 | 65536 | 218559255 | 2347929 | 0 | 876002736 | 17337048093311 | 17337048039763 | 17337048462964 | 17337048464812 |
| 133 | 131 | void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd] | 0 | 0 | 392 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 214464 | 0x7fd82f967200 | 0x7fd82ca26000 | 542521 | 542521 | 35763 | 4340176 | 65536 | 405951308 | 4227371 | 0 | 1625572020 | 17337048506430 | 17337048462964 | 17337049008244 | 17337049050876 |
| 134 | 132 | void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd] | 0 | 0 | 395 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 217728 | 0x7fd82f967080 | 0x7fd82ca26040 | 272707 | 272707 | 21607 | 2181664 | 65536 | 185023892 | 2072875 | 0 | 741863132 | 17337049070755 | 17337049008244 | 17337049402165 | 17337049403987 |
| 135 | 133 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 398 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 222016 | 0x7fd82d309f00 | 0x7fd82ca26080 | 368177 | 368177 | 26299 | 2945424 | 65536 | 237132228 | 2811416 | 0 | 950318436 | 17337049445596 | 17337049402165 | 17337049840245 | 17337049859205 |
| 136 | 134 | void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd] | 0 | 0 | 401 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 226048 | 0x7fd82d309d80 | 0x7fd82ca260c0 | 366428 | 366428 | 28392 | 2931432 | 65536 | 252300495 | 2821601 | 0 | 1010974364 | 17337049883374 | 17337049840245 | 17337050282645 | 17337050327402 |
| 137 | 135 | void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd] | 0 | 0 | 404 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 230080 | 0x7fd82d309c00 | 0x7fd82ca26100 | 346549 | 346549 | 25479 | 2772400 | 65536 | 251252851 | 2664107 | 0 | 1006774452 | 17337050339012 | 17337050282645 | 17337050729686 | 17337050777020 |
| 138 | 136 | void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd] | 0 | 0 | 407 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 235904 | 0x7fd82d309a80 | 0x7fd82ca26140 | 622869 | 622869 | 39757 | 4982960 | 65536 | 481323659 | 4875232 | 0 | 1927063996 | 17337050788350 | 17337050729686 | 17337051350646 | 17337051392774 |
| 139 | 137 | void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd] | 0 | 0 | 410 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 239424 | 0x7fd82d309900 | 0x7fd82ca26180 | 302052 | 302052 | 23086 | 2416424 | 65536 | 215565145 | 2311375 | 0 | 864028740 | 17337051412494 | 17337051350646 | 17337051771927 | 17337051773864 |
| 140 | 138 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 413 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 244224 | 0x7fd82d309780 | 0x7fd82ca261c0 | 397739 | 397739 | 27108 | 3181920 | 65536 | 270675263 | 3067015 | 0 | 1084487764 | 17337051814903 | 17337051771927 | 17337052233047 | 17337052275251 |
| 141 | 139 | void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd] | 0 | 0 | 416 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 248768 | 0x7fd82d309600 | 0x7fd82ca26200 | 390233 | 390233 | 27534 | 3121872 | 65536 | 292916837 | 3021631 | 0 | 1173439360 | 17337052287511 | 17337052233047 | 17337052709047 | 17337052751328 |
| 142 | 140 | void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd] | 0 | 0 | 419 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 253312 | 0x7fd82f967480 | 0x7fd82ca26240 | 387400 | 387400 | 27667 | 3099208 | 65536 | 287073935 | 2989206 | 0 | 1150063012 | 17337052761948 | 17337052709047 | 17337053174008 | 17337053216056 |
| 143 | 141 | void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd] | 0 | 0 | 422 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 255552 | 0x7fd82f967300 | 0x7fd82ca26280 | 717899 | 717899 | 45047 | 5743200 | 65536 | 535892136 | 5631478 | 0 | 2145308528 | 17337053228136 | 17337053174008 | 17337053856248 | 17337053898438 |
| 144 | 142 | void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd] | 0 | 0 | 425 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 259840 | 0x7fd82f967180 | 0x7fd82ca262c0 | 364808 | 364808 | 26673 | 2918472 | 65536 | 253243388 | 2801901 | 0 | 1014741844 | 17337053918798 | 17337053856248 | 17337054319609 | 17337054367006 |
| 145 | 143 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 428 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 265664 | 0x7fd82f967000 | 0x7fd82ca26300 | 470581 | 470581 | 31514 | 3764656 | 65536 | 362033016 | 3662600 | 0 | 1449928416 | 17337054379255 | 17337054319609 | 17337054857529 | 17337054900672 |
| 146 | 144 | void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd] | 0 | 0 | 431 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 271232 | 0x7fd82d309e80 | 0x7fd82ca26340 | 471380 | 471380 | 31685 | 3771048 | 65536 | 349796189 | 3663494 | 0 | 1400967620 | 17337054912751 | 17337054857529 | 17337055392570 | 17337055435027 |
| 147 | 145 | void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd] | 0 | 0 | 434 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 273216 | 0x7fd82d309d00 | 0x7fd82ca26380 | 482913 | 482913 | 32906 | 3863312 | 65536 | 353899027 | 3752868 | 0 | 1417338456 | 17337055446107 | 17337055392570 | 17337055918330 | 17337055960303 |
| 148 | 146 | void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd] | 0 | 0 | 437 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 275712 | 0x7fd82d309b80 | 0x7fd82ca263c0 | 880720 | 880720 | 52221 | 7045768 | 65536 | 682194004 | 6929705 | 0 | 2730518224 | 17337055971233 | 17337055918330 | 17337056704731 | 17337056746793 |
| 149 | 147 | void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd] | 0 | 0 | 440 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 280768 | 0x7fd82d309a00 | 0x7fd82ca26400 | 426482 | 426482 | 29571 | 3411864 | 65536 | 318161885 | 3306076 | 0 | 1274419496 | 17337056767122 | 17337056704731 | 17337057198971 | 17337057241030 |
| 150 | 148 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 443 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 287616 | 0x7fd82d309880 | 0x7fd82ca26440 | 549292 | 549292 | 35606 | 4394344 | 65536 | 409845852 | 4290206 | 0 | 1641169856 | 17337057252279 | 17337057198971 | 17337057780572 | 17337057822754 |
| 151 | 149 | void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd] | 0 | 0 | 446 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 294208 | 0x7fd82d309700 | 0x7fd82ca26480 | 550980 | 550980 | 35662 | 4407848 | 65536 | 416569573 | 4307236 | 0 | 1668061732 | 17337057834154 | 17337057780572 | 17337058361212 | 17337058407179 |
| 152 | 150 | void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd] | 0 | 0 | 449 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 296960 | 0x7fd82f967580 | 0x7fd82ca264c0 | 562741 | 562741 | 36185 | 4501936 | 65536 | 420237542 | 4390110 | 0 | 1682693988 | 17337058418688 | 17337058361212 | 17337058945533 | 17337058989683 |
| 153 | 151 | void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd] | 0 | 0 | 452 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 299968 | 0x7fd82f967400 | 0x7fd82ca26500 | 1040990 | 1040990 | 60593 | 8327928 | 65536 | 803575607 | 8221628 | 0 | 3216044224 | 17337059000523 | 17337058945533 | 17337059842653 | 17337059885359 |
| 154 | 152 | void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd] | 0 | 0 | 455 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 302720 | 0x7fd82f967280 | 0x7fd82ca26540 | 721745 | 721745 | 44421 | 5773968 | 65536 | 549771030 | 5657079 | 0 | 2200826464 | 17337059905009 | 17337059842431 | 17337060522271 | 17337060568501 |
| 155 | 153 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 458 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 305472 | 0x7fd82f967100 | 0x7fd82ca26580 | 723836 | 723836 | 44515 | 5790696 | 65536 | 551104972 | 5674828 | 0 | 2206161396 | 17337060580371 | 17337060522271 | 17337061218431 | 17337061260333 |
| 156 | 154 | void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd] | 0 | 0 | 461 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 308224 | 0x7fd82d309f80 | 0x7fd82ca265c0 | 721540 | 721540 | 44529 | 5772328 | 65536 | 553576258 | 5663501 | 0 | 2216044352 | 17337061272203 | 17337061218431 | 17337061904511 | 17337061924115 |
| 157 | 155 | void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd] | 0 | 0 | 464 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 310976 | 0x7fd82d309e00 | 0x7fd82ca26600 | 727405 | 727405 | 44861 | 5819248 | 65536 | 559877641 | 5702213 | 0 | 2241253588 | 17337061947785 | 17337061904511 | 17337062569471 | 17337062614547 |
| 158 | 156 | void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd] | 0 | 0 | 467 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 313216 | 0x7fd82d309c80 | 0x7fd82ca26640 | 1366235 | 1366235 | 77561 | 10929888 | 65536 | 1074480432 | 10814454 | 0 | 4299663440 | 17337062625887 | 17337062569471 | 17337063670112 | 17337063713838 |
| 159 | 157 | void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd] | 0 | 0 | 470 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 315968 | 0x7fd82d309b00 | 0x7fd82ca26680 | 1370735 | 1370735 | 77153 | 10965888 | 65536 | 1082890376 | 10848789 | 0 | 4333303572 | 17337063734168 | 17337063670112 | 17337064756992 | 17337064820179 |
| 160 | 158 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 473 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 318720 | 0x7fd82d309980 | 0x7fd82ca266c0 | 1372857 | 1372857 | 77599 | 10982864 | 65536 | 1073340523 | 10859451 | 0 | 4295103468 | 17337064832379 | 17337064756992 | 17337065890593 | 17337065959469 |
| 161 | 159 | void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd] | 0 | 0 | 476 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 321472 | 0x7fd82d309800 | 0x7fd82ca26700 | 1371715 | 1371715 | 76807 | 10973728 | 65536 | 1073266930 | 10853171 | 0 | 4294808500 | 17337065971569 | 17337065890593 | 17337067034113 | 17337067102299 |
| 162 | 160 | void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd] | 0 | 0 | 479 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 324224 | 0x7fd82d309680 | 0x7fd82ca26740 | 1374977 | 1374977 | 77550 | 10999824 | 65536 | 1086088670 | 10883976 | 0 | 4346097280 | 17337067113978 | 17337067034113 | 17337068168194 | 17337068234969 |
| 163 | 161 | void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd] | 0 | 0 | 482 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 326464 | 0x7fd82f967500 | 0x7fd82ca26780 | 2665471 | 2665471 | 143127 | 21323776 | 65536 | 2129827555 | 21184877 | 0 | 8521052912 | 17337068246338 | 17337068168194 | 17337070135234 | 17337070207106 |
| 164 | 162 | void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd] | 0 | 0 | 485 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 329216 | 0x7fd82f967380 | 0x7fd82ca267c0 | 2667157 | 2667157 | 142329 | 21337264 | 65536 | 2131358619 | 21224403 | 0 | 8527175480 | 17337070227226 | 17337070135234 | 17337072078595 | 17337072147155 |
| 165 | 163 | void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd] | 0 | 0 | 488 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 331968 | 0x7fd82f967200 | 0x7fd82ca26800 | 2671372 | 2671372 | 143212 | 21370984 | 65536 | 2133705692 | 21245221 | 0 | 8536563764 | 17337072159255 | 17337072078595 | 17337074075076 | 17337074125643 |
| 166 | 164 | void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd] | 0 | 0 | 491 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 12 | 24 | 334720 | 0x7fd82f967080 | 0x7fd82ca26840 | 2667694 | 2667694 | 142298 | 21341560 | 65536 | 2121038226 | 21230772 | 0 | 8485893444 | 17337074138472 | 17337074075076 | 17337076057157 | 17337076127140 |
| 167 | 165 | void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd] | 0 | 0 | 494 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 337472 | 0x7fd82d309f00 | 0x7fd82ca26880 | 2674254 | 2674254 | 143132 | 21394040 | 65536 | 2127418593 | 21263359 | 0 | 8511416164 | 17337076138619 | 17337076057157 | 17337078006118 | 17337078073789 |
| 168 | 166 | void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd] | 0 | 0 | 497 | 206513 | 206513 | 4194304 | 256 | 0 | 0 | 8 | 24 | 0 | 0x7fd82d309d80 | 0x7fd82ca268c0 | 5255694 | 5255694 | 273670 | 42045560 | 65536 | 4232847212 | 41928878 | 0 | 16933130288 | 17337078099068 | 17337078006118 | 17337081650919 | 17337081719282 |