Files
rocm-systems/tests/workloads/dev1/mi200/timestamps.csv
T
colramos-amd 62d130b458 Initial commit
2022-11-04 14:49:36 -05:00

37 KiB

1IndexKernelNamegpu-idqueue-idqueue-indexpidtidgrdwgrldsscrvgprsgprfbarsigobjDispatchNsBeginNsEndNsCompleteNs
20__amd_rocclr_fillBufferAligned.kd000231318231318335544322560043241600x00x7ff759c0428017724136167316177241361927871772413643086717724136522737
31void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd]00223131823131832768256001224138880x00x7ff759c23f8017724141183450177241411987131772414121215317724141230479
42void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd]0052313182313184194304256001224143360x7ff75cbbb3800x7ff759c23fc017724141234519177241412791931772414137167317724141373895
53void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0082313182313184194304256001624150400x7ff75cbbb2000x7ff759c2400017724141393985177241414039931772414158287417724141585140
64void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd]00112313182313184194304256001624154880x7ff75cbbb0800x7ff759c2404017724141600090177241416086341772414178815417724141790255
75void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd]00142313182313184194304256001224159360x7ff75a58bf000x7ff759c2408017724141804155177241418124741772414190607417724141908042
86void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd]00172313182313184194304256001224163840x7ff75a58bd800x7ff759c240c017724141923002177241419313541772414202335417724142025449
97void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd]00202313182313184194304256001224170880x7ff75a58bc000x7ff759c2410017724142051688177241420627141772414215439417724142156686
108void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00232313182313184194304256001624177920x7ff75a58ba800x7ff759c2414017724142174215177241421836741772414236351517724142365551
119void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd]00262313182313184194304256001624184960x7ff75a58b9000x7ff759c2418017724142384120177241424091151772414258879517724142591095
1210void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd]00292313182313184194304256001624192000x7ff75a58b7800x7ff759c241c017724142606494177241426150351772414270879517724142711072
1311void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd]00322313182313184194304256001624199040x7ff75a58b6000x7ff759c2420017724142729691177241427414351772414283519517724142837249
1412void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd]00352313182313184194304256001224206080x7ff75cbbb4800x7ff759c2424017724142861318177241428847951772414297855617724142980695
1513void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00382313182313184194304256001624213120x7ff75cbbb3000x7ff759c2428017724143006234177241430169561772414319535617724143197400
1614void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd]00412313182313184194304256001624220160x7ff75cbbb1800x7ff759c242c017724143212209177241432214361772414340143617724143403494
1715void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd]00442313182313184194304256001624227200x7ff75cbbb0000x7ff759c2430017724143417434177241434263961772414351951617724143521671
1816void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd]00472313182313184194304256001224234240x7ff75a58be800x7ff759c2434017724143542411177241435518361772414364463617724143646728
1917void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd]00502313182313184194304256001224241280x7ff75a58bd000x7ff759c2438017724143668188177241436785571772414377167717724143773745
2018void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00532313182313184194304256001624248320x7ff75a58bb800x7ff759c243c017724143792885177241438035171772414398239717724143984630
2119void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd]00562313182313184194304256001624255360x7ff75a58ba000x7ff759c2440017724144008809177241440185571772414419919717724144201264
2220void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd]00592313182313184194304256001224262400x7ff75a58b8800x7ff759c2444017724144220504177241442519971772414434543717724144347461
2321void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd]00622313182313184194304256001224269440x7ff75a58b7000x7ff759c2448017724144361630177241443715181772414446559817724144467778
2422void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd]00652313182313184194304256001224276480x7ff75cbbb5800x7ff759c244c017724144487837177241444983981772414459071817724144592864
2523void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00682313182313184194304256001624286080x7ff75cbbb4000x7ff759c2450017724144609294177241446180781772414479679817724144798939
2624void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd]00712313182313184194304256001624293120x7ff75cbbb2800x7ff759c2454017724144813199177241448228781772414500159817724145003084
2725void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd]00742313182313184194304256001224300160x7ff75cbbb1000x7ff759c2458017724145017884177241450262381772414511871917724145120271
2826void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd]0077231318231318419430425600824309760x7ff75a58bf800x7ff759c245c017724145135511177241451436791772414523567917724145237248
2927void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd]00802313182313184194304256001224316800x7ff75a58be000x7ff759c2460017724145258088177241452687991772414536191917724145363585
3028void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00832313182313184194304256001624326400x7ff75a58bc800x7ff759c2464017724145378535177241453865591772414556671917724145568260
3129void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd]00862313182313184194304256001224336000x7ff75a58bb000x7ff759c2468017724145582600177241455907191772414577215917724145773655
3230void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd]00892313182313184194304256001224345600x7ff75a58b9800x7ff759c246c017724145787394177241457953601772414588880017724145890382
3331void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd]0092231318231318419430425600824355200x7ff75a58b8000x7ff759c2470017724145904691177241459129601772414600672017724146008299
3432void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd]00952313182313184194304256001224362240x7ff75a58b6800x7ff759c2474017724146028628177241460387201772414613184017724146133456
3533void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00982313182313184194304256001224371840x7ff75cbbb5000x7ff759c2478017724146148165177241461563201772414633632017724146337861
3634void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd]001012313182313184194304256001224381440x7ff75cbbb3800x7ff759c247c017724146352570177241463612801772414654240117724146543965
3735void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd]001042313182313184194304256001224391040x7ff75cbbb2000x7ff759c2480017724146558965177241465673611772414666112117724146662762
3836void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd]00107231318231318419430425600824403200x7ff75cbbb0800x7ff759c2484017724146676442177241466846411772414677856117724146780049
3937void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd]001102313182313184194304256001224412800x7ff75a58bf000x7ff759c2488017724146799269177241468115211772414690448117724146905956
4038void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001132313182313184194304256001224422400x7ff75a58bd800x7ff759c248c017724146921426177241469299211772414710864117724147110151
4139void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd]001162313182313184194304256001224432000x7ff75a58bc000x7ff759c2490017724147124671177241471324811772414731328217724147314716
4240void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd]00119231318231318419430425600824441600x7ff75a58ba800x7ff759c2494017724147330326177241473388821772414743216217724147433803
4341void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd]001222313182313184194304256001224453760x7ff75a58b9000x7ff759c2498017724147447693177241474556821772414755056217724147552090
4442void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd]001252313182313184194304256001224463360x7ff75a58b7800x7ff759c249c017724147577200177241475878421772414768192217724147683427
4543void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001282313182313184194304256001224475520x7ff75a58b6000x7ff759c24a0017724147698947177241477068821772414788688217724147888392
4644void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd]001312313182313184194304256001224485120x7ff75cbbb4800x7ff759c24a4017724147903651177241479118421772414809456317724148096137
4745void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd]00134231318231318419430425600824494720x7ff75cbbb3000x7ff759c24a8017724148110736177241481188831772414821168317724148213294
4846void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd]001372313182313184194304256001224506880x7ff75cbbb1800x7ff759c24ac017724148228163177241482371231772414833024317724148331841
4947void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd]001402313182313184194304256001224516480x7ff75cbbb0000x7ff759c24b0017724148352450177241483632031772414845520317724148456778
5048void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001432313182313184194304256001224528640x7ff75a58be800x7ff759c24b4017724148473277177241484812831772414866160417724148663142
5149void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd]001462313182313184194304256001224540800x7ff75a58bd000x7ff759c24b8017724148676422177241486848041772414886560417724148867157
5250void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd]00149231318231318419430425600824552960x7ff75a58bb800x7ff759c24bc017724148880697177241488884841772414898320417724148984824
5351void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd]001522313182313184194304256001224567680x7ff75a58ba000x7ff759c24c0017724148999484177241490073641772414910256417724149104041
5452void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd]001552313182313184194304256001224577280x7ff75a58b8800x7ff759c24c4017724149124521177241491356841772414922928417724149230868
5553void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001582313182313184194304256001224589440x7ff75a58b7000x7ff759c24c8017724149246438177241492553641772414943360517724149435113
5654void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd]001612313182313184194304256001224601600x7ff75cbbb5800x7ff759c24cc017724149448773177241494572851772414963760517724149639088
5755void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd]00164231318231318419430425600824613760x7ff75cbbb4000x7ff759c24d0017724149653028177241496612851772414975552517724149757125
5856void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd]001672313182313184194304256001224628480x7ff75cbbb2800x7ff759c24d4017724149771765177241497806451772414988000517724149881622
5957void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd]001702313182313184194304256001224638080x7ff75cbbb1000x7ff759c24d8017724149902161177241499124851772415000576517724150007299
6058void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001732313182313184194304256001224650240x7ff75a58bf800x7ff759c24dc017724150021708177241500310451772415021056617724150212424
6159void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd]001762313182313184194304256001224662400x7ff75a58be000x7ff759c24e0017724150227253177241502358461772415041504617724150416618
6260void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd]00179231318231318419430425600824674560x7ff75a58bc800x7ff759c24e4017724150431688177241504400061772415053472617724150536195
6361void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd]001822313182313184194304256001224689280x7ff75a58bb000x7ff759c24e8017724150550815177241505590461772415066320617724150664702
6462void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd]001852313182313184194304256001224701440x7ff75a58b9800x7ff759c24ec017724150684892177241506955261772415078832717724150789909
6563void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001882313182313184194304256001224716160x7ff75a58b8000x7ff759c24f0017724150804729177241508126471772415099264717724150994224
6664void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd]001912313182313184194304256001224728320x7ff75a58b6800x7ff759c24f4017724151010554177241510190471772415119808717724151199679
6765void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd]00194231318231318419430425600824740480x7ff75cbbb5000x7ff759c24f8017724151213678177241512220871772415131520717724151316686
6866void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd]001972313182313184194304256001224757760x7ff75cbbb3800x7ff759c24fc017724151330865177241513387271772415144528717724151446813
6967void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd]002002313182313184194304256001224769920x7ff75cbbb2000x7ff759c2500017724151466462177241514772871772415157184817724151573309
7068void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]002032313182313184194304256001224784640x7ff75cbbb0800x7ff759c2504017724151588539177241515969681772415177568817724151777144
7169void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd]002062313182313184194304256001224799360x7ff75a58bf000x7ff759c2508017724151791784177241518003281772415197920817724151980799
7270void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd]00209231318231318419430425600824814080x7ff75a58bd800x7ff759c250c017724151995139177241520041681772415209888817724152100376
7371void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd]002122313182313184194304256001224831360x7ff75a58bc000x7ff759c2510017724152114866177241521228881772415223760917724152239203
7472void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd]002152313182313184194304256001224843520x7ff75a58ba800x7ff759c2514017724152273942177241522833691772415237808917724152379659
7573void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]002182313182313184194304256001224858240x7ff75a58b9000x7ff759c2518017724152395289177241524032091772415258304917724152584594
7674void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd]002212313182313184194304256001224872960x7ff75a58b7800x7ff759c251c017724152601663177241526092891772415278976917724152791339
7775void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd]002242313182313184194304256001224887680x7ff75a58b6000x7ff759c2520017724152807558177241528156891772415291072917724152912296
7876void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd]002272313182313184194304256001224907520x7ff75cbbb4800x7ff759c2524017724152927205177241529358501772415305665017724153058272
7977void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd]002302313182313184194304256001224919680x7ff75cbbb3000x7ff759c2528017724153077531177241530888101772415318225017724153183789
8078void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]002332313182313184194304256001224934400x7ff75cbbb1800x7ff759c252c017724153198328177241532064101772415338737017724153388954
8179void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd]002362313182313184194304256001224949120x7ff75cbbb0000x7ff759c2530017724153403893177241534120101772415359425017724153595918
8280void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd]002392313182313184194304256001224963840x7ff75a58be800x7ff759c2534017724153611328177241536195301772415371505117724153716615
8381void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd]002422313182313184194304256001224983680x7ff75a58bd000x7ff759c2538017724153731325177241537395311772415386641117724153868022
8482void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd]002452313182313184194304256001224995840x7ff75a58bb800x7ff759c253c017724153888901177241538993711772415399489117724153996488
8583void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0024823131823131841943042560012241013120x7ff75a58ba000x7ff759c2540017724154011958177241540196911772415419889117724154200623
8684void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd]0025123131823131841943042560012241027840x7ff75a58b8800x7ff759c2544017724154215243177241542238511772415440305217724154404658
8785void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd]0025423131823131841943042560012241042560x7ff75a58b7000x7ff759c2548017724154420528177241544283321772415452289217724154524515
8886void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd]0025723131823131841943042560012241062400x7ff75cbbb5800x7ff759c254c017724154539375177241545472121772415467841217724154679991
8987void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd]0026023131823131841943042560012241077120x7ff75cbbb4000x7ff759c2550017724154702421177241547129721772415480657217724154808108
9088void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0026323131823131841943042560016241094400x7ff75cbbb2800x7ff759c2554017724154823728177241548318521772415501089217724155012413
9189void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd]0026623131823131841943042560016241111680x7ff75cbbb1000x7ff759c2558017724155027493177241550360121772415521761317724155219198
9290void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd]002692313182313184194304256008241128960x7ff75a58bf800x7ff759c255c017724155233277177241552414531772415533729317724155338975
9391void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd]0027223131823131841943042560012241151360x7ff75a58be000x7ff759c2560017724155353554177241553617731772415550113317724155502721
9492void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd]0027523131823131841943042560012241166080x7ff75a58bc800x7ff759c2564017724155524220177241555355331772415563025317724155631837
9593void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0027823131823131841943042560016241183360x7ff75a58bb000x7ff759c2568017724155646907177241556548931772415583377417724155835322
9694void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd]0028123131823131841943042560016241200640x7ff75a58b9800x7ff759c256c017724155849432177241558587341772415604001417724156041477
9795void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd]0028423131823131841943042560012241217920x7ff75a58b8000x7ff759c2570017724156055217177241560630541772415615937417724156160924
9896void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd]0028723131823131841943042560012241240320x7ff75a58b6800x7ff759c2574017724156177474177241561862541772415633153417724156333130
9997void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd]0029023131823131841943042560012241255040x7ff75cbbb5000x7ff759c2578017724156354399177241563646541772415646097417724156462547
10098void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0029323131823131841943042560012241274880x7ff75cbbb3800x7ff759c257c017724156477036177241564854551772415666593517724156667472
10199void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd]0029623131823131841943042560012241292160x7ff75cbbb2000x7ff759c2580017724156681931177241566902551772415686929517724156870866
102100void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd]0029923131823131841943042560012241309440x7ff75cbbb0800x7ff759c2584017724156885106177241568945751772415699457517724156996223
103101void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd]0030223131823131841943042560012241334400x7ff75a58bf000x7ff759c2588017724157011753177241570198551772415717521517724157176819
104102void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd]0030523131823131841943042560012241349120x7ff75a58bd800x7ff759c258c017724157197318177241572078561772415730257617724157304066
105103void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0030823131823131841943042560012241368960x7ff75a58bc000x7ff759c2590017724157318925177241573267361772415750561617724157507151
106104void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd]0031123131823131841943042560012241388800x7ff75a58ba800x7ff759c2594017724157522800177241575312161772415771105617724157712775
107105void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd]0031423131823131841943042560012241408640x7ff75a58b9000x7ff759c2598017724157727155177241577356961772415784257617724157844102
108106void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd]0031723131823131841943042560012241436160x7ff75a58b7800x7ff759c259c017724157858392177241578668961772415803793717724158039507
109107void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd]0032023131823131841943042560012241453440x7ff75a58b6000x7ff759c25a0017724158060627177241580708971772415816673717724158168444
110108void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0032323131823131841943042560012241475840x7ff75cbbb4800x7ff759c25a4017724158183794177241581920171772415837137717724158372969
111109void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd]0032623131823131841943042560012241495680x7ff75cbbb3000x7ff759c25a8017724158386869177241583948971772415857633717724158577934
112110void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd]0032923131823131841943042560012241515520x7ff75cbbb1800x7ff759c25ac017724158592173177241586001771772415871041817724158711940
113111void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd]0033223131823131841943042560012241543040x7ff75cbbb0000x7ff759c25b0017724158726560177241587347381772415891601817724158917595
114112void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd]0033523131823131841943042560012241562880x7ff75a58be800x7ff759c25b4017724158939095177241589484981772415905025817724159051882
115113void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0033823131823131841943042560012241587840x7ff75a58bd000x7ff759c25b8017724159067212177241590752181772415925713817724159258807
116114void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd]0034123131823131841943042560012241610240x7ff75a58bb800x7ff759c25bc017724159273406177241592816181772415946625917724159467791
117115void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd]0034423131823131841943042560012241632640x7ff75a58ba000x7ff759c25c0017724159481821177241594897791772415961233917724159613918
118116void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd]0034723131823131841943042560012241665280x7ff75a58b8800x7ff759c25c4017724159628207177241596382591772415984529917724159867111
119117void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd]0035023131823131841943042560012241685120x7ff75a58b7000x7ff759c25c8017724159882351177241598928191772416000577917724160007408
120118void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0035323131823131841943042560012241712640x7ff75cbbb5800x7ff759c25cc017724160023328177241600318591772416021650017724160217963
121119void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd]0035623131823131841943042560012241737600x7ff75cbbb4000x7ff759c25d0017724160232112177241602417801772416042866017724160430257
122120void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd]0035923131823131841943042560012241762560x7ff75cbbb2800x7ff759c25d4017724160445647177241604541001772416058898017724160590533
123121void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd]0036223131823131841943042560012241797760x7ff75cbbb1000x7ff759c25d8017724160604823177241606126601772416084466117724160864657
124122void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd]0036523131823131841943042560012241822720x7ff75a58bf800x7ff759c25dc017724160880146177241608907411772416101778117724161019303
125123void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0036823131823131841943042560012241855360x7ff75a58be000x7ff759c25e0017724161034972177241610427411772416123490117724161236487
126124void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd]0037123131823131841943042560012241885440x7ff75a58bc800x7ff759c25e4017724161251887177241612605011772416145122117724161452772
127125void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd]0037423131823131841943042560012241915520x7ff75a58bb000x7ff759c25e8017724161468651177241614763421772416163650217724161638147
128126void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd]0037723131823131841943042560012241958400x7ff75a58b9800x7ff759c25ec017724161652707177241616606621772416194450217724161964259
129127void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd]0038023131823131841943042560012241985920x7ff75a58b8000x7ff759c25f0017724161980929177241619915421772416214210217724162143675
130128void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0038323131823131841943042560012242023680x7ff75a58b6800x7ff759c25f4017724162160134177241621680221772416237538317724162398208
131129void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd]0038623131823131841943042560012242058880x7ff75cbbb5000x7ff759c25f8017724162407758177241624177831772416262690317724162649182
132130void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd]0038923131823131841943042560012242094080x7ff75cbbb3800x7ff759c25fc017724162658282177241626686631772416285474317724162856357
133131void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd]0039223131823131841943042560012242144640x7ff75cbbb2000x7ff759c2600017724162872016177241628805031772416321538417724163234547
134132void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd]0039523131823131841943042560012242177280x7ff75cbbb0800x7ff759c2604017724163250327177241632611441772416342898417724163430532
135133void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0039823131823131841943042560012242220160x7ff75a58bf000x7ff759c2608017724163445222177241634533041772416368178517724163701085
136134void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd]0040123131823131841943042560012242260480x7ff75a58bd800x7ff759c260c017724163711405177241637214651772416395026517724163969189
137135void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd]0040423131823131841943042560012242300800x7ff75a58bc000x7ff759c2610017724163977898177241639877051772416419922517724164218192
138136void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd]0040723131823131841943042560012242359040x7ff75a58ba800x7ff759c2614017724164229452177241642387451772416462482617724164643702
139137void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd]0041023131823131841943042560012242394240x7ff75a58b9000x7ff759c2618017724164660921177241646717061772416485906617724164860596
140138void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0041323131823131841943042560012242442240x7ff75a58b7800x7ff759c261c017724164875886177241648837061772416513410717724165153699
141139void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd]0041623131823131841943042560012242487680x7ff75a58b6000x7ff759c2620017724165162409177241651728271772416541986717724165438482
142140void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd]0041923131823131841943042560012242533120x7ff75cbbb4800x7ff759c2624017724165448581177241654587471772416569570717724165711535
143141void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd]004222313182313184194304256008242555520x7ff75cbbb3000x7ff759c2628017724165722144177241657320271772416618514817724166215182
144142void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd]0042523131823131841943042560012242598400x7ff75cbbb1800x7ff759c262c017724166233232177241662440281772416646994917724166491765
145143void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0042823131823131841943042560012242656640x7ff75cbbb0000x7ff759c2630017724166500845177241665101091772416680786917724166829447
146144void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd]0043123131823131841943042560012242712320x7ff75a58be800x7ff759c2634017724166839396177241668488291772416714786917724167169568
147145void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd]004342313182313184194304256008242732160x7ff75a58bd000x7ff759c2638017724167178438177241671885101772416748547017724167506970
148146void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd]004372313182313184194304256008242757120x7ff75a58bb800x7ff759c263c017724167514990177241675253101772416808291117724168104505
149147void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd]0044023131823131841943042560012242807680x7ff75a58ba000x7ff759c2640017724168120554177241681310711772416839491117724168417727
150148void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0044323131823131841943042560012242876160x7ff75a58b8800x7ff759c2644017724168428217177241684387511772416878947217724168811107
151149void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd]0044623131823131841943042560012242942080x7ff75a58b7000x7ff759c2648017724168819857177241688310721772416918067217724169202227
152150void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd]004492313182313184194304256008242969600x7ff75cbbb5800x7ff759c264c017724169212777177241692225921772416956947317724169588408
153151void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd]004522313182313184194304256008242999680x7ff75cbbb4000x7ff759c2650017724169599457177241696091531772417027075417724170294260
154152void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd]004552313182313184194304256008243027200x7ff75cbbb2800x7ff759c2654017724170313590177241703227541772417077059517724170792478
155153void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0045823131823131841943042560012243054720x7ff75cbbb1000x7ff759c2658017724170802457177241708126751772417127827517724171301985
156154void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd]0046123131823131841943042560012243082240x7ff75a58bf800x7ff759c265c017724171314225177241713313951772417179299617724171816212
157155void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd]004642313182313184194304256008243109760x7ff75a58be000x7ff759c2660017724171825032177241718352361772417228707717724172310790
158156void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd]004672313182313184194304256008243132160x7ff75a58bc800x7ff759c2664017724172326289177241723350771772417320467817724173227877
159157void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd]004702313182313184194304256008243159680x7ff75a58bb000x7ff759c2668017724173245296177241732558781772417410963917724174134014
160158void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0047323131823131841943042560012243187200x7ff75a58b9800x7ff759c266c017724174143014177241741536391772417503812117724175062671
161159void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd]0047623131823131841943042560012243214720x7ff75a58b8000x7ff759c2670017724175072110177241750816411772417596180217724175986337
162160void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd]004792313182313184194304256008243242240x7ff75a58b6800x7ff759c2674017724175996617177241760158821772417687604317724176900014
163161void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd]004822313182313184194304256008243264640x7ff75cbbb5000x7ff759c2678017724176908194177241769184431772417861796617724178692319
164162void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd]004852313182313184194304256008243292160x7ff75cbbb3800x7ff759c267c017724178710539177241787216461772418038612817724180456225
165163void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0048823131823131841943042560012243319680x7ff75cbbb2000x7ff759c2680017724180465605177241804758881772418220245117724182272320
166164void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd]0049123131823131841943042560012243347200x7ff75cbbb0800x7ff759c2684017724182285899177241823139711772418402933317724184098844
167165void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd]004942313182313184194304256008243374720x7ff75a58bf000x7ff759c2688017724184110903177241841269331772418580101617724185868679
168166void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd]0049723131823131841943042560082400x7ff75a58bd800x7ff759c268c017724185877859177241858882161772418924614017724189320083