Files
rocm-systems/tests/workloads/invdev/mi200/SQ_INST_LEVEL_SMEM.csv
T
colramos-amd 62d130b458 Initial commit
2022-11-04 14:49:36 -05:00

41 KiB

1IndexKernelNamegpu-idqueue-idqueue-indexpidtidgrdwgrldsscrvgprsgprfbarsigobjSQ_INSTS_SMEMSQ_INST_LEVEL_SMEMSQ_ACCUM_PREV_HIRESDispatchNsBeginNsEndNsCompleteNs
20__amd_rocclr_fillBufferAligned.kd000236281236281335544322560043241600x00x7f45e22042803670016290570632508170417832236843728178031986651201783238162987017832381744199
31void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd]00223628123628132768256001224138880x00x7f45e2223f80512966641085128817832386900391178323816298701783238702651917832387030968
42void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd]0052362812362814194304256001224143360x7f45e517a3800x7f45e2223fc0655366399267170499217832387064037178323870265191783238740236017832387404639
53void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0082362812362814194304256001624150400x7f45e517a2000x7f45e2224000655366631207428473617832387441058178323874023601783238780140117832387803559
64void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd]00112362812362814194304256001624154880x7f45e517a0800x7f45e2224040655366553827346724817832387836288178323878014011783238818924117832388191179
75void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd]00142362812362814194304256001224159360x7f45e2b1bf000x7f45e2224080655366707067514457617832388224148178323881892411783238848668217832388488802
86void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd]00172362812362814194304256001224163840x7f45e2b1bd800x7f45e22240c0655366334987098989617832388520711178323884866821783238878444317832388786445
97void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd]00202362812362814194304256001224170880x7f45e2b1bc000x7f45e22241001310726827907634974417832388829873178323887844431783238908588317832389087897
108void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00232362812362814194304256001624177920x7f45e2b1ba800x7f45e22241401310727022587873404817832389118956178323890858831783238947004417832389472077
119void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd]00262362812362814194304256001624184960x7f45e2b1b9000x7f45e2224180655366629227423758417832389504707178323894700441783238985452517832389856588
1210void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd]00292362812362814194304256001624192000x7f45e2b1b7800x7f45e22241c01310727029447866251217832389887017178323898545251783239016524517832390167590
1311void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd]00322362812362814194304256001624199040x7f45e2b1b6000x7f45e22242001310726985927824972817832390198889178323901652451783239047164617832390473623
1412void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd]00352362812362814194304256001224206080x7f45e517a4800x7f45e22242401310726999227836665617832390513972178323904716461783239077116617832390773245
1513void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00382362812362814194304256001624213120x7f45e517a3000x7f45e22242801310726972767807845617832390805924178323907711661783239115356717832391155576
1614void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd]00412362812362814194304256001624220160x7f45e517a1800x7f45e22242c0655366717007520001617832391187125178323911535671783239154092817832391542376
1715void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd]00442362812362814194304256001624227200x7f45e517a0000x7f45e22243001310727179928031835217832391573205178323915409281783239181292817832391814339
1816void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd]00472362812362814194304256001224234240x7f45e2b1be800x7f45e22243401310726978187815256017832391845858178323918129281783239208092917832392082433
1917void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd]00502362812362814194304256001224241280x7f45e2b1bd000x7f45e22243801310726967127805284017832392120672178323920809291783239235116917832392352656
2018void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00532362812362814194304256001624248320x7f45e2b1bb800x7f45e22243c01310727039607881104017832392384785178323923511691783239270717017832392708527
2119void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd]00562362812362814194304256001624255360x7f45e2b1ba000x7f45e2224400655366273507020716017832392739226178323927071701783239306861017832393070078
2220void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd]00592362812362814194304256001224262400x7f45e2b1b8800x7f45e22244401310727052087895316817832393101637178323930686101783239333821117832393339751
2321void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd]00622362812362814194304256001224269440x7f45e2b1b7000x7f45e22244801310727006427844328817832393370981178323933382111783239360637117832393607955
2422void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd]00652362812362814194304256001224276480x7f45e517a5800x7f45e22244c01310726805747615308817832393646754178323936063711783239387469217832393876138
2523void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00682362812362814194304256001624286080x7f45e517a4000x7f45e22245001310726980667812868017832393908427178323938746921783239423117317832394232719
2624void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd]00712362812362814194304256001624293120x7f45e517a2800x7f45e2224540655366765607575412017832394265568178323942311731783239459085317832394592260
2725void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd]00742362812362814194304256001224300160x7f45e517a1000x7f45e22245801310726650527449480017832394623679178323945908531783239486813417832394869783
2826void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd]0077236281236281419430425600824309760x7f45e2b1bf800x7f45e22245c01310726623127408852017832394901143178323948681341783239513693417832395138407
2927void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd]00802362812362814194304256001224316800x7f45e2b1be000x7f45e22246001310726935827766379217832395177386178323951369341783239540941517832395411120
3028void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00832362812362814194304256001624326400x7f45e2b1bc800x7f45e22246401310726556747352310417832395443299178323954094151783239576941517832395770881
3129void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd]00862362812362814194304256001224336000x7f45e2b1bb000x7f45e2224680655366519427303714417832395802430178323957694151783239612957617832396130962
3230void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd]00892362812362814194304256001224345600x7f45e2b1b9800x7f45e22246c01310726973907819062417832396162821178323961295761783239639901717832396400575
3331void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd]0092236281236281419430425600824355200x7f45e2b1b8000x7f45e22247001310727050407903163217832396431605178323963990171783239666909717832396670499
3432void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd]00952362812362814194304256001224362240x7f45e2b1b6800x7f45e22247401310727025467868437617832396708378178323966690971783239694093817832396942292
3533void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00982362812362814194304256001224371840x7f45e517a5000x7f45e22247801310727005567835994417832396974431178323969409381783239729885817832397300373
3634void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd]001012362812362814194304256001224381440x7f45e517a3800x7f45e22247c0655366707027507470417832397332152178323972988581783239765629917832397657764
3735void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd]001042362812362814194304256001224391040x7f45e517a2000x7f45e22248001310727023767860765617832397689003178323976562991783239792685917832397928307
3836void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd]00107236281236281419430425600824403200x7f45e517a0800x7f45e22248401310726992187825271217832397960087178323979268591783239820718017832398208690
3937void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd]001102362812362814194304256001224412800x7f45e2b1bf000x7f45e22248801310727021027856680017832398247609178323982071801783239847998017832398481434
4038void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001132362812362814194304256001224422400x7f45e2b1bd800x7f45e22248c01310727003227846293617832398512783178323984799801783239884078117832398842455
4139void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd]001162362812362814194304256001224432000x7f45e2b1bc000x7f45e2224900655366784327601651217832398873754178323988407811783239919854217832399199956
4240void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd]00119236281236281419430425600824441600x7f45e2b1ba800x7f45e22249401310727040487885044017832399231725178323991985421783239947406217832399475529
4341void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd]001222362812362814194304256001224453760x7f45e2b1b9000x7f45e22249801310727042947876248817832399506378178323994740621783239974414317832399745442
4442void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd]001252362812362814194304256001224463360x7f45e2b1b7800x7f45e22249c01310726971407810134417832399784061178323997441431783240001438317832400015876
4543void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001282362812362814194304256001224475520x7f45e2b1b6000x7f45e2224a001310726917647741147217832400047205178324000143831783240036878417832400370137
4644void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd]001312362812362814194304256001224485120x7f45e517a4800x7f45e2224a40655366587387382505617832400402316178324003687841783240072942517832400730838
4745void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd]00134236281236281419430425600824494720x7f45e517a3000x7f45e2224a801310726567827360929617832400762547178324007294251783240100094517832401002361
4846void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd]001372362812362814194304256001224506880x7f45e517a1800x7f45e2224ac01310726611247397322417832401033580178324010009451783240126814617832401269644
4947void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd]001402362812362814194304256001224516480x7f45e517a0000x7f45e2224b001310726847727659846417832401308053178324012681461783240154830617832401549867
5048void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001432362812362814194304256001224528640x7f45e2b1be800x7f45e2224b401310726973147812870417832401581147178324015483061783240190782717832401909338
5149void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd]001462362812362814194304256001224540800x7f45e2b1bd000x7f45e2224b80655366694067500503217832401940558178324019078271783240226318717832402264740
5250void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd]00149236281236281419430425600824552960x7f45e2b1bb800x7f45e2224bc01310727007667851676817832402296189178324022631871783240253502817832402536433
5351void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd]001522362812362814194304256001224567680x7f45e2b1ba000x7f45e2224c001310726979727817756017832402567832178324025350281783240280542817832402806846
5452void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd]001552362812362814194304256001224577280x7f45e2b1b8800x7f45e2224c401310727000487848715217832402845555178324028054281783240307454917832403076009
5553void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001582362812362814194304256001224589440x7f45e2b1b7000x7f45e2224c801310726882047707912817832403107349178324030745491783240342991017832403431351
5654void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd]001612362812362814194304256001224601600x7f45e517a5800x7f45e2224cc0655366715327517976017832403463430178324034299101783240378847017832403789782
5755void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd]00164236281236281419430425600824613760x7f45e517a4000x7f45e2224d001310726984707821852817832403821291178324037884701783240406239117832404063835
5856void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd]001672362812362814194304256001224628480x7f45e517a2800x7f45e2224d401310727196568060229617832404096124178324040623911783240434287117832404344338
5957void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd]001702362812362814194304256001224638080x7f45e517a1000x7f45e2224d801310726996667833558417832404383487178324043428711783240461343217832404614811
6058void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001732362812362814194304256001224650240x7f45e2b1bf800x7f45e2224dc01310726702107506088817832404646430178324046134321783240496815317832404969772
6159void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd]001762362812362814194304256001224662400x7f45e2b1be000x7f45e2224e00655366332087102777617832405001072178324049681531783240532239317832405323704
6260void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd]00179236281236281419430425600824674560x7f45e2b1bc800x7f45e2224e401310727070087915425617832405354693178324053223931783240559535417832405596747
6361void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd]001822362812362814194304256001224689280x7f45e2b1bb000x7f45e2224e801310726972187813760017832405628186178324055953541783240587375417832405875160
6462void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd]001852362812362814194304256001224701440x7f45e2b1b9800x7f45e2224ec01310726583087372467217832405914139178324058737541783240614655517832406148433
6563void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001882362812362814194304256001224716160x7f45e2b1b8000x7f45e2224f001310727013867852734417832406179992178324061465551783240650751517832406508934
6664void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd]001912362812362814194304256001224728320x7f45e2b1b6800x7f45e2224f40655366996227840152017832406541013178324065075151783240686735617832406868765
6765void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd]00194236281236281419430425600824740480x7f45e517a5000x7f45e2224f801310726719587521012817832406900764178324068673561783240714351717832407144948
6866void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd]001972362812362814194304256001224757760x7f45e517a3800x7f45e2224fc01310726727067538111217832407176878178324071435171783240743279717832407434251
6967void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd]002002362812362814194304256001224769920x7f45e517a2000x7f45e22250001310726966067821712817832407473750178324074327971783240770127817832407702625
7068void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]002032362812362814194304256001224784640x7f45e517a0800x7f45e22250401310727082047942947217832407734074178324077012781783240805775817832408059176
7169void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd]002062362812362814194304256001224799360x7f45e2b1bf000x7f45e2225080655366618947415204017832408090825178324080577581783240841279917832408414247
7270void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd]00209236281236281419430425600824814080x7f45e2b1bd800x7f45e22250c01310727023247867239217832408445166178324084127991783240868191917832408683310
7371void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd]002122362812362814194304256001224831360x7f45e2b1bc000x7f45e22251001310727031987882524817832408714829178324086819191783240897120017832408972643
7472void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd]002152362812362814194304256001224843520x7f45e2b1ba800x7f45e22251401310726998147825492817832409022692178324089712001783240925104017832409253036
7573void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]002182362812362814194304256001224858240x7f45e2b1b9000x7f45e22251801310726982607821622417832409284085178324092510401783240961024117832409611667
7674void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd]002212362812362814194304256001224872960x7f45e2b1b7800x7f45e22251c0655366637587433668817832409642866178324096102411783240997136217832409972698
7775void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd]002242362812362814194304256001224887680x7f45e2b1b6000x7f45e22252001310726942007784864017832410003777178324099713621783241025280217832410254361
7876void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd]002272362812362814194304256001224907520x7f45e517a4800x7f45e22252401310727048347891101617832410286130178324102528021783241055168317832410553104
7977void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd]002302362812362814194304256001224919680x7f45e517a3000x7f45e22252801310726969287803510417832410592273178324105516831783241082176317832410823297
8078void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]002332362812362814194304256001224934400x7f45e517a1800x7f45e22252c01310726960327805705617832410854646178324108217631783241118384417832411185188
8179void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd]002362362812362814194304256001224949120x7f45e517a0000x7f45e2225300655366607307400500017832411216967178324111838441783241154000517832411541479
8280void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd]002392362812362814194304256001224963840x7f45e2b1be800x7f45e22253401310727011467840424017832411573128178324115400051783241181024517832411811662
8381void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd]002422362812362814194304256001224983680x7f45e2b1bd000x7f45e22253801310727031887876502417832411843102178324118102451783241211104617832412112465
8482void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd]002452362812362814194304256001224995840x7f45e2b1bb800x7f45e22253c01310727097547943502417832412151434178324121110461783241238064617832412382098
8583void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0024823628123628141943042560012241013120x7f45e2b1ba000x7f45e22254001310726582207379675217832412413128178324123806461783241273792717832412739229
8684void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd]0025123628123628141943042560012241027840x7f45e2b1b8800x7f45e2225440655366682267479921617832412770779178324127379271783241309408817832413095561
8785void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd]0025423628123628141943042560012241042560x7f45e2b1b7000x7f45e22254801310726991927828746417832413126350178324130940881783241336592817832413367344
8886void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd]0025723628123628141943042560012241062400x7f45e517a5800x7f45e22254c01310726645107439109617832413398753178324133659281783241368176917832413683106
8987void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd]0026023628123628141943042560012241077120x7f45e517a4000x7f45e22255001310726618607405930417832413722855178324136817691783241396032917832413961969
9088void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0026323628123628141943042560016241094400x7f45e517a2800x7f45e22255401310727372268257310417832413994028178324139603291783241433089017832414332460
9189void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd]0026623628123628141943042560016241111680x7f45e517a1000x7f45e2225580655366490467266900017832414364689178324143308901783241468849017832414689831
9290void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd]002692362812362814194304256008241128960x7f45e2b1bf800x7f45e22255c01310727007047842832017832414720670178324146884901783241495889117832414960154
9391void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd]0027223628123628141943042560012241151360x7f45e2b1be000x7f45e22256001310726986867825116817832414991923178324149588911783241526993217832415271487
9492void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd]0027523628123628141943042560012241166080x7f45e2b1bc800x7f45e22256401310727109167966889617832415310446178324152699321783241554545217832415546950
9593void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0027823628123628141943042560016241183360x7f45e2b1bb000x7f45e22256801310726973107814840817832415578609178324155454521783241590449317832415905951
9694void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd]0028123628123628141943042560016241200640x7f45e2b1b9800x7f45e22256c0655366619387401234417832415937590178324159044931783241625921317832416260682
9795void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd]0028423628123628141943042560012241217920x7f45e2b1b8000x7f45e22257001310726921267755264817832416291961178324162592131783241653073417832416532145
9896void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd]0028723628123628141943042560012241240320x7f45e2b1b6800x7f45e22257401310726989887825972817832416563474178324165307341783241686081517832416862117
9997void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd]0029023628123628141943042560012241255040x7f45e517a5000x7f45e22257801310727028767870571217832416901386178324168608151783241713857517832417139930
10098void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0029323628123628141943042560012241274880x7f45e517a3800x7f45e22257c01310726935607771075217832417171159178324171385751783241749377617832417495141
10199void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd]0029623628123628141943042560012241292160x7f45e517a2000x7f45e2225800655366627467409008017832417526740178324174937761783241785105617832417852392
102100void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd]0029923628123628141943042560012241309440x7f45e517a0800x7f45e22258401310726615187405676017832417884092178324178510561783241812865717832418130245
103101void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd]0030223628123628141943042560012241334400x7f45e2b1bf000x7f45e22258801310726537947326924017832418161545178324181286571783241846561717832418467077
104102void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd]0030523628123628141943042560012241349120x7f45e2b1bd800x7f45e22258c0131072102368411475396817832418506686178324184656171783241874065817832418742170
105103void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0030823628123628141943042560012241368960x7f45e2b1bc000x7f45e22259001310726712987508503217832418772820178324187406581783241909713917832419098551
106104void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd]0031123628123628141943042560012241388800x7f45e2b1ba800x7f45e2225940655366666067468920017832419130061178324190971391783241945217917832419453583
107105void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd]0031423628123628141943042560012241408640x7f45e2b1b9000x7f45e22259801310727103227953425617832419484652178324194521791783241973586017832419737316
108106void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd]0031723628123628141943042560012241436160x7f45e2b1b7800x7f45e22259c01310727363128250392017832419768565178324197358601783242007922017832420080667
109107void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd]0032023628123628141943042560012241453440x7f45e2b1b6000x7f45e2225a00131072104670011719144817832420119236178324200792201783242035506117832420356480
110108void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0032323628123628141943042560012241475840x7f45e517a4800x7f45e2225a401310727003007843988817832420388939178324203550611783242071138217832420712981
111109void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd]0032623628123628141943042560012241495680x7f45e517a3000x7f45e2225a80655366561807349269617832420744921178324207113821783242106738217832421068772
112110void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd]0032923628123628141943042560012241515520x7f45e517a1800x7f45e2225ac01310726614907416808817832421100522178324210673821783242135250317832421354025
113111void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd]0033223628123628141943042560012241543040x7f45e517a0000x7f45e2225b001310726615347411296817832421385605178324213525031783242171650417832421717916
114112void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd]0033523628123628141943042560012241562880x7f45e2b1be800x7f45e2225b40131072101189211348872817832421756865178324217165041783242199506417832421996489
115113void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0033823628123628141943042560012241587840x7f45e2b1bd000x7f45e2225b801310726966987810140017832422028569178324219950641783242236802517832422369470
116114void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd]0034123628123628141943042560012241610240x7f45e2b1bb800x7f45e2225bc0655366564687359557617832422401369178324223680251783242272850517832422729841
117115void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd]0034423628123628141943042560012241632640x7f45e2b1ba000x7f45e2225c001310726697347499691217832422761010178324227285051783242302610617832423027444
118116void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd]0034723628123628141943042560012241665280x7f45e2b1b8800x7f45e2225c401310726901387734960817832423059093178324230261061783242340898717832423453883
119117void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd]0035023628123628141943042560012241685120x7f45e2b1b7000x7f45e2225c80131072104691211712532017832423472813178324234089871783242373122717832423732736
120118void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0035323628123628141943042560012241712640x7f45e517a5800x7f45e2225cc01310726908007738459217832423764206178324237312271783242409074817832424092097
121119void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd]0035623628123628141943042560012241737600x7f45e517a4000x7f45e2225d00655366687147486033617832424123747178324240907481783242445202917832424453478
122120void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd]0035923628123628141943042560012241762560x7f45e517a2800x7f45e2225d401310727060347914424017832424484928178324244520291783242477234917832424773870
123121void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd]0036223628123628141943042560012241797760x7f45e517a1000x7f45e2225d801310727147588001909617832424805450178324247723491783242518243017832425201200
124122void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd]0036523628123628141943042560012241822720x7f45e2b1bf800x7f45e2225dc013107297025010860876817832425223149178324251824301783242549619117832425497572
125123void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0036823628123628141943042560012241855360x7f45e2b1be000x7f45e2225e001310726925887749515217832425529002178324254961911783242586195117832425879323
126124void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd]0037123628123628141943042560012241885440x7f45e2b1bc800x7f45e2225e40655366619727414417617832425894783178324258619511783242623411217832426255404
127125void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd]0037423628123628141943042560012241915520x7f45e2b1bb000x7f45e2225e801310726515187291456817832426267983178324262341121783242658563317832426587085
128126void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd]0037723628123628141943042560012241958400x7f45e2b1b9800x7f45e2225ec01310726717367520774417832426618065178324265856331783242704499317832427089873
129127void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd]0038023628123628141943042560012241985920x7f45e2b1b8000x7f45e2225f00131072106211611903542417832427108662178324270449931783242740611417832427407555
130128void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0038323628123628141943042560012242023680x7f45e2b1b6800x7f45e2225f40131072101441011367725617832427438934178324274061141783242779267517832427838994
131129void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd]0038623628123628141943042560012242058880x7f45e517a5000x7f45e2225f80655366570967369556817832427849524178324277926751783242821363617832428255404
132130void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd]0038923628123628141943042560012242094080x7f45e517a3800x7f45e2225fc01310727178448038538417832428266174178324282136361783242860755617832428608975
133131void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd]0039223628123628141943042560012242144640x7f45e517a2000x7f45e22260001310726735587563611217832428640334178324286075561783242911987717832429137962
134132void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd]0039523628123628141943042560012242177280x7f45e517a0800x7f45e2226040131072104112011662876017832429161011178324291198771783242947219817832429473604
135133void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0039823628123628141943042560012242220160x7f45e2b1bf000x7f45e2226080131072106773211965915217832429504273178324294721981783242988067917832429898823
136134void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd]0040123628123628141943042560012242260480x7f45e2b1bd800x7f45e22260c0655366587147372966417832429916513178324298806791783243029235917832430311503
137135void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd]0040423628123628141943042560012242300800x7f45e2b1bc000x7f45e22261001310726875267701951217832430325033178324302923591783243069268017832430710793
138136void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd]0040723628123628141943042560012242359040x7f45e2b1ba800x7f45e22261401310726667647477127217832430725573178324306926801783243126020117832431301548
139137void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd]0041023628123628141943042560012242394240x7f45e2b1b9000x7f45e2226180131072103308211580335217832431320018178324312602011783243164868217832431650150
140138void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0041323628123628141943042560012242442240x7f45e2b1b7800x7f45e22261c0131072101837811408555217832431681109178324316486821783243207940317832432098638
141139void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd]0041623628123628141943042560012242487680x7f45e2b1b6000x7f45e2226200655367073247920891217832432112608178324320794031783243250948317832432526118
142140void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd]0041923628123628141943042560012242533120x7f45e517a4800x7f45e22262401310726862427686085617832432542687178324325094831783243292596417832432942478
143141void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd]004222362812362814194304256008242555520x7f45e517a3000x7f45e2226280131072103827611626268817832432959327178324329259641783243355812517832433575932
144142void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd]0042523628123628141943042560012242598400x7f45e517a1800x7f45e22262c0131072103685811618186417832433599221178324335581251783243396740617832433983822
145143void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0042823628123628141943042560012242656640x7f45e517a0000x7f45e222630013107298729211072504817832433999841178324339674061783243445492717832434474699
146144void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd]0043123628123628141943042560012242712320x7f45e2b1be800x7f45e2226340655366596967389907217832434488319178324344549271783243493908817832434981337
147145void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd]004342362812362814194304256008242732160x7f45e2b1bd000x7f45e2226380131072101880011414784817832434992227178324349390881783243544452917832435485844
148146void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd]004372362812362814194304256008242757120x7f45e2b1bb800x7f45e22263c0131072103196011552327217832435497234178324354445291783243620501017832436246585
149147void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd]0044023628123628141943042560012242807680x7f45e2b1ba000x7f45e2226400131072101627011381180817832436266265178324362050101783243667861117832436698824
150148void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0044323628123628141943042560012242876160x7f45e2b1b8800x7f45e2226440131072103228011582813617832436711484178324366786111783243721173217832437228671
151149void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd]0044623628123628141943042560012242942080x7f45e2b1b7000x7f45e2226480655366596247405154417832437245851178324372117321783243774005317832437759248
152150void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd]004492362812362814194304256008242969600x7f45e517a5800x7f45e22264c0131072100566211255136817832437773327178324377400531783243827333417832438291035
153151void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd]004522362812362814194304256008242999680x7f45e517a4000x7f45e2226500131072103158411564574417832438307094178324382733341783243911621617832439157763
154152void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd]004552362812362814194304256008243027200x7f45e517a2800x7f45e2226540131072106136811894134417832439177303178324391162161783243976789717832439809577
155153void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0045823628123628141943042560012243054720x7f45e517a1000x7f45e2226580131072103677611615471217832439821457178324397678971783244043669817832440477671
156154void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd]0046123628123628141943042560012243082240x7f45e2b1bf800x7f45e22265c0655366601967390914417832440489810178324404366981783244110037917832441118625
157155void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd]004642362812362814194304256008243109760x7f45e2b1be000x7f45e2226600131072103947811641095217832441132995178324411003791783244173094117832441747759
158156void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd]004672362812362814194304256008243132160x7f45e2b1bc800x7f45e2226640131072104114611650408017832441763269178324417309411783244278422317832442804243
159157void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd]004702362812362814194304256008243159680x7f45e2b1bb000x7f45e2226680131072103853411634366417832442825283178324427842231783244382246417832443864977
160158void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0047323628123628141943042560012243187200x7f45e2b1b9800x7f45e22266c0131072103402611570608017832443875707178324438223081783244491430917832444984019
161159void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd]0047623628123628141943042560012243214720x7f45e2b1b8000x7f45e2226700655366543707341683217832444995709178324449143091783244604087017832446107291
162160void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd]004792362812362814194304256008243242240x7f45e2b1b6800x7f45e2226740131072106257411892286417832446119451178324460408701783244715063217832447217504
163161void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd]004822362812362814194304256008243264640x7f45e517a5000x7f45e2226780131072103583011623413617832447229853178324471506321783244909447517832449159095
164162void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd]004852362812362814194304256008243292160x7f45e517a3800x7f45e22267c0131072103750411610966417832449179225178324490944751783245100375817832451072248
165163void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0048823628123628141943042560012243319680x7f45e517a2000x7f45e2226800131072102837611527324017832451084307178324510037581783245298104117832453045679
166164void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd]0049123628123628141943042560012243347200x7f45e517a0800x7f45e2226840655366627267425286417832453056848178324529810411783245494248417832455013900
167165void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd]004942362812362814194304256008243374720x7f45e2b1bf000x7f45e2226880131072104077011675634417832455025780178324549424841783245688024717832456947382
168166void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd]0049723628123628141943042560082400x7f45e2b1bd800x7f45e22268c0131072103569411612701617832456958722178324568802471783246048649217832460564112