Files
rocm-systems/tests/workloads/Axes2/mi100/SQ_LEVEL_WAVES.csv
T
colramos-amd 62d130b458 Initial commit
2022-11-04 14:49:36 -05:00

50 KiB

1IndexKernelNamegpu-idqueue-idqueue-indexpidtidgrdwgrldsscrvgprsgprfbarsigobjGRBM_COUNTGRBM_GUI_ACTIVECPC_ME1_BUSY_FOR_PACKET_DECODESQ_CYCLESSQ_WAVESSQ_WAVE_CYCLESSQ_BUSY_CYCLESSQ_LEVEL_WAVESSQ_ACCUM_PREV_HIRESDispatchNsBeginNsEndNsCompleteNs
20__amd_rocclr_fillBuffer.kd000906511906516335544322560083264640x00x7f4586e0418050424650424617548403397652428836860567938277410148927581212076039738087526120760399829983651207603998332220412076039983431627
31void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd]00290651190651632768256002424124800x00x7f4586e351002870828708212092296725121162927787550466603612076039998516141120760399988456111207603999885201112076039998860611
42void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd]0049065119065164194304256002424129280x7f46b6ef19000x7f4586e35140226140226140224301809128655361214277591627144048752220412076039998932284120760399991740901207603999931136912076039999315967
53void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0069065119065164194304256003624136320x7f46b6ef18000x7f4586e351803971413971413306731771366553626890242930024580107742442012076039999393782120760399995828881207603999983504712076039999903209
64void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd]0089065119065164194304256002824140800x7f46b6ef17000x7f4586e351c04038524038523418832308246553635693914630608340142957117612076039999931782120760400001489651207604000040464412076040000472567
75void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd]00109065119065164194304256002424145280x7f46b6ef16000x7f4586e35200229517229517193171836144655361141865681660258045855365212076040000498194120760400007104031207604000085056212076040000854346
86void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd]00129065119065164194304256002424149760x7f46b6ef15000x7f4586e35240229461229461209741835696655361185476391660132047600312012076040000914638120760400011089611207604000124848012076040001252526
97void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd]00149065119065164194304256002424154240x7f46b6ef14000x7f4586e35280215940215940213071727528655361458036121557827058503555612076040001342874120760400015276791207604000165967812076040001663290
108void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00169065119065164194304256002824161280x7f46b6ef13000x7f4586e352c04024534024533265432196326553633768574230458900135255924412076040001720847120760400019225571207604000217807612076040002219994
119void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd]00189065119065164194304256002824168320x7f46b6ef1a000x7f4586e353003976613976613223931812966553634887710330149060139732499212076040002256592120760400024487941207604000270159312076040002767943
1210void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd]00209065119065164194304256002424175360x7f46b6ef19000x7f4586e35340214805214805228001718448655361560707671542093062610428012076040002790675120760400029964721207604000312655112076040003130587
1311void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd]00229065119065164194304256002424182400x7f46b6ef18000x7f4586e35380220980220980217121767848655361394944881597248055979293212076040003190999120760400033828701207604000351775012076040003521533
1412void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd]00249065119065164194304256002424189440x7f46b6ef17000x7f4586e353c0218005218005234111744048655361466109051568498058825734812076040003593567120760400037743881207604000390638812076040003909995
1513void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00269065119065164194304256002824199040x7f46b6ef16000x7f4586e354004050614050612461432404966553625091645930586030100548448812076040003969145120760400041671871207604000442526512076040004492498
1614void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd]00289065119065164194304256002824206080x7f46b6ef15000x7f4586e35440402060402060334373216488655362463315703044240098714310812076040004517554120760400047270241207604000498222312076040005048842
1715void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd]00309065119065164194304256002424213120x7f46b6ef14000x7f4586e35480215428215428216311723432655361569893911550840062977170812076040005072796120760400052758211207604000540750112076040005411315
1816void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd]00329065119065164194304256002424220160x7f46b6ef13000x7f4586e354c0218597218597234691748784655361408582301565360056524830812076040005470866120760400056627001207604000579549912076040005799066
1917void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd]00349065119065164194304256002424227200x7f46b6ef1a000x7f4586e35500215036215036223391720296655361433451041550056057519864412076040005869907120760400060604581207604000619165712076040006195633
2018void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00369065119065164194304256002824236800x7f46b6ef19000x7f4586e355404073804073802896832590486553630398691930814360121776338412076040006247790120760400064468561207604000670605512076040006772435
2119void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd]00389065119065164194304256002824243840x7f46b6ef18000x7f4586e355804008774008773260332070246553634995617830391310140163928812076040006796309120760400069977331207604000725293212076040007322517
2220void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd]00409065119065164194304256002424250880x7f46b6ef17000x7f4586e355c0214069214069233821712560655361525697401541876061209701212076040007346442120760400075473311207604000767725012076040007681033
2321void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd]00429065119065164194304256002424257920x7f46b6ef16000x7f4586e35600225045225045253511800368655361306220931605735052430533612076040007737889120760400079311691207604000806732812076040008071369
2422void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd]00449065119065164194304256002424264960x7f46b6ef15000x7f4586e35640215429215429205871723440655361546683931548040062048966812076040008144845120760400083233271207604000845420712076040008457957
2523void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00469065119065164194304256002824277120x7f46b6ef14000x7f4586e356804132844132842897933062806553630392816931251010121752787612076040008515845120760400087020461207604000896604412076040009033838
2624void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd]00489065119065164194304256002824284160x7f46b6ef13000x7f4586e356c03994363994363269531954966553633742877730233970135152884012076040009058403120760400092607631207604000951452212076040009580944
2725void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd]00509065119065164194304256002424291200x7f46b6ef1a000x7f4586e35700213588213588220231708712655361447719011543386058090493612076040009605580120760400098026801207604000993356012076040009937397
2826void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd]00529065119065164194304256002424300800x7f46b6ef19000x7f4586e35740215252215252239521722024655361456400701545413058437876012076040009995665120760400101884391207604001031979812076040010323645
2927void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd]00549065119065164194304256002424307840x7f46b6ef18000x7f4586e35780217021217021232381736176655361433211401562050057510256812076040010393925120760400105722771207604001070475612076040010708450
3028void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00569065119065164194304256002824320000x7f46b6ef17000x7f4586e357c03990533990533361731924326553631572075530161740126469910412076040010767389120760400109650751207604001121995412076040011288868
3129void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd]00589065119065164194304256002824329600x7f46b6ef16000x7f4586e358003983723983723040831869846553633176947330160110132889515612076040011315718120760400115089131207604001176315112076040011829944
3230void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd]00609065119065164194304256002424339200x7f46b6ef15000x7f4586e35840215068215068202151720552655361490870961552098059816745612076040011853808120760400120559501207604001218698912076040012190764
3331void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd]00629065119065164194304256002424348800x7f46b6ef14000x7f4586e35880221564221564241291772520655361413153121600583056711672812076040012248652120760400124351481207604001257146812076040012575189
3432void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd]00649065119065164194304256002424358400x7f46b6ef13000x7f4586e358c0213725213725231951709808655361621856881530612065056150412076040012645760120760400128258661207604001295610612076040012959874
3533void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00669065119065164194304256002824373120x7f46b6ef1a000x7f4586e359004028294028293480132226406553630432535530500380121911607612076040013017511120760400132100251207604001346794312076040013534432
3634void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd]00689065119065164194304256002824382720x7f46b6ef19000x7f4586e359404023014023013297432184166553633653367130384450134794932412076040013558657120760400137596221207604001401578112076040014083292
3735void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd]00709065119065164194304256002424392320x7f46b6ef18000x7f4586e35980221189221189213951769520655361388164531603172055710910012076040014106445120760400143114601207604001444713912076040014450935
3836void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd]00729065119065164194304256002424401920x7f46b6ef17000x7f4586e359c0228596228596213131828776655361476940651633388059261320012076040014512189120760400146944981207604001483465712076040014838525
3937void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd]00749065119065164194304256002424411520x7f46b6ef16000x7f4586e35a00217508217508203811740072655361496594321571933060046883612076040014908535120760400150901761207604001522361512076040015227709
4038void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00769065119065164194304256002824426240x7f46b6ef15000x7f4586e35a403950853950853482431606886553635512311729846580142231149612076040015278874120760400154732141207604001572585312076040015792208
4139void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd]00789065119065164194304256002824435840x7f46b6ef14000x7f4586e35a803954603954602952831636886553633653318429974450134794936012076040015818036120760400160188121207604001627209012076040016339014
4240void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd]00809065119065164194304256002424445440x7f46b6ef13000x7f4586e35ac0213164213164233951705320655361454115651525211058346542012076040016364231120760400165581691207604001668792912076040016691749
4341void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd]00829065119065164194304256002424457600x7f46b6ef1a000x7f4586e35b00216012216012234911728104655361681109001549287067426485612076040016748325120760400169354471207604001706856712076040017072798
4442void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd]00849065119065164194304256002424467200x7f46b6ef19000x7f4586e35b40276405276405171442211248655361516988611504142060863202012076040017144240120760400173202461207604001749160512076040017495864
4543void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00869065119065164194304256002824484480x7f46b6ef18000x7f4586e35b804171084171083292233368726553634654278831472120138798679212076040017547029120760400177376841207604001800408212076040018071153
4644void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd]00889065119065164194304256002824494080x7f46b6ef17000x7f4586e35bc04041724041722716532333846553626522393830485560106271056812076040018097332120760400182916011207604001854968012076040018616326
4745void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd]00909065119065164194304256002424503680x7f46b6ef16000x7f4586e35c00214917214917257131719344655361672400051527358067078028412076040018641303120760400188432791207604001897239812076040018976155
4846void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd]00929065119065164194304256002424515840x7f46b6ef15000x7f4586e35c40228805228805266011830448655361390342951647105055795598412076040019035515120760400192227971207604001936439612076040019368604
4947void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd]00949065119065164194304256002424525440x7f46b6ef14000x7f4586e35c80213492213492246451707944655361656626601532723066447122412076040019440237120760400196155951207604001974535412076040019749342
5048void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00969065119065164194304256002824542720x7f46b6ef13000x7f4586e35cc04228204228203263433825686553633251767032022270133188493612076040019805747120760400199979931207604002026935212076040020336563
5149void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd]00989065119065164194304256002824554880x7f46b6ef1a000x7f4586e35d004039734039733590732317926553626887529430555430107731675212076040020361850120760400205599111207604002081750912076040020884301
5250void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd]001009065119065164194304256002424567040x7f46b6ef19000x7f4586e35d40217364217364222121738920655361432614191565211057486405212076040020908376120760400211075881207604002124054712076040021244521
5351void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd]001029065119065164194304256002424581760x7f46b6ef18000x7f4586e35d80219844219844248461758760655361628785861574982065334183612076040021305814120760400214883861207604002162358612076040021627452
5452void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd]001049065119065164194304256002424593920x7f46b6ef17000x7f4586e35dc0211261211261204951690096655361578041771522073063305598812076040021697613120760400218712651207604002200086412076040022006156
5553void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001069065119065164194304256002824613760x7f46b6ef16000x7f4586e35e004218294218293177933746406553632566664031895740130448159212076040022063493120760400222503031207604002252118212076040022587516
5654void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd]001089065119065164194304256002824625920x7f46b6ef15000x7f4586e35e404026124026123434332209046553634278948330449750137297379212076040022611090120760400228040601207604002306149912076040023131427
5755void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd]001109065119065164194304256002424638080x7f46b6ef14000x7f4586e35e80221061221061240711768496655361519027721593952060949256012076040023156303120760400233568581207604002349205712076040023495865
5856void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd]001129065119065164194304256002424652800x7f46b6ef13000x7f4586e35ec0219973219973273831759792655361652168781581038066272002012076040023555936120760400237382961207604002387413512076040023878075
5957void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd]001149065119065164194304256002424664960x7f46b6ef1a000x7f4586e35f00219285219285227551754288655361508596121575077060526054412076040023949788120760400241331741207604002426709312076040024271045
6058void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001169065119065164194304256002824684800x7f46b6ef19000x7f4586e35f404100694100693289532805606553630252828030789320121193476412076040024320707120760400245157321207604002477925112076040024845853
6159void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd]001189065119065164194304256002824696960x7f46b6ef18000x7f4586e35f804040204040203226032321686553634112722230550900136632452412076040024871140120760400250674101207604002532580912076040025366461
6260void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd]001209065119065164194304256002424709120x7f46b6ef17000x7f4586e35fc0212733212733215351701872655361544719521511540061973802812076040025410292120760400255853271207604002571556712076040025719587
6361void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd]001229065119065164194304256002424723840x7f46b6ef16000x7f4586e36000227941227941299951823536655361836092251636205073630252812076040025779048120760400259678861207604002610820512076040026112357
6462void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd]001249065119065164194304256002424736000x7f46b6ef15000x7f4586e36040226972226972223451815784655361360561771644714054607665612076040026183389120760400263562041207604002649604312076040026499927
6563void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001269065119065164194304256002824758400x7f46b6ef14000x7f4586e360804196604196603627233572886553635122380131783280140671140412076040026558306120760400267422821207604002701220112076040027079845
6664void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd]001289065119065164194304256002824770560x7f46b6ef13000x7f4586e360c03910683910683331031285526553635080588229562060140504031612076040027105553120760400272990791207604002755011812076040027616302
6765void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd]001309065119065164194304256002424782720x7f46b6ef1a000x7f4586e36100213036213036233071704296655361555348331536208062396638012076040027641078120760400278425971207604002797283612076040027976622
6866void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd]001329065119065164194304256002424800000x7f46b6ef19000x7f4586e36140233037233037269041864304655361804976371685506072385616412076040028035732120760400282309151207604002837523412076040028379340
6967void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd]001349065119065164194304256002424812160x7f46b6ef18000x7f4586e36180218709218709243631749680655361444544261575456057963775612076040028450182120760400286254731207604002875955312076040028763424
7068void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001369065119065164194304256002824834560x7f46b6ef17000x7f4586e361c04152054152053559533216486553632561742531328350130429404812076040028819518120760400290083521207604002927619012076040029317544
7169void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd]001389065119065164194304256002824849280x7f46b6ef16000x7f4586e362004022614022612915332180966553631664204830280110126839161612076040029355835120760400295353891207604002979314812076040029860032
7270void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd]001409065119065164194304256002424864000x7f46b6ef15000x7f4586e36240218933218933218691751472655361542413561571819061883340412076040029885980120760400300841871207604003021890612076040030223117
7371void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd]001429065119065164194304256002424881280x7f46b6ef14000x7f4586e36280242196242196280971937576655362120792561768719085017589212076040030282187120760400304677051207604003061778412076040030621778
7472void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd]001449065119065164194304256002424896000x7f46b6ef13000x7f4586e362c0217141217141217151737136655361452417141552626058280100812076040030711184120760400308853031207604003101858212076040031022593
7573void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001469065119065164194304256002824920960x7f46b6ef1a000x7f4586e363004254764254764030634038166553631077977232142660124493318412076040031082464120760400312718611207604003154594012076040031613210
7674void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd]001489065119065164194304256002824935680x7f46b6ef19000x7f4586e36340403556403556264853228456655362477089983039591099265391212076040031638197120760400318344181207604003209393712076040032163864
7775void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd]001509065119065164194304256002424950400x7f46b6ef18000x7f4586e36380221972221972232601775784655361417025381596849056868950812076040032188560120760400323902561207604003252641512076040032530385
7876void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd]001529065119065164194304256002424967680x7f46b6ef17000x7f4586e363c0252564252564277492020520655362210882961853491088621064412076040032589374120760400327729741207604003293073312076040032934746
7977void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd]001549065119065164194304256002424982400x7f46b6ef16000x7f4586e36400221052221052269341768424655361564868681561851062776605212076040033010607120760400331868921207604003332081212076040033324811
8078void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0015690651190651641943042560028241007360x7f46b6ef15000x7f4586e364404080284080283379432642326553631215540230630130125044076012076040033383280120760400335750501207604003383824912076040033904478
8179void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd]0015890651190651641943042560028241022080x7f46b6ef14000x7f4586e364803997173997173031431977446553628064045830083010112438564412076040033927511120760400341299281207604003438640712076040034453369
8280void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd]0016090651190651641943042560024241036800x7f46b6ef13000x7f4586e364c0225101225101239561800816655361484798021635268059577375212076040034476712120760400346721651207604003481120512076040034815091
8381void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd]0016290651190651641943042560024241056640x7f46b6ef1a000x7f4586e36500264941264941294362119536655362328597891950786093329131212076040034874902120760400350673631207604003523312312076040035237235
8482void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd]0016490651190651641943042560024241071360x7f46b6ef19000x7f4586e36540225516225516213551804136655361508573711630527060529151212076040035308798120760400354822421207604003562096112076040035625066
8583void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0016690651190651641943042560028241098880x7f46b6ef18000x7f4586e365804207414207413733433659366553631134724131676740124720940412076040035682914120760400358702401207604003614095912076040036212187
8684void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd]0016890651190651641943042560028241113600x7f46b6ef17000x7f4586e365c03940693940693242731525606553634732119429861760139110304412076040036235210120760400364355171207604003668959612076040036756298
8785void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd]0017090651190651641943042560024241128320x7f46b6ef16000x7f4586e36600225044225044233811800360655361527287721617037061279084412076040036779331120760400369755151207604003711407412076040037118031
8886void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd]0017290651190651641943042560024241148160x7f46b6ef15000x7f4586e36640275997275997293992207984655362462311872044116098678055612076040037175437120760400373639931207604003753807212076040037542009
8987void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd]0017490651190651641943042560024241162880x7f46b6ef14000x7f4586e36680219420219420241481755368655361512106871582495060667032412076040037612480120760400377857511207604003792047012076040037924329
9088void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0017690651190651641943042560028241190400x7f46b6ef13000x7f4586e366c04065334065333568932522726553632771181330540930131267688812076040037984070120760400381772691207604003843982812076040038506892
9189void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd]0017890651190651641943042560028241207680x7f46b6ef1a000x7f4586e367004044294044293046832354406553626101500830375840104588744812076040038533000120760400387267071207604003898622512076040039053868
9290void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd]0018090651190651641943042560024241224960x7f46b6ef19000x7f4586e36740223212223212240451785704655361581602791609118063452238812076040039077643120760400392751841207604003941326312076040039417134
9391void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd]0018290651190651641943042560024241247360x7f46b6ef18000x7f4586e367802909812909813144623278566553625765474321544150103246689212076040039475101120760400396598221207604003984302112076040039849367
9492void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd]0018490651190651641943042560024241264640x7f46b6ef17000x7f4586e367c0220692220692219161765544655361527080981591573061271335212076040039934205120760400401217401207604004025789912076040040262194
9593void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0018690651190651641943042560020241279360x7f46b6ef16000x7f4586e368004121404121403658432971286553637735661431198480151124751212076040040313820120760400405084581207604004077517712076040040823096
9694void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd]0018890651190651641943042560028241296640x7f46b6ef15000x7f4586e368404619414619411584036955366553629205605530563910117004240412076040040846490120760400410489361207604004134797412076040041414856
9795void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd]0019090651190651641943042560024241313920x7f46b6ef14000x7f4586e36880221989221989263201775920655361559964261601369062583481612076040041438590120760400416374131207604004177357212076040041777560
9896void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd]0019290651190651641943042560024241336320x7f46b6ef13000x7f4586e368c03032773032773063724262246553626375585522595140105687245612076040041837171120760400420241311207604004221661012076040042265497
9997void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd]0019490651190651641943042560024241353600x7f46b6ef1a000x7f4586e36900218364218364268421746920655361520397701568317061000234412076040042301314120760400424786891207604004261308912076040042616970
10098void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0019690651190651641943042560020241368320x7f46b6ef19000x7f4586e369404373654373653863434989286553640552711233342590162392922412076040042675229120760400428588471207604004314348612076040043192660
10199void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd]0019890651190651641943042560028241385600x7f46b6ef18000x7f4586e369804024774024773452532198246553631669801230337060126861942412076040043217486120760400434118051207604004367100412076040043719900
102100void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd]0020090651190651641943042560024241402880x7f46b6ef17000x7f4586e369c0222028222028238751776232655361462511651607047058687719612076040043744265120760400439370821207604004407436212076040044078376
103101void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd]0020290651190651641943042560024241427840x7f46b6ef16000x7f4586e36a003325653325653629326605286553629922501524727430119874969612076040044137516120760400443313211207604004454124012076040044565301
104102void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd]0020490651190651641943042560024241447680x7f46b6ef15000x7f4586e36a40226381226381261591811056655361563947621636670062747882012076040044628428120760400448055581207604004494539812076040044949305
105103void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0020690651190651641943042560020241457280x7f46b6ef14000x7f4586e36a805160285160281601941282326553643914114335979160175838435212076040045012142120760400452057171207604004554283512076040045592891
106104void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd]0020890651190651641943042560028241477120x7f46b6ef13000x7f4586e36ac04049244049243414232394006553630651638530515540122788550012076040045618188120760400458204561207604004608141512076040046133516
107105void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd]0021090651190651641943042560024241496960x7f46b6ef1a000x7f4586e36b00225188225188265981801512655361567036501616290062869087212076040046154004120760400463567731207604004649613212076040046499225
108106void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd]0021290651190651641943042560024241521920x7f46b6ef19000x7f4586e36b403585493585493584828684006553632765631327013980131248163612076040046557123120760400467428511207604004697149012076040047018711
109107void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd]0021490651190651641943042560024241541760x7f46b6ef18000x7f4586e36b80226821226821245721814576655361563144841629206062714125212076040047055289120760400472391701207604004737964912076040047382747
110108void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0021690651190651641943042560020241556480x7f46b6ef17000x7f4586e36bc05483895483891602543871206553647144675438807630188760768412076040047439833120760400476330881207604004799164712076040048040079
111109void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd]0021890651190651641943042560028241576320x7f46b6ef16000x7f4586e36c004093964093963450832751766553633599387530832740134580133612076040048063232120760400482617261207604004852604512076040048573320
112110void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd]0022090651190651641943042560024241596160x7f46b6ef15000x7f4586e36c40220709220709227091765680655361574662381586250063171615212076040048596132120760400487906841207604004892716312076040048930353
113111void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd]0022290651190651641943042560024241623680x7f46b6ef14000x7f4586e36c803820693820693726830565606553634974816528871620140083760012076040048990084120760400491879631207604004943260212076040049481868
114112void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd]0022490651190651641943042560024241646080x7f46b6ef13000x7f4586e36cc0221109221109253501768880655361616948631598166064865471212076040049517885120760400497009211207604004983788012076040049841356
115113void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0022690651190651641943042560020241663360x7f46b6ef1a000x7f4586e36d006137976137971687949103846553654205371544263830217003618412076040049899485120760400500988391207604005050043812076040050548691
116114void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd]0022890651190651641943042560028241685760x7f46b6ef19000x7f4586e36d404128374128373567033027046553632429344931208260129898954812076040050573407120760400507794771207604005104571612076040051095197
117115void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd]0023090651190651641943042560024241708160x7f46b6ef18000x7f4586e36d80225268225268279051802152655361672340471618662067079195212076040051118620120760400513257151207604005146555412076040051468821
118116void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd]0023290651190651641943042560024241740800x7f46b6ef17000x7f4586e36dc04358204358204199434865686553640274826133116630161284156012076040051527991120760400517234731207604005200379212076040052052626
119117void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd]0023490651190651641943042560024241765760x7f46b6ef16000x7f4586e36e00226029226029256031808240655361875170991638322075195877212076040052095706120760400522748311207604005241547112076040052418676
120118void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0023690651190651641943042560020241777920x7f46b6ef15000x7f4586e36e406475016475015331651800166553661276827250038030245289266012076040052477155120760400526628301207604005308810812076040053136671
121119void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd]0023890651190651641943042560028241802880x7f46b6ef14000x7f4586e36e804104604104603745332836886553632060076430850400128424674412076040053165484120760400533586671207604005362490712076040053646749
122120void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd]0024090651190651641943042560024241827840x7f46b6ef13000x7f4586e36ec0225253225253265041802032655361848650231613351074135085612076040053705768120760400538817061207604005402138512076040054024791
123121void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd]0024290651190651641943042560024241863040x7f46b6ef1a000x7f4586e36f004863804863804214838910486553645531995837235700182312554812076040054080385120760400542821841207604005459642312076040054645665
124122void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd]0024490651190651641943042560024241893120x7f46b6ef19000x7f4586e36f40245700245700296721965608655362135687811786509085616752412076040054680700120760400548660221207604005501866212076040055022435
125123void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0024690651190651641943042560020241907840x7f46b6ef18000x7f4586e36f807870697870696101562965606553675007875461222570300213522412076040055080273120760400552674611207604005578633912076040055834324
126124void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd]0024890651190651641943042560028241937920x7f46b6ef17000x7f4586e36fc04585004585004375036680086553637811866234771520151430583212076040055857728120760400560597781207604005635769712076040056405706
127125void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd]0025090651190651641943042560024241968000x7f46b6ef16000x7f4586e37000246436246436276971971496655362170719431807845087017354812076040056429360120760400566248961207604005677961512076040056782927
128126void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd]0025290651190651641943042560024242010880x7f46b6ef15000x7f4586e370405977405977405117947819286553655609212245949750222622243612076040056843560120760400570356141207604005742265312076040057473460
129127void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd]0025490651190651641943042560024242046080x7f46b6ef14000x7f4586e37080277292277292295332218344655362479859002053420099381734812076040057514286120760400576906521207604005786601112076040057869196
130128void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0025690651190651641943042560020242060800x7f46b6ef13000x7f4586e370c09259409259406874874075286553689003325772344550356195358012076040057927144120760400581311301207604005874104812076040058791690
131129void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd]0025890651190651641943042560028242096000x7f46b6ef1a000x7f4586e371005023895023894382840191206553645686399938451920182928814412076040058815995120760400590108071207604005933928612076040059407495
132130void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd]0026090651190651641943042560024242131200x7f46b6ef19000x7f4586e371402838202838203064122705686553625464843021033330102049133212076040059431590120760400596277651207604005980728412076040059810534
133131void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd]0026290651190651641943042560024242181760x7f46b6ef18000x7f4586e371806989176989175509955913446553666466642654232970266051638412076040059868842120760400600592831207604006051528212076040060581747
134132void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd]0026490651190651641943042560024242222080x7f46b6ef17000x7f4586e371c03149493149493277025196006553628534095523497350114325871612076040060617704120760400607984811207604006099912012076040061065526
135133void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0026690651190651641943042560020242239360x7f46b6ef16000x7f4586e372001067669106766978092854136065536102931594683553280411908482812076040061089020120760400612880791207604006199111612076040062058101
136134void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd]0026890651190651641943042560028242279680x7f46b6ef15000x7f4586e372405677095677094826845416806553652818654243659530211458237212076040062084480120760400622826351207604006265527412076040062722435
137135void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd]0027090651190651641943042560024242320000x7f46b6ef14000x7f4586e372803184603184603196325476886553628960696123783610116031694012076040062744056120760400629411931207604006314391212076040063212486
138136void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd]0027290651190651641943042560024242378240x7f46b6ef13000x7f4586e372c08044938044936137064359526553677007805862687230308215806812076040063235008120760400634343111207604006396054912076040064028603
139137void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd]0027490651190651641943042560024242423680x7f46b6ef1a000x7f4586e373003486693486693394827893606553631964423926250000128047280812076040064063538120760400642498281207604006447318712076040064539582
140138void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0027690651190651641943042560020242435840x7f46b6ef19000x7f4586e373401208797120879786053967038465536116784818694951180467321197612076040064562695120760400647581461207604006555686412076040065623858
141139void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd]0027890651190651641943042560028242481280x7f46b6ef18000x7f4586e373806716936716931569853735526553660140860049264860240748307612076040065647752120760400658491831207604006629158112076040066361508
142140void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd]0028090651190651641943042560024242526720x7f46b6ef17000x7f4586e373c03539413539413496828315366553632397484826577210129779146012076040066392917120760400665903001207604006681589912076040066883489
143141void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd]0028290651190651641943042560024242592640x7f46b6ef16000x7f4586e374009107499107496681472860006553687474911471187680350085080412076040066912322120760400671112581207604006770869612076040067777470
144142void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd]0028490651190651641943042560024242648320x7f46b6ef15000x7f4586e374404187494187494114333500006553638583470731722300154523714412076040067812435120760400679997351207604006826837412076040068334305
145143void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0028690651190651641943042560020242663040x7f46b6ef14000x7f4586e374801487405148740510040111899248655361448118019117347610579429269212076040068358179120760400685552531207604006953988912076040069607471
146144void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd]0028890651190651641943042560028242718720x7f46b6ef13000x7f4586e374c07787247787246113362298006553674030122060549610296305505212076040069638679120760400698394081207604007035348612076040070420201
147145void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd]0029090651190651641943042560024242774400x7f46b6ef1a000x7f4586e375004213324213323976933706646553638884798031951230155727764812076040070444727120760400706480451207604007091860412076040070985332
148146void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd]0029290651190651641943042560012242799360x7f46b6ef19000x7f4586e375401128668112866881730902935265536109025483688503610436284203212076040071017071120760400712086831207604007194740112076040072019263
149147void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd]0029490651190651641943042560024242865280x7f46b6ef18000x7f4586e375804893644893644357039149206553645700646037444260182991896412076040072054649120760400722421201207604007255859812076040072624889
150148void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0029690651190651641943042560020242880000x7f46b6ef17000x7f4586e375c0176917317691734791314153392655361725176960139804150690252829212076040072649124120760400728481971207604007401843312076040074085553
151149void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd]0029890651190651641943042560032242945920x7f46b6ef16000x7f4586e376009218219218216673173745766553680691037071854130322948416412076040074111251120760400743155521207604007492643012076040074992759
152150void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd]0030090651190651641943042560024243011840x7f46b6ef15000x7f4586e376404949564949564451839596566553646147406637888880184779712412076040075021463120760400752233891207604007554402812076040075612641
153151void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd]0030290651190651641943042560012243049600x7f46b6ef14000x7f4586e37680133780413378042143810702440655361299299561105351040519902467212076040075636355120760400758313871207604007670962312076040076776184
154152void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd]0030490651190651641943042560024243136000x7f46b6ef13000x7f4586e376c06324136324135575550593126553659331076448614370237513496812076040076811940120760400769958621207604007740610112076040077472588
155153void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0030690651190651641943042560020243148160x7f46b6ef1a000x7f4586e377002333372233337215056418666984655362284383508184965060913935446412076040077495811120760400776941001207604007924129412076040079309111
156154void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd]0030890651190651641943042560020243175680x7f46b6ef19000x7f4586e377401202484120248485773961988065536116289511194480330465340525612076040079338095120760400795433731207604008033793012076040080405529
157155void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd]0031090651190651641943042560012243203200x7f46b6ef18000x7f4586e377806411566411565181551292566553660698875849614250242978258412076040080435795120760400806329691207604008104800812076040081115528
158156void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd]0031290651190651641943042560012243240960x7f46b6ef17000x7f4586e377c01757917175791711718614063344655361714655878138953140686044861612076040081146566120760400813363271207604008249472312076040082561846
159157void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd]0031490651190651641943042560012243288960x7f46b6ef16000x7f4586e378001201173120117385559960939265536116225222594259600465083686812076040082600558120760400827820821207604008356799912076040083638617
160158void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0031690651190651641943042560020243301120x7f46b6ef15000x7f4586e3784045844614584461211089366756966553645159040823650550701806543803212076040083670266120760400838668781207604008691726712076040086985577
161159void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd]0031890651190651641943042560020243328640x7f46b6ef14000x7f4586e378802325957232595715245118607664655362275707759184312370910465616412076040087021314120760400872214261207604008876286012076040088832309
162160void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd]0032090651190651641943042560012243356160x7f46b6ef13000x7f4586e378c01203877120387784087963102465536116566398794636180466448020012076040088862886120760400890791791207604008986925612076040089938545
163161void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd]0032290651190651641943042560012243393920x7f46b6ef1a000x7f4586e3790034450923445092216660275607446553633859317502738412501354555388012076040089966658120760400901750151207604009245708712076040092525754
164162void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd]0032490651190651641943042560012243441920x7f46b6ef19000x7f4586e379402324173232417315036718593392655362274813929184193270910108116412076040092569946120760400927473261207604009428268012076040094351026
165163void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0032690651190651641943042560020243454080x7f46b6ef18000x7f4586e3798090886689088668545077727093526553689779632307253109703591367454812076040094382514120760400945778791207604010063129712076040100702480
166164void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd]0032890651190651641943042560020243481600x7f46b6ef17000x7f4586e379c045735494573549212175365884006553645022160923641485901801068714412076040100729830120760401009298561207604010397176512076040104042537
167165void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd]0033090651190651641943042560012243509120x7f46b6ef16000x7f4586e37a002330860233086015113118646888655362281424313184646060912752264812076040104072813120760401042725641207604010581207912076040105879952
168166void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd]00332906511906516419430425600122400x7f46b6ef15000x7f4586e37a4068143726814372413964545149846553667209027795433803102688543697212076040105910138120760401061088081207604011063599212076040110712513