Fichiers
rocm-systems/tests/workloads/dev0/mi100/SQ_INST_LEVEL_VMEM.csv
T
colramos-amd 62d130b458 Initial commit
2022-11-04 14:49:36 -05:00

43 KiB

1IndexKernelNamegpu-idqueue-idqueue-indexpidtidgrdwgrldsscrvgprsgprfbarsigobjSQ_INSTS_VMEMSQ_INST_LEVEL_VMEMSQ_ACCUM_PREV_HIRESDispatchNsBeginNsEndNsCompleteNs
20__amd_rocclr_fillBuffer.kd000921153921158335544322560083264640x00x7fbf7ac04180104857611001658140805285612076324607361092120763248515788561207632485190365412076324852039846
31void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd]00292115392115832768256002424124800x00x7fbf7ac3510040961132891447966012076324866554932120763248668517771207632486685801712076324866863235
42void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd]0049211539211584194304256002424129280x7fc0aab919000x7fbf7ac3514052428812401318158731127612076324866927514120763248671484151207632486727961512076324867283767
53void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0069211539211584194304256003624136320x7fc0aab918000x7fbf7ac3518052428813924068178235147612076324867354438120763248675256931207632486777353212076324867842695
64void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd]0089211539211584194304256002824140800x7fc0aab917000x7fbf7ac351c052428814366779183888098412076324867872430120763248680629711207632486831480912076324868383570
75void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd]00109211539211584194304256002424145280x7fc0aab916000x7fbf7ac3520052428811167660142951692812076324868408617120763248685949681207632486873160712076324868735214
86void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd]00129211539211584194304256002424149760x7fc0aab915000x7fbf7ac3524052428812212582156314372812076324868785387120763248689562461207632486908888512076324869092698
97void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd]00149211539211584194304256002424154240x7fc0aab914000x7fbf7ac3528052428812734855163007428012076324869171385120763248693426441207632486947256312076324869476321
108void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00169211539211584194304256002824161280x7fc0aab913000x7fbf7ac352c052428813905355177983288812076324869526575120763248697052021207632486995896112076324870005104
119void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd]00189211539211584194304256002824168320x7fc0aab91a000x7fbf7ac3530052428813638895174572036812076324870031794120763248702112801207632487046663812076324870507167
1210void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd]00209211539211584194304256002424175360x7fc0aab919000x7fbf7ac3534052428811953865153002898412076324870530250120763248707186371207632487085191612076324870855575
1311void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd]00229211539211584194304256002424182400x7fc0aab918000x7fbf7ac3538052428811019037141045298812076324870903554120763248710794351207632487121623512076324871220112
1412void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd]00249211539211584194304256002424189440x7fc0aab917000x7fbf7ac353c052428812347166158039368812076324871281817120763248714459931207632487157783312076324871581554
1513void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00269211539211584194304256002824199040x7fc0aab916000x7fbf7ac3540052428814251323182418266412076324871624504120763248718015121207632487205607012076324872124513
1614void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd]00289211539211584194304256002824206080x7fc0aab915000x7fbf7ac3544052428814134381180918494812076324872148016120763248723368691207632487259078812076324872657093
1715void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd]00309211539211584194304256002424213120x7fc0aab914000x7fbf7ac3548052428812003708153640132012076324872680987120763248728591061207632487299206612076324872995692
1816void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd]00329211539211584194304256002424220160x7fc0aab913000x7fbf7ac354c052428812761839163355080012076324873044783120763248732155841207632487334582412076324873349419
1917void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd]00349211539211584194304256002424227200x7fc0aab91a000x7fbf7ac3550052428812355665158151077212076324873408950120763248735720631207632487370374212076324873707294
2018void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00369211539211584194304256002824236800x7fc0aab919000x7fbf7ac3554052428813960437178686042412076324873758660120763248739199011207632487417205912076324874214918
2119void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd]00389211539211584194304256002824243840x7fc0aab918000x7fbf7ac3558052428814296440182992597612076324874237069120763248744243781207632487467253712076324874713925
2220void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd]00409211539211584194304256002424250880x7fc0aab917000x7fbf7ac355c052428811419318146157915612076324874735505120763248749179761207632487505285512076324875056792
2321void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd]00429211539211584194304256002424257920x7fc0aab916000x7fbf7ac3560052428812716538162762904412076324875107927120763248752789341207632487540917312076324875413004
2422void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd]00449211539211584194304256002424264960x7fc0aab915000x7fbf7ac3564052428812786121163675589212076324875472425120763248756346121207632487576485112076324875768585
2523void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00469211539211584194304256002824277120x7fc0aab914000x7fbf7ac3568052428813985714179015853212076324875816554120763248759827701207632487623524912076324876303439
2624void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd]00489211539211584194304256002824284160x7fc0aab913000x7fbf7ac356c052428813560902173575630012076324876330079120763248765072481207632487675844612076324876825439
2725void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd]00509211539211584194304256002424291200x7fc0aab91a000x7fbf7ac3570052428811718659149995151212076324876850366120763248770344451207632487716820412076324877171973
2826void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd]00529211539211584194304256002424300800x7fc0aab919000x7fbf7ac3574052428812932359165530450812076324877219902120763248773891631207632487751940212076324877523086
2927void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd]00549211539211584194304256002424307840x7fc0aab918000x7fbf7ac3578052428812610659161416058412076324877581434120763248777414811207632487787140112076324877875140
3028void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00569211539211584194304256002824320000x7fc0aab917000x7fbf7ac357c052428814065498180033720812076324877923720120763248781158791207632487837203812076324878439409
3129void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd]00589211539211584194304256002824329600x7fc0aab916000x7fbf7ac3580052428814390289184190087212076324878466319120763248786425971207632487889683512076324878963042
3230void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd]00609211539211584194304256002424339200x7fc0aab915000x7fbf7ac3584052428811632795148887534412076324878988389120763248791721941207632487930771312076324879311890
3331void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd]00629211539211584194304256002424348800x7fc0aab914000x7fbf7ac3588052428813041589166931122412076324879360360120763248795262721207632487965699112076324879660839
3432void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd]00649211539211584194304256002424358400x7fc0aab913000x7fbf7ac358c052428813141993168224960412076324879722754120763248798857901207632488001411012076324880017852
3533void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00669211539211584194304256002824373120x7fc0aab91a000x7fbf7ac3590052428813903488177963789612076324880067464120763248802392291207632488049570712076324880563456
3634void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd]00689211539211584194304256002824382720x7fc0aab919000x7fbf7ac3594052428813863049177444487612076324880586780120763248807720261207632488102274512076324881091307
3735void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd]00709211539211584194304256002424392320x7fc0aab918000x7fbf7ac3598052428812585259161091515612076324881119910120763248812995431207632488143058212076324881434365
3836void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd]00729211539211584194304256002424401920x7fc0aab917000x7fbf7ac359c052428812147124155484326412076324881482705120763248816539411207632488178722112076324881791128
3937void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd]00749211539211584194304256002424411520x7fc0aab916000x7fbf7ac35a0052428812065079154432188412076324881850709120763248820123391207632488214497912076324882148993
4038void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00769211539211584194304256002824426240x7fc0aab915000x7fbf7ac35a4052428813593200173992994412076324882196461120763248823683381207632488262545612076324882691912
4139void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd]00789211539211584194304256002824435840x7fc0aab914000x7fbf7ac35a8052428814200515181760208412076324882713462120763248828921751207632488314529412076324883216226
4240void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd]00809211539211584194304256002424445440x7fc0aab913000x7fbf7ac35ac052428812974942166088950012076324883238357120763248834180921207632488354753212076324883551209
4341void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd]00829211539211584194304256002424457600x7fc0aab91a000x7fbf7ac35b0052428812389424158581589612076324883599499120763248837646511207632488389681012076324883900618
4442void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd]00849211539211584194304256002424467200x7fc0aab919000x7fbf7ac35b4052428812579260161010188012076324883959738120763248841280091207632488425824812076324884262240
4543void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00869211539211584194304256002824484480x7fc0aab918000x7fbf7ac35b8052428813798283176617938412076324884310390120763248844772871207632488474160612076324884808636
4644void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd]00889211539211584194304256002824494080x7fc0aab917000x7fbf7ac35bc052428813967280178776512012076324884832991120763248850075241207632488530144312076324885368246
4745void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd]00909211539211584194304256002424503680x7fc0aab916000x7fbf7ac35c0052428812768928163442007212076324885393152120763248855755211207632488570528112076324885709039
4846void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd]00929211539211584194304256002424515840x7fc0aab915000x7fbf7ac35c4052428811048220141410174812076324885756788120763248859227191207632488605999912076324886063758
4947void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd]00949211539211584194304256002424525440x7fc0aab914000x7fbf7ac35c8052428811869975151941129212076324886124431120763248862881581207632488642031712076324886424038
5048void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]00969211539211584194304256002824542720x7fc0aab913000x7fbf7ac35cc052428812994597166322839612076324886468681120763248866371161207632488690687412076324886949354
5149void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd]00989211539211584194304256002824554880x7fc0aab91a000x7fbf7ac35d0052428814232764182178846012076324886975783120763248871547131207632488740671212076324887475632
5250void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd]001009211539211584194304256002424567040x7fc0aab919000x7fbf7ac35d4052428813097771167657116412076324887499006120763248876753511207632488780415012076324887808080
5351void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd]001029211539211584194304256002424581760x7fc0aab918000x7fbf7ac35d805242889712685124326828412076324887858624120763248880307091207632488817278812076324888176825
5452void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd]001049211539211584194304256002424593920x7fc0aab917000x7fbf7ac35dc052428811709071149877983612076324888236827120763248883979071207632488853102612076324888534821
5553void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001069211539211584194304256002824613760x7fc0aab916000x7fbf7ac35e0052428814539178186107240812076324888582319120763248887468651207632488901454412076324889081958
5654void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd]001089211539211584194304256002824625920x7fc0aab915000x7fbf7ac35e4052428814171868181402137612076324889105682120763248892929421207632488954478112076324889611411
5755void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd]001109211539211584194304256002424638080x7fc0aab914000x7fbf7ac35e8052428811767035150617742412076324889635867120763248898183801207632488999341912076324889997218
5856void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd]001129211539211584194304256002424652800x7fc0aab913000x7fbf7ac35ec05242889202080117785257212076324890047051120763248902158181207632489035677712076324890360614
5957void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd]001149211539211584194304256002424664960x7fc0aab91a000x7fbf7ac35f0052428812333047157866547212076324890422609120763248905834961207632489071405512076324890718158
6058void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001169211539211584194304256002824684800x7fc0aab919000x7fbf7ac35f4052428813147150168278038812076324890763743120763248909329341207632489119693312076324891267369
6159void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd]001189211539211584194304256002824696960x7fc0aab918000x7fbf7ac35f8052428814153714181163285212076324891292906120763248914689311207632489171789012076324891784791
6260void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd]001209211539211584194304256002424709120x7fc0aab917000x7fbf7ac35fc052428811152062142748681212076324891810709120763248919838091207632489211804812076324892122168
6361void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd]001229211539211584194304256002424723840x7fc0aab916000x7fbf7ac36000524288759546997216073212076324892171249120763248923354871207632489247580612076324892479612
6462void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd]001249211539211584194304256002424736000x7fc0aab915000x7fbf7ac3604052428812148182155494880812076324892538181120763248926958051207632489282892412076324892832708
6563void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001269211539211584194304256002824758400x7fc0aab914000x7fbf7ac3608052428813124035167984818812076324892880517120763248930702031207632489333180212076324893381418
6664void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd]001289211539211584194304256002824770560x7fc0aab913000x7fbf7ac360c052428814233274182179280812076324893405332120763248935860401207632489383915912076324893888650
6765void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd]001309211539211584194304256002424782720x7fc0aab91a000x7fbf7ac3610052428812840930164371955612076324893913857120763248940954781207632489422411712076324894228342
6866void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd]001329211539211584194304256002424800000x7fc0aab919000x7fbf7ac36140524288704078290118722812076324894275089120763248944461961207632489459035512076324894594292
6967void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd]001349211539211584194304256002424812160x7fc0aab918000x7fbf7ac3618052428812809973163961312012076324894654794120763248948132341207632489494347312076324894947218
7068void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001369211539211584194304256002824834560x7fc0aab917000x7fbf7ac361c052428814132386180891475612076324894994185120763248951684321207632489543371112076324895484486
7169void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd]001389211539211584194304256002824849280x7fc0aab916000x7fbf7ac3620052428813678968175085519212076324895509914120763248956882701207632489593834812076324895987581
7270void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd]001409211539211584194304256002424864000x7fc0aab915000x7fbf7ac3624052428811779596150783337212076324896020793120763248962049071207632489633898612076324896342932
7371void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd]001429211539211584194304256002424881280x7fc0aab914000x7fbf7ac36280524288537032968750004412076324896392764120763248965589851207632489671018412076324896714011
7472void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd]001449211539211584194304256002424896000x7fc0aab913000x7fbf7ac362c052428812296817157399903212076324896791876120763248969495431207632489708154312076324897085722
7573void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]001469211539211584194304256002824920960x7fc0aab91a000x7fbf7ac3630052428811501488147220209612076324897134282120763248973055411207632489757354012076324897596201
7674void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd]001489211539211584194304256002824935680x7fc0aab919000x7fbf7ac3634052428813320122170498375212076324897638279120763248977972191207632489805545812076324898107120
7775void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd]001509211539211584194304256002424950400x7fc0aab918000x7fbf7ac3638052428812016359153803447612076324898134050120763248983108161207632489844361612076324898447503
7876void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd]001529211539211584194304256002424967680x7fc0aab917000x7fbf7ac363c0524288432613155372332412076324898495282120763248986618541207632489881929412076324898823261
7977void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd]001549211539211584194304256002424982400x7fc0aab916000x7fbf7ac3640052428812239178156661340012076324898883263120763248990492121207632489918217212076324899186055
8078void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0015692115392115841943042560028241007360x7fc0aab915000x7fbf7ac3644052428812133403155310115212076324899233854120763248994071311207632489967448912076324899722693
8179void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd]0015892115392115841943042560028241022080x7fc0aab914000x7fbf7ac3648052428813469460172408946412076324899748821120763248999226481207632490018360712076324900237450
8280void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd]0016092115392115841943042560024241036800x7fc0aab913000x7fbf7ac364c052428810572687135322016012076324900264750120763249004432851207632490058328512076324900586959
8381void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd]0016292115392115841943042560024241056640x7fc0aab91a000x7fbf7ac36500524288414210353026036012076324900636742120763249008104831207632490097640312076324900980340
8482void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd]0016492115392115841943042560024241071360x7fc0aab919000x7fbf7ac3654052428812008178153701735612076324901042836120763249012053611207632490133864112076324901342203
8583void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0016692115392115841943042560028241098880x7fc0aab918000x7fbf7ac365805242889834726125881087612076324901393728120763249015552801207632490182167812076324901867108
8684void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd]0016892115392115841943042560028241113600x7fc0aab917000x7fbf7ac365c052428814102675180517604012076324901893748120763249020728771207632490232663612076324902374351
8785void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd]0017092115392115841943042560024241128320x7fc0aab916000x7fbf7ac3660052428810607477135773605612076324902401040120763249025771941207632490271575412076324902719783
8886void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd]0017292115392115841943042560024241148160x7fc0aab915000x7fbf7ac36640524288352727645141312812076324902766670120763249029330331207632490310695212076324903111360
8987void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd]0017492115392115841943042560024241162880x7fc0aab914000x7fbf7ac3668052428812880722164875098412076324903171562120763249033357511207632490346503012076324903468805
9088void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0017692115392115841943042560028241190400x7fc0aab913000x7fbf7ac366c05242889146419117076091612076324903512506120763249036823091207632490393990712076324903986697
9189void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd]0017892115392115841943042560028241207680x7fc0aab91a000x7fbf7ac3670052428814038124179687196812076324904016483120763249041983061207632490445350512076324904502616
9290void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd]0018092115392115841943042560024241224960x7fc0aab919000x7fbf7ac3674052428810574105135349675612076324904529416120763249047104641207632490484966312076324904853478
9391void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd]0018292115392115841943042560024241247360x7fc0aab918000x7fbf7ac36780524288345739944251811612076324904902720120763249050723821207632490525574112076324905259603
9492void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd]0018492115392115841943042560024241264640x7fc0aab917000x7fbf7ac367c052428810207108130652510012076324905320226120763249054797401207632490566437912076324905668333
9593void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0018692115392115841943042560020241279360x7fc0aab916000x7fbf7ac36800524288412591352813966012076324905718255120763249058795781207632490617861612076324906225939
9694void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd]0018892115392115841943042560028241296640x7fc0aab915000x7fbf7ac3684052428813900881177927794412076324906251737120763249064307751207632490668533312076324906733031
9795void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd]0019092115392115841943042560024241313920x7fc0aab914000x7fbf7ac3688052428811632847148897187212076324906758919120763249069317321207632490706613212076324907069937
9896void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd]0019292115392115841943042560024241336320x7fc0aab913000x7fbf7ac368c0524288343735243999719612076324907120692120763249072907701207632490748276912076324907530934
9997void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd]0019492115392115841943042560024241353600x7fc0aab91a000x7fbf7ac3690052428811389714145791364012076324907569756120763249077291681207632490786420712076324907868001
10098void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0019692115392115841943042560020241368320x7fc0aab919000x7fbf7ac36940524288291474337316253612076324907916030120763249080965261207632490838180512076324908430977
10199void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd]0019892115392115841943042560028241385600x7fc0aab918000x7fbf7ac3698052428813932315178328011612076324908456384120763249086333241207632490889252212076324908913363
102100void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd]0020092115392115841943042560024241402880x7fc0aab917000x7fbf7ac369c052428810430768133501685612076324908955692120763249091210011207632490926116012076324909265337
103101void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd]0020292115392115841943042560024241427840x7fc0aab916000x7fbf7ac36a00524288335110542907421612076324909313978120763249094801991207632490969011812076324909737725
104102void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd]0020492115392115841943042560024241447680x7fc0aab915000x7fbf7ac36a4052428810451016133771821612076324909776077120763249099349171207632491007347612076324910077457
105103void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0020692115392115841943042560020241457280x7fc0aab914000x7fbf7ac36a80524288256482032828286412076324910127720120763249102987551207632491060867312076324910655411
106104void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd]0020892115392115841943042560028241477120x7fc0aab913000x7fbf7ac36ac052428814030770179588942412076324910681670120763249108547521207632491110995112076324911160049
107105void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd]0021092115392115841943042560024241496960x7fc0aab91a000x7fbf7ac36b0052428810435639133581192012076324911186838120763249113629101207632491150210912076324911506032
108106void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd]0021292115392115841943042560024241521920x7fc0aab919000x7fbf7ac36b40524288323359541383024812076324911554852120763249117208281207632491198242612076324912029735
109107void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd]0021492115392115841943042560024241541760x7fc0aab918000x7fbf7ac36b8052428810017803128220986012076324912064670120763249122358651207632491237586412076324912379866
110108void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0021692115392115841943042560020241556480x7fc0aab917000x7fbf7ac36bc0524288249289631905036012076324912427394120763249125942631207632491292578212076324912947611
111109void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd]0021892115392115841943042560028241576320x7fc0aab916000x7fbf7ac36c0052428812895056165057224012076324912984680120763249131469001207632491340737912076324913456707
112110void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd]0022092115392115841943042560024241596160x7fc0aab915000x7fbf7ac36c4052428810583640135471780812076324913478728120763249136566581207632491379649712076324913800476
113111void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd]0022292115392115841943042560024241623680x7fc0aab914000x7fbf7ac36c80524288337622343203793612076324913848214120763249140152161207632491426113512076324914308670
114112void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd]0022492115392115841943042560024241646080x7fc0aab913000x7fbf7ac36cc05242889625041123204803212076324914345469120763249145113001207632491465146012076324914658581
115113void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0022692115392115841943042560020241663360x7fc0aab91a000x7fbf7ac36d00524288238514330524544412076324914705838120763249148653781207632491524265612076324915293090
116114void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd]0022892115392115841943042560028241685760x7fc0aab919000x7fbf7ac36d4052428813874201177580942812076324915318427120763249154943351207632491574905412076324915769124
117115void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd]0023092115392115841943042560024241708160x7fc0aab918000x7fbf7ac36d805242889307681119143317212076324915812435120763249159701731207632491611433212076324916118083
118116void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd]0023292115392115841943042560024241740800x7fc0aab917000x7fbf7ac36dc0524288336762243093203612076324916167244120763249163426511207632491665321012076324916701397
119117void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd]0023492115392115841943042560024241765760x7fc0aab916000x7fbf7ac36e005242888639586110582982812076324916739287120763249168972091207632491703224912076324917035628
120118void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0023692115392115841943042560020241777920x7fc0aab915000x7fbf7ac36e40524288233905929933944012076324917083978120763249172530481207632491767768612076324917724418
121119void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd]0023892115392115841943042560028241802880x7fc0aab914000x7fbf7ac36e8052428810103691129325003212076324917750777120763249179272851207632491819224412076324918240618
122120void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd]0024092115392115841943042560024241827840x7fc0aab913000x7fbf7ac36ec0524288730178893448442812076324918267037120763249184448831207632491858616212076324918589426
123121void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd]0024292115392115841943042560024241863040x7fc0aab91a000x7fbf7ac36f00524288344852244136770812076324918637465120763249188039211207632491911960012076324919170886
124122void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd]0024492115392115841943042560024241893120x7fc0aab919000x7fbf7ac36f40524288361011946220668812076324919207244120763249193695191207632491952391812076324919527128
125123void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0024692115392115841943042560020241907840x7fc0aab918000x7fbf7ac36f80524288230232929475131212076324919574777120763249197439171207632492026071512076324920307849
126124void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd]0024892115392115841943042560028241937920x7fc0aab917000x7fbf7ac36fc05242888378304107236975612076324920330802120763249205197541207632492081783312076324920838546
127125void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd]0025092115392115841943042560024241968000x7fc0aab916000x7fbf7ac37000524288332678342588426812076324920890202120763249210544721207632492120903112076324921212571
128126void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd]0025292115392115841943042560024242010880x7fc0aab915000x7fbf7ac37040524288326802341838676812076324921259578120763249214384701207632492182438812076324921871065
129127void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd]0025492115392115841943042560024242046080x7fc0aab914000x7fbf7ac37080524288340669243595080412076324921914355120763249220813471207632492225846712076324922261971
130128void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0025692115392115841943042560020242060800x7fc0aab913000x7fbf7ac370c0524288232136029720143212076324922310371120763249224800661207632492309062312076324923138600
131129void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd]0025892115392115841943042560028242096000x7fc0aab91a000x7fbf7ac37100524288372642347698295212076324923164739120763249233483821207632492367574112076324923721464
132130void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd]0026092115392115841943042560024242131200x7fc0aab919000x7fbf7ac37140524288310603939747340412076324923748774120763249239272601207632492410597912076324924109525
133131void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd]0026292115392115841943042560024242181760x7fc0aab918000x7fbf7ac37180524288331264342397868812076324924156622120763249243280581207632492478437612076324924832679
134132void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd]0026492115392115841943042560024242222080x7fc0aab917000x7fbf7ac371c0524288298309238188579612076324924872042120763249250395751207632492524021412076324925289097
135133void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0026692115392115841943042560020242239360x7fc0aab916000x7fbf7ac37200524288229130129333974412076324925311018120763249254970131207632492620757012076324926256495
136134void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd]0026892115392115841943042560028242279680x7fc0aab915000x7fbf7ac37240524288360225046117583212076324926280810120763249264610091207632492683508712076324926881707
137135void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd]0027092115392115841943042560024242320000x7fc0aab914000x7fbf7ac37280524288308903639532698412076324926908056120763249270938061207632492729764512076324927346741
138136void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd]0027292115392115841943042560024242378240x7fc0aab913000x7fbf7ac372c0524288403759751685639212076324927371627120763249275467641207632492807348212076324928121651
139137void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd]0027492115392115841943042560024242423680x7fc0aab91a000x7fbf7ac37300524288305038539035217212076324928160734120763249283216411207632492854516012076324928591574
140138void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0027692115392115841943042560020242435840x7fc0aab919000x7fbf7ac37340524288232440729741112412076324928613475120763249287961991207632492959619612076324929646785
141139void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd]0027892115392115841943042560028242481280x7fc0aab918000x7fbf7ac37380524288345181944189416412076324929672984120763249298505951207632493027203312076324930325016
142140void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd]0028092115392115841943042560024242526720x7fc0aab917000x7fbf7ac373c0524288313670640147688812076324930351976120763249305310721207632493075795112076324930806060
143141void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd]0028292115392115841943042560024242592640x7fc0aab916000x7fbf7ac37400524288464275059433647612076324930829994120763249310045101207632493160146712076324931650459
144142void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd]0028492115392115841943042560024242648320x7fc0aab915000x7fbf7ac37440524288320587841033140412076324931687067120763249318558661207632493212658512076324932177739
145143void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0028692115392115841943042560020242663040x7fc0aab914000x7fbf7ac37480524288230914629542813212076324932200201120763249323792241207632493336402012076324933431459
146144void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd]0028892115392115841943042560028242718720x7fc0aab913000x7fbf7ac374c0524288353594145250550812076324933462126120763249336377791207632493415297712076324934219604
147145void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd]0029092115392115841943042560024242774400x7fc0aab91a000x7fbf7ac37500524288320577941029586812076324934248407120763249344249761207632493469905412076324934765919
148146void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd]0029292115392115841943042560012242799360x7fc0aab919000x7fbf7ac37540524288219467028091035212076324934793480120763249349644931207632493570465012076324935773872
149147void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd]0029492115392115841943042560024242865280x7fc0aab918000x7fbf7ac37580524288328738542079203612076324935815820120763249359792091207632493629712812076324936364590
150148void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0029692115392115841943042560020242880000x7fc0aab917000x7fbf7ac375c0524288228082129190972812076324936393123120763249365716871207632493774336212076324937809225
151149void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd]0029892115392115841943042560032242945920x7fc0aab916000x7fbf7ac37600524288340785643619060812076324937839431120763249380092811207632493861807812076324938686485
152150void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd]0030092115392115841943042560024243011840x7fc0aab915000x7fbf7ac37640524288331020542367829612076324938717172120763249388921571207632493921119612076324939280329
153151void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd]0030292115392115841943042560012243049600x7fc0aab914000x7fbf7ac37680524288219622328099206812076324939309994120763249394926341207632494037183112076324940438000
154152void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd]0030492115392115841943042560024243136000x7fc0aab913000x7fbf7ac376c0524288327837641957516412076324940480008120763249406417501207632494105342812076324941120028
155153void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0030692115392115841943042560020243148160x7fc0aab91a000x7fbf7ac37700524288233181029853130012076324941151126120763249413236671207632494287342012076324942940451
156154void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd]0030892115392115841943042560020243175680x7fc0aab919000x7fbf7ac37740524288226303628978964012076324942963183120763249431543791207632494394973612076324944019366
157155void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd]0031092115392115841943042560012243203200x7fc0aab918000x7fbf7ac37780524288217361927821704012076324944048741120763249442286141207632494464397312076324944709699
158156void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd]0031292115392115841943042560012243240960x7fc0aab917000x7fbf7ac377c0524288224204228697148412076324944733664120763249449087721207632494606828712076324946136180
159157void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd]0031492115392115841943042560012243288960x7fc0aab916000x7fbf7ac37800524288224264628719170012076324946175754120763249463374061207632494712364212076324947191211
160158void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0031692115392115841943042560020243301120x7fc0aab915000x7fbf7ac37840524288266236334077092812076324947220205120763249473985211207632495044746812076324950514557
161159void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd]0031892115392115841943042560020243328640x7fc0aab914000x7fbf7ac37880524288229893129431936012076324950544573120763249507225071207632495226442112076324952331274
162160void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd]0032092115392115841943042560012243356160x7fc0aab913000x7fbf7ac378c0524288219716028108893612076324952360167120763249525447401207632495333401612076324953402354
163161void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd]0032292115392115841943042560012243393920x7fc0aab91a000x7fbf7ac37900524288253560232458242812076324953432911120763249536106551207632495589352612076324955961731
164162void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd]0032492115392115841943042560012243441920x7fc0aab919000x7fbf7ac37940524288238593430536972012076324956007636120763249561735241207632495770887812076324957778467
165163void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0032692115392115841943042560020243454080x7fc0aab918000x7fbf7ac37980524288288415336923612812076324957808362120763249579874371207632496404229112076324964112859
166164void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd]0032892115392115841943042560020243481600x7fc0aab917000x7fbf7ac379c0524288337737543217198812076324964139058120763249643173301207632496736243712076324967593037
167165void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd]0033092115392115841943042560012243509120x7fc0aab916000x7fbf7ac37a00524288226204228955144412076324967625167120763249678086761207632496934770912076324969417327
168166void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd]00332921153921158419430425600122400x7fc0aab915000x7fbf7ac37a40524288256767932858602812076324969444798120763249696264281207632497415328912076324974220834