Files
rocm-systems/tests/workloads/dev0/mi200/prev_analysis/2001.csv
T
colramos-amd 62d130b458 Initial commit
2022-11-04 14:49:36 -05:00

14 KiB

1IndexKernelNamegpu-id
20__amd_rocclr_fillBufferAligned.kd0
31void benchmark_func<short, 256, 8u, 0u>(short, short*) [clone .kd]0
42void benchmark_func<float, 256, 8u, 0u>(float, float*) [clone .kd]0
53void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 0u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
64void benchmark_func<double, 256, 8u, 0u>(double, double*) [clone .kd]0
75void benchmark_func<__half2, 256, 8u, 0u>(__half2, __half2*) [clone .kd]0
86void benchmark_func<int, 256, 8u, 0u>(int, int*) [clone .kd]0
97void benchmark_func<float, 256, 8u, 1u>(float, float*) [clone .kd]0
108void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 1u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
119void benchmark_func<double, 256, 8u, 1u>(double, double*) [clone .kd]0
1210void benchmark_func<__half2, 256, 8u, 1u>(__half2, __half2*) [clone .kd]0
1311void benchmark_func<int, 256, 8u, 1u>(int, int*) [clone .kd]0
1412void benchmark_func<float, 256, 8u, 2u>(float, float*) [clone .kd]0
1513void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 2u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
1614void benchmark_func<double, 256, 8u, 2u>(double, double*) [clone .kd]0
1715void benchmark_func<__half2, 256, 8u, 2u>(__half2, __half2*) [clone .kd]0
1816void benchmark_func<int, 256, 8u, 2u>(int, int*) [clone .kd]0
1917void benchmark_func<float, 256, 8u, 3u>(float, float*) [clone .kd]0
2018void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 3u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
2119void benchmark_func<double, 256, 8u, 3u>(double, double*) [clone .kd]0
2220void benchmark_func<__half2, 256, 8u, 3u>(__half2, __half2*) [clone .kd]0
2321void benchmark_func<int, 256, 8u, 3u>(int, int*) [clone .kd]0
2422void benchmark_func<float, 256, 8u, 4u>(float, float*) [clone .kd]0
2523void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 4u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
2624void benchmark_func<double, 256, 8u, 4u>(double, double*) [clone .kd]0
2725void benchmark_func<__half2, 256, 8u, 4u>(__half2, __half2*) [clone .kd]0
2826void benchmark_func<int, 256, 8u, 4u>(int, int*) [clone .kd]0
2927void benchmark_func<float, 256, 8u, 5u>(float, float*) [clone .kd]0
3028void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 5u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
3129void benchmark_func<double, 256, 8u, 5u>(double, double*) [clone .kd]0
3230void benchmark_func<__half2, 256, 8u, 5u>(__half2, __half2*) [clone .kd]0
3331void benchmark_func<int, 256, 8u, 5u>(int, int*) [clone .kd]0
3432void benchmark_func<float, 256, 8u, 6u>(float, float*) [clone .kd]0
3533void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 6u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
3634void benchmark_func<double, 256, 8u, 6u>(double, double*) [clone .kd]0
3735void benchmark_func<__half2, 256, 8u, 6u>(__half2, __half2*) [clone .kd]0
3836void benchmark_func<int, 256, 8u, 6u>(int, int*) [clone .kd]0
3937void benchmark_func<float, 256, 8u, 7u>(float, float*) [clone .kd]0
4038void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 7u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
4139void benchmark_func<double, 256, 8u, 7u>(double, double*) [clone .kd]0
4240void benchmark_func<__half2, 256, 8u, 7u>(__half2, __half2*) [clone .kd]0
4341void benchmark_func<int, 256, 8u, 7u>(int, int*) [clone .kd]0
4442void benchmark_func<float, 256, 8u, 8u>(float, float*) [clone .kd]0
4543void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 8u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
4644void benchmark_func<double, 256, 8u, 8u>(double, double*) [clone .kd]0
4745void benchmark_func<__half2, 256, 8u, 8u>(__half2, __half2*) [clone .kd]0
4846void benchmark_func<int, 256, 8u, 8u>(int, int*) [clone .kd]0
4947void benchmark_func<float, 256, 8u, 9u>(float, float*) [clone .kd]0
5048void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 9u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
5149void benchmark_func<double, 256, 8u, 9u>(double, double*) [clone .kd]0
5250void benchmark_func<__half2, 256, 8u, 9u>(__half2, __half2*) [clone .kd]0
5351void benchmark_func<int, 256, 8u, 9u>(int, int*) [clone .kd]0
5452void benchmark_func<float, 256, 8u, 10u>(float, float*) [clone .kd]0
5553void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 10u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
5654void benchmark_func<double, 256, 8u, 10u>(double, double*) [clone .kd]0
5755void benchmark_func<__half2, 256, 8u, 10u>(__half2, __half2*) [clone .kd]0
5856void benchmark_func<int, 256, 8u, 10u>(int, int*) [clone .kd]0
5957void benchmark_func<float, 256, 8u, 11u>(float, float*) [clone .kd]0
6058void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 11u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
6159void benchmark_func<double, 256, 8u, 11u>(double, double*) [clone .kd]0
6260void benchmark_func<__half2, 256, 8u, 11u>(__half2, __half2*) [clone .kd]0
6361void benchmark_func<int, 256, 8u, 11u>(int, int*) [clone .kd]0
6462void benchmark_func<float, 256, 8u, 12u>(float, float*) [clone .kd]0
6563void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 12u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
6664void benchmark_func<double, 256, 8u, 12u>(double, double*) [clone .kd]0
6765void benchmark_func<__half2, 256, 8u, 12u>(__half2, __half2*) [clone .kd]0
6866void benchmark_func<int, 256, 8u, 12u>(int, int*) [clone .kd]0
6967void benchmark_func<float, 256, 8u, 13u>(float, float*) [clone .kd]0
7068void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 13u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
7169void benchmark_func<double, 256, 8u, 13u>(double, double*) [clone .kd]0
7270void benchmark_func<__half2, 256, 8u, 13u>(__half2, __half2*) [clone .kd]0
7371void benchmark_func<int, 256, 8u, 13u>(int, int*) [clone .kd]0
7472void benchmark_func<float, 256, 8u, 14u>(float, float*) [clone .kd]0
7573void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 14u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
7674void benchmark_func<double, 256, 8u, 14u>(double, double*) [clone .kd]0
7775void benchmark_func<__half2, 256, 8u, 14u>(__half2, __half2*) [clone .kd]0
7876void benchmark_func<int, 256, 8u, 14u>(int, int*) [clone .kd]0
7977void benchmark_func<float, 256, 8u, 15u>(float, float*) [clone .kd]0
8078void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 15u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
8179void benchmark_func<double, 256, 8u, 15u>(double, double*) [clone .kd]0
8280void benchmark_func<__half2, 256, 8u, 15u>(__half2, __half2*) [clone .kd]0
8381void benchmark_func<int, 256, 8u, 15u>(int, int*) [clone .kd]0
8482void benchmark_func<float, 256, 8u, 16u>(float, float*) [clone .kd]0
8583void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 16u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
8684void benchmark_func<double, 256, 8u, 16u>(double, double*) [clone .kd]0
8785void benchmark_func<__half2, 256, 8u, 16u>(__half2, __half2*) [clone .kd]0
8886void benchmark_func<int, 256, 8u, 16u>(int, int*) [clone .kd]0
8987void benchmark_func<float, 256, 8u, 17u>(float, float*) [clone .kd]0
9088void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 17u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
9189void benchmark_func<double, 256, 8u, 17u>(double, double*) [clone .kd]0
9290void benchmark_func<__half2, 256, 8u, 17u>(__half2, __half2*) [clone .kd]0
9391void benchmark_func<int, 256, 8u, 17u>(int, int*) [clone .kd]0
9492void benchmark_func<float, 256, 8u, 18u>(float, float*) [clone .kd]0
9593void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 18u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
9694void benchmark_func<double, 256, 8u, 18u>(double, double*) [clone .kd]0
9795void benchmark_func<__half2, 256, 8u, 18u>(__half2, __half2*) [clone .kd]0
9896void benchmark_func<int, 256, 8u, 18u>(int, int*) [clone .kd]0
9997void benchmark_func<float, 256, 8u, 20u>(float, float*) [clone .kd]0
10098void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 20u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
10199void benchmark_func<double, 256, 8u, 20u>(double, double*) [clone .kd]0
102100void benchmark_func<__half2, 256, 8u, 20u>(__half2, __half2*) [clone .kd]0
103101void benchmark_func<int, 256, 8u, 20u>(int, int*) [clone .kd]0
104102void benchmark_func<float, 256, 8u, 22u>(float, float*) [clone .kd]0
105103void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 22u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
106104void benchmark_func<double, 256, 8u, 22u>(double, double*) [clone .kd]0
107105void benchmark_func<__half2, 256, 8u, 22u>(__half2, __half2*) [clone .kd]0
108106void benchmark_func<int, 256, 8u, 22u>(int, int*) [clone .kd]0
109107void benchmark_func<float, 256, 8u, 24u>(float, float*) [clone .kd]0
110108void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 24u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
111109void benchmark_func<double, 256, 8u, 24u>(double, double*) [clone .kd]0
112110void benchmark_func<__half2, 256, 8u, 24u>(__half2, __half2*) [clone .kd]0
113111void benchmark_func<int, 256, 8u, 24u>(int, int*) [clone .kd]0
114112void benchmark_func<float, 256, 8u, 28u>(float, float*) [clone .kd]0
115113void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 28u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
116114void benchmark_func<double, 256, 8u, 28u>(double, double*) [clone .kd]0
117115void benchmark_func<__half2, 256, 8u, 28u>(__half2, __half2*) [clone .kd]0
118116void benchmark_func<int, 256, 8u, 28u>(int, int*) [clone .kd]0
119117void benchmark_func<float, 256, 8u, 32u>(float, float*) [clone .kd]0
120118void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 32u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
121119void benchmark_func<double, 256, 8u, 32u>(double, double*) [clone .kd]0
122120void benchmark_func<__half2, 256, 8u, 32u>(__half2, __half2*) [clone .kd]0
123121void benchmark_func<int, 256, 8u, 32u>(int, int*) [clone .kd]0
124122void benchmark_func<float, 256, 8u, 40u>(float, float*) [clone .kd]0
125123void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 40u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
126124void benchmark_func<double, 256, 8u, 40u>(double, double*) [clone .kd]0
127125void benchmark_func<__half2, 256, 8u, 40u>(__half2, __half2*) [clone .kd]0
128126void benchmark_func<int, 256, 8u, 40u>(int, int*) [clone .kd]0
129127void benchmark_func<float, 256, 8u, 48u>(float, float*) [clone .kd]0
130128void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 48u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
131129void benchmark_func<double, 256, 8u, 48u>(double, double*) [clone .kd]0
132130void benchmark_func<__half2, 256, 8u, 48u>(__half2, __half2*) [clone .kd]0
133131void benchmark_func<int, 256, 8u, 48u>(int, int*) [clone .kd]0
134132void benchmark_func<float, 256, 8u, 56u>(float, float*) [clone .kd]0
135133void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 56u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
136134void benchmark_func<double, 256, 8u, 56u>(double, double*) [clone .kd]0
137135void benchmark_func<__half2, 256, 8u, 56u>(__half2, __half2*) [clone .kd]0
138136void benchmark_func<int, 256, 8u, 56u>(int, int*) [clone .kd]0
139137void benchmark_func<float, 256, 8u, 64u>(float, float*) [clone .kd]0
140138void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 64u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
141139void benchmark_func<double, 256, 8u, 64u>(double, double*) [clone .kd]0
142140void benchmark_func<__half2, 256, 8u, 64u>(__half2, __half2*) [clone .kd]0
143141void benchmark_func<int, 256, 8u, 64u>(int, int*) [clone .kd]0
144142void benchmark_func<float, 256, 8u, 80u>(float, float*) [clone .kd]0
145143void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 80u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
146144void benchmark_func<double, 256, 8u, 80u>(double, double*) [clone .kd]0
147145void benchmark_func<__half2, 256, 8u, 80u>(__half2, __half2*) [clone .kd]0
148146void benchmark_func<int, 256, 8u, 80u>(int, int*) [clone .kd]0
149147void benchmark_func<float, 256, 8u, 96u>(float, float*) [clone .kd]0
150148void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 96u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
151149void benchmark_func<double, 256, 8u, 96u>(double, double*) [clone .kd]0
152150void benchmark_func<__half2, 256, 8u, 96u>(__half2, __half2*) [clone .kd]0
153151void benchmark_func<int, 256, 8u, 96u>(int, int*) [clone .kd]0
154152void benchmark_func<float, 256, 8u, 128u>(float, float*) [clone .kd]0
155153void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 128u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
156154void benchmark_func<double, 256, 8u, 128u>(double, double*) [clone .kd]0
157155void benchmark_func<__half2, 256, 8u, 128u>(__half2, __half2*) [clone .kd]0
158156void benchmark_func<int, 256, 8u, 128u>(int, int*) [clone .kd]0
159157void benchmark_func<float, 256, 8u, 256u>(float, float*) [clone .kd]0
160158void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 256u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
161159void benchmark_func<double, 256, 8u, 256u>(double, double*) [clone .kd]0
162160void benchmark_func<__half2, 256, 8u, 256u>(__half2, __half2*) [clone .kd]0
163161void benchmark_func<int, 256, 8u, 256u>(int, int*) [clone .kd]0
164162void benchmark_func<float, 256, 8u, 512u>(float, float*) [clone .kd]0
165163void benchmark_func<HIP_vector_type<float, 2u>, 256, 8u, 512u>(HIP_vector_type<float, 2u>, HIP_vector_type<float, 2u>*) [clone .kd]0
166164void benchmark_func<double, 256, 8u, 512u>(double, double*) [clone .kd]0
167165void benchmark_func<__half2, 256, 8u, 512u>(__half2, __half2*) [clone .kd]0
168166void benchmark_func<int, 256, 8u, 512u>(int, int*) [clone .kd]0