doc improvements for 1.0.0 part 2 (#330)

* update installation steps

* GitHub Issue #50: Adding READMEs for samples

* Making name change to ROCprofiler-SDK for consistency

* Fix HIP trace documentation

* Fix HSA trace in docs

* Fix kernel trace in docs

* Fixing memory copy and memory allocation traces

* runtime trace and sys trace doc update

* Fix scratch memory doc

* kernel naming and filtering options

* Adding collection period in docs

* Perfetto configs update

* summary output file

* kernel trace format fix

* update CHANGELOG

* Agent index doc update

* rocm-smi output

* group by queue option

* Updated --group-by-queue description

* perfetto visualization

---------

Co-authored-by: Ian Trowbridge <Ian.Trowbridge@amd.com>
Αυτή η υποβολή περιλαμβάνεται σε:
Bhardwaj, Gopesh
2025-04-16 02:00:07 +05:30
υποβλήθηκε από GitHub
γονέας 4fbcfd142c
υποβολή ca7cce9e81
32 αρχεία άλλαξαν με 744 προσθήκες και 106 διαγραφές
@@ -1,9 +1,10 @@
"Kind","Agent_Id","Queue_Id","Stream_Id","Thread_Id","Dispatch_Id","Kernel_Id","Kernel_Name","Correlation_Id","Start_Timestamp","End_Timestamp","Private_Segment_Size","Group_Segment_Size","Workgroup_Size_X","Workgroup_Size_Y","Workgroup_Size_Z","Grid_Size_X","Grid_Size_Y","Grid_Size_Z"
"KERNEL_DISPATCH",2,1,1,21228,1,11,"void addition_kernel<float>(float*, float const*, float const*, int, int)",1937,2414192765353337,2414192765369494,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH",2,1,1,21228,2,14,"subtract_kernel(float*, float const*, float const*, int, int)",1945,2414192765424862,2414192765435326,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH",2,1,1,21228,3,13,"multiply_kernel(float*, float const*, float const*, int, int)",1953,2414192765487486,2414192765497669,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH",2,1,1,21228,4,12,"divide_kernel(float*, float const*, float const*, int, int)",1961,2414192765545619,2414192765555722,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH",2,2,2,21228,5,11,"void addition_kernel<float>(float*, float const*, float const*, int, int)",1969,2414192765608844,2414192765621674,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH",2,2,2,21228,6,14,"subtract_kernel(float*, float const*, float const*, int, int)",1977,2414192765658519,2414192765669424,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH",2,2,2,21228,7,13,"multiply_kernel(float*, float const*, float const*, int, int)",1985,2414192765715650,2414192765726795,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH",2,2,2,21228,8,12,"divide_kernel(float*, float const*, float const*, int, int)",1993,2414192765773422,2414192765784969,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH","Agent 4",3,4,77,9,12,"void addition_kernel<float>(float*, float const*, float const*, int, int)",9,1057678125307992,1057678125319352,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH","Agent 4",2,3,77,8,11,"divide_kernel(float*, float const*, float const*, int, int)",8,1057678125310912,1057678125319952,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH","Agent 4",2,3,77,7,13,"multiply_kernel(float*, float const*, float const*, int, int)",7,1057678125298952,1057678125310912,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH","Agent 4",2,3,77,6,14,"subtract_kernel(float*, float const*, float const*, int, int)",6,1057678125288912,1057678125298952,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH","Agent 4",2,3,77,5,12,"void addition_kernel<float>(float*, float const*, float const*, int, int)",5,1057678125279112,1057678125288912,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH","Agent 4",3,4,77,10,14,"subtract_kernel(float*, float const*, float const*, int, int)",10,1057678125319352,1057678125328912,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH","Agent 4",3,4,77,12,11,"divide_kernel(float*, float const*, float const*, int, int)",12,1057678125356832,1057678125366712,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH","Agent 4",3,4,77,11,13,"multiply_kernel(float*, float const*, float const*, int, int)",11,1057678125344352,1057678125356832,0,0,64,1,1,1024,1024,1
"KERNEL_DISPATCH","Agent 4",4,5,77,13,12,"void addition_kernel<float>(float*, float const*, float const*, int, int)",13,1057678125382792,1057678125394032,0,0,64,1,1,1024,1024,1
1 Kind Agent_Id Queue_Id Stream_Id Thread_Id Dispatch_Id Kernel_Id Kernel_Name Correlation_Id Start_Timestamp End_Timestamp Private_Segment_Size Group_Segment_Size Workgroup_Size_X Workgroup_Size_Y Workgroup_Size_Z Grid_Size_X Grid_Size_Y Grid_Size_Z
2 KERNEL_DISPATCH 2 Agent 4 1 3 1 4 21228 77 1 9 11 12 void addition_kernel<float>(float*, float const*, float const*, int, int) 1937 9 2414192765353337 1057678125307992 2414192765369494 1057678125319352 0 0 64 1 1 1024 1024 1
3 KERNEL_DISPATCH 2 Agent 4 1 2 1 3 21228 77 2 8 14 11 subtract_kernel(float*, float const*, float const*, int, int) divide_kernel(float*, float const*, float const*, int, int) 1945 8 2414192765424862 1057678125310912 2414192765435326 1057678125319952 0 0 64 1 1 1024 1024 1
4 KERNEL_DISPATCH 2 Agent 4 1 2 1 3 21228 77 3 7 13 multiply_kernel(float*, float const*, float const*, int, int) 1953 7 2414192765487486 1057678125298952 2414192765497669 1057678125310912 0 0 64 1 1 1024 1024 1
5 KERNEL_DISPATCH 2 Agent 4 1 2 1 3 21228 77 4 6 12 14 divide_kernel(float*, float const*, float const*, int, int) subtract_kernel(float*, float const*, float const*, int, int) 1961 6 2414192765545619 1057678125288912 2414192765555722 1057678125298952 0 0 64 1 1 1024 1024 1
6 KERNEL_DISPATCH 2 Agent 4 2 2 3 21228 77 5 11 12 void addition_kernel<float>(float*, float const*, float const*, int, int) 1969 5 2414192765608844 1057678125279112 2414192765621674 1057678125288912 0 0 64 1 1 1024 1024 1
7 KERNEL_DISPATCH 2 Agent 4 2 3 2 4 21228 77 6 10 14 subtract_kernel(float*, float const*, float const*, int, int) 1977 10 2414192765658519 1057678125319352 2414192765669424 1057678125328912 0 0 64 1 1 1024 1024 1
8 KERNEL_DISPATCH 2 Agent 4 2 3 2 4 21228 77 7 12 13 11 multiply_kernel(float*, float const*, float const*, int, int) divide_kernel(float*, float const*, float const*, int, int) 1985 12 2414192765715650 1057678125356832 2414192765726795 1057678125366712 0 0 64 1 1 1024 1024 1
9 KERNEL_DISPATCH 2 Agent 4 2 3 2 4 21228 77 8 11 12 13 divide_kernel(float*, float const*, float const*, int, int) multiply_kernel(float*, float const*, float const*, int, int) 1993 11 2414192765773422 1057678125344352 2414192765784969 1057678125356832 0 0 64 1 1 1024 1024 1
10 KERNEL_DISPATCH Agent 4 4 5 77 13 12 void addition_kernel<float>(float*, float const*, float const*, int, int) 13 1057678125382792 1057678125394032 0 0 64 1 1 1024 1024 1