[rocpd] Adding summary module to generate summaries from rocpd database + query submodule + rocpd command-line tools (#488)

* adding summary.py to generate tmp <category_region>_summary views * migrating CSV summary to SDK method of writing CSVs - Add domain_view to summary.py - omit the C++ code of writing CSV because it gets revered later anyway * Add summary subparser and write_sql_view_to_csv function * adding all <>_summary views generation to summary.py * add summary_per_rank feature * add --summary-per-rank * reconstruct generate_summary_view and create_domain_view -introduce by_rank * remove sqr and variance in summary views * use RocpdImportData instead of connection * two fixes on summary.py --modify the generate_summary_view function to return a tuple with view name and sql code add if_not_exits parameter to generete_summary_view * Refactor summary.py to allow output path and filename args, and apply time_window - clean up summary table column headers - only generate by-rank views if that param is specified * Add ProcessID to Hostname output and csv, so users can identify the system in the by-rank summaries * Summary.py, just add hostname to by-rank summaries, instead of creating mapping table * Summary - migrate csv writer to pandas, for more future flexibility * Adding a few simple tests for summary.py * Linting fixes * add region_categories to summary options - Automatically retrieve region categories from the database if argument is None * add backticks for view_names * fix tests after rebase * Made code review changes - fixed whitespace in CMakelists.txt - adding query.py module & subparser in __main__.py - refactor summary function to return query - used query.py to output csv - used query.py to also output summary to console - provided new command line options to select summary output to csv or console * Made fix to jinja template in query.py, as suggested by copilot * Consolidated output calls to query in export_view function based on feedback - refactored: helpers, query functions, create view functions - extended formats to include what query supports (md, html, pdf, json) - added json format to query, and changed orient=records - adding jinja2 and reportlab to requirements.txt * Add version_info for rocpd and roctx * Add rocpd commandline tool * Add executable permissions to source/bin/rocpd.py * Removed rocpd2query, and cleaned up --help examples --------- Co-authored-by: acanadas <acanadas@amd.com> Co-authored-by: Jin Tao <jintao12@amd.com> Co-authored-by: a-canadasruiz <Araceli.CanadasRuiz@amd.com> Co-authored-by: Jonathan R. Madsen <Jonathan.Madsen@amd.com> [ROCm/rocprofiler-sdk commit: 3954cedd25]
2025-07-24 17:12:06 -04:00
parent 35d491159f
commit 68ae6cf65f
13 changed files with 1480 additions and 277 deletions
@@ -5,6 +5,7 @@ cmake>=3.21.0
 cmake-format
 dataclasses
 flake8
+jinja2
 numpy
 otf2
 pandas
@@ -12,3 +13,4 @@ perfetto
 pycobertura
 pytest
 pyyaml
+reportlab
@@ -25,3 +25,39 @@ install(
    PERMISSIONS OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_READ GROUP_EXECUTE WORLD_READ
                WORLD_EXECUTE
    COMPONENT tools)
+
+# for each entry here there must be a ROCPD_BIN_<entry> list
+set(ROCPD_EXECUTABLES "all" "csv" "otf2" "pftrace" "summary")
+
+# format is list: [<exe-name>, <python-module>, <extra-args-to-python-module>]
+set(ROCPD_BIN_all "rocpd" "rocpd" "")
+set(ROCPD_BIN_csv "rocpd2csv" "rocpd.csv" "")
+set(ROCPD_BIN_otf2 "rocpd2otf2" "rocpd.otf2" "")
+set(ROCPD_BIN_pftrace "rocpd2pftrace" "rocpd.pftrace" "")
+set(ROCPD_BIN_summary "rocpd2summary" "rocpd.summary" "")
+
+foreach(_EXE IN LISTS ROCPD_EXECUTABLES)
+    list(GET ROCPD_BIN_${_EXE} 0 ROCPD_EXE_NAME)
+    list(GET ROCPD_BIN_${_EXE} 1 ROCPD_EXE_MODULE)
+    list(GET ROCPD_BIN_${_EXE} 2 ROCPD_EXE_MODULE_ARGS)
+
+    if(NOT ROCPD_EXE_NAME
+       OR NOT ROCPD_EXE_MODULE
+       OR (NOT ROCPD_EXE_MODULE_ARGS AND NOT ROCPD_EXE_MODULE_ARGS STREQUAL ""))
+        message(
+            FATAL_ERROR "ROCPD_BIN_${_EXE} not properly defined: ${ROCPD_BIN_${_EXE}}")
+    endif()
+
+    set(ROCPD_EXE_OUTPUT_FILE
+        ${PROJECT_BINARY_DIR}/${CMAKE_INSTALL_BINDIR}/${ROCPD_EXE_NAME})
+
+    # Adding main rocpd
+    configure_file(rocpd.py ${ROCPD_EXE_OUTPUT_FILE} @ONLY)
+
+    install(
+        FILES ${ROCPD_EXE_OUTPUT_FILE}
+        DESTINATION ${CMAKE_INSTALL_BINDIR}
+        PERMISSIONS OWNER_READ OWNER_WRITE OWNER_EXECUTE GROUP_READ GROUP_EXECUTE
+                    WORLD_READ WORLD_EXECUTE
+        COMPONENT rocpd)
+endforeach()
@@ -0,0 +1,74 @@
+#!/usr/bin/env python3
+
+# MIT License
+#
+# Copyright (c) 2024-2025 Advanced Micro Devices, Inc. All rights reserved.
+#
+# Permission is hereby granted, free of charge, to any person obtaining a copy
+# of this software and associated documentation files (the "Software"), to deal
+# in the Software without restriction, including without limitation the rights
+# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+# copies of the Software, and to permit persons to whom the Software is
+# furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice shall be included in
+# all copies or substantial portions of the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL THE
+# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
+# THE SOFTWARE.
+
+import os
+import sys
+
+"""
+Simple Python executable script for invoking `python3 -m @ROCPD_EXE_MODULE@`
+"""
+
+
+def main(argv=sys.argv[1:], environ=dict(os.environ)):
+    """
+    Executes {sys.executable} -m @ROCPD_EXE_MODULE@ @ROCPD_EXE_MODULE_ARGS@
+    """
+
+    ROCPD_SUPPORTED_PYTHON_VERSIONS = [
+        ".".join(itr.split(".")[:2]) for itr in "@ROCPROFILER_PYTHON_VERSIONS@".split(";")
+    ]
+    ROCPD_MODULE_ARGS = [f"{itr}" for itr in "@ROCPD_EXE_MODULE_ARGS@".split(" ") if itr]
+
+    this_dir = os.path.dirname(os.path.realpath(__file__))
+    this_python_ver = f"{sys.version_info.major}.{sys.version_info.minor}"
+    if this_python_ver not in ROCPD_SUPPORTED_PYTHON_VERSIONS:
+        raise ImportError(
+            "@ROCPD_EXE_NAME@ not supported for Python version {} (sys.executable='{}').\n@ROCPD_EXE_NAME@ supported python versions: {}".format(
+                this_python_ver,
+                sys.executable,
+                ", ".join(ROCPD_SUPPORTED_PYTHON_VERSIONS),
+            )
+        )
+
+    module_path = os.path.join(
+        this_dir,
+        "..",
+        "@CMAKE_INSTALL_LIBDIR@",
+        f"python{this_python_ver}",
+        "site-packages",
+    )
+
+    python_path = [module_path] + os.environ.get("PYTHONPATH", "").split(":")
+
+    # update PYTHONPATH environment variable
+    environ["PYTHONPATH"] = ":".join(python_path)
+
+    args = [f"{sys.executable}", "-m", "@ROCPD_EXE_MODULE@"] + ROCPD_MODULE_ARGS + argv
+
+    # does not return
+    os.execvpe(args[0], args, env=environ)
+
+
+if __name__ == "__main__":
+    main()
@@ -46,8 +46,24 @@ __all__ = [
    "write_csv",
    "write_otf2",
    "RocpdImportData",
+    "version_info",
 ]

+version_info = {
+    "version": "@PROJECT_VERSION@",
+    "major": int("@PROJECT_VERSION_MAJOR@"),
+    "minor": int("@PROJECT_VERSION_MINOR@"),
+    "patch": int("@PROJECT_VERSION_PATCH@"),
+    "git_revision": "@ROCPROFILER_SDK_GIT_REVISION@",
+    "library_arch": "@CMAKE_LIBRARY_ARCHITECTURE@",
+    "system_name": "@CMAKE_SYSTEM_NAME@",
+    "system_processor": "@CMAKE_SYSTEM_PROCESSOR@",
+    "system_version": "@CMAKE_SYSTEM_VERSION@",
+    "compiler_id": "@CMAKE_CXX_COMPILER_ID@",
+    "compiler_version": "@CMAKE_CXX_COMPILER_VERSION@",
+    "rocm_version": "@rocm_version_FULL_VERSION@",
+}
+

 def format_path(path, tag=os.path.basename(sys.executable)):
    return libpyrocpd.format_path(path, tag)
@@ -38,11 +38,14 @@ def main(argv=None, config=None):

    """
    import argparse
-    from . import time_window
-    from . import output_config
-    from . import pftrace
    from . import csv
    from . import otf2
+    from . import output_config
+    from . import pftrace
+    from . import query
+    from . import summary
+    from . import time_window
+    from . import version_info
    from .importer import RocpdImportData

    convert_examples = """
@@ -50,25 +53,62 @@ def main(argv=None, config=None):
 Example usage:

    Convert 1 database, output perfetto trace
-    $ python3 -m rocpd convert -i db1.db --output-format pftrace
+    $ rocpd convert -i db1.db --output-format pftrace

    Convert 2 databases, output perfetto trace to path and filename, reduce time window to omit the first 30%
-    $ python3 -m rocpd convert -i db1.db db2.db --output-format pftrace -d "./output/" -o "twoFileTraces" --start 30% --end 100%
+    $ rocpd convert -i db1.db db2.db --output-format pftrace -d "./output/" -o "twoFileTraces" --start 30% --end 100%

    Convert 6 databases, output CSV and perfetto trace formats
-    $ python3 -m rocpd convert -i db{0..5}.db --output-format csv pftrace -d "~/output_folder/" -o "sixFileTraces"
+    $ rocpd convert -i db{0..5}.db --output-format csv pftrace -d "~/output_folder/" -o "sixFileTraces"

    Convert 2 databases, output CSV, OTF2, and perfetto trace formats
-    $ python3 -m rocpd convert -i db{3,4}.db --output-format csv otf2 pftrace
+    $ rocpd convert -i db{3,4}.db --output-format csv otf2 pftrace

 """

+    query_examples = """
+
+Example usage:
+
+    Query the first 5 rows of the 'rocpd_info_agents' view and output to console
+    $ rocpd query -i db0.db --query "SELECT * FROM rocpd_info_agents LIMIT 5"
+
+    Combine 4 databases and query the first 10 rows of the 'top_kernels' view and output to CSV file
+    $ rocpd query -i db{0..3}.db --query "SELECT * FROM top_kernels LIMIT 10" --format csv
+"""
+
+    summary_examples = """
+
+Example usage:
+
+    Output all summaries to console and include domain summary for 1 database
+    $ rocpd summary -i db1.db --domain-summary
+
+    Aggregate 3 databases and output all summary files and include summary by rank/process ID, to csv file output
+    $ rocpd summary -i db{1..3}.db --summary-by-rank --format csv
+
+    Output all summaries to console and exlude all regions to save processing time
+    $ rocpd summary -i db0.db --region-categories NONE
+
+    Aggregate 2 databases and output all summary files to HTML, only include HIP and MARKER regions, include domain summary
+    $ rocpd summary -i db{0,1}.db --region-categories HIP MARKERS --domain-summary --format html
+
+"""
+
+    # Add the subparsers
    parser = argparse.ArgumentParser(
        prog="rocpd",
        description="Aggregate and/or analyze ROCm Profiling Data (rocpd)",
        allow_abbrev=False,
    )

+    parser.add_argument(
+        "-v",
+        "--version",
+        action="store_true",
+        help="Print the version information and exit",
+    )
+
    subparsers = parser.add_subparsers(dest="command")
    converter = subparsers.add_parser(
        "convert",
@@ -78,20 +118,36 @@ Example usage:
        epilog=convert_examples,
    )

+    query_reporter = subparsers.add_parser(
+        "query",
+        description="Generate output on a query",
+        allow_abbrev=False,
+        formatter_class=argparse.RawTextHelpFormatter,
+        epilog=query_examples,
+    )
+
+    generate_summary = subparsers.add_parser(
+        "summary",
+        description="Generate summary views from rocPD data",
+        allow_abbrev=False,
+        formatter_class=argparse.RawTextHelpFormatter,
+        epilog=summary_examples,
+    )
+
    def get_output_type(val):
        return val.lower().replace("perfetto", "pftrace")

-    required_params = converter.add_argument_group("Required arguments")
-
-    required_params.add_argument(
+    # add required options for each subparser
+    converter_required_params = converter.add_argument_group("Required options")
+    converter_required_params.add_argument(
        "-i",
        "--input",
        required=True,
        type=output_config.check_file_exists,
        nargs="+",
-        help="Input path and filename to one or more database(s), separated by spaces",
+        help="Input path and filename to one or more database(s)",
    )
-    required_params.add_argument(
+    converter_required_params.add_argument(
        "-f",
        "--output-format",
        help="For adding output format (supported formats: csv, pftrace, otf2)",
@@ -102,7 +158,27 @@ Example usage:
        required=True,
    )

-    # add args from any sub-modules
+    query_required_params = query_reporter.add_argument_group("Required options")
+    query_required_params.add_argument(
+        "-i",
+        "--input",
+        required=True,
+        type=output_config.check_file_exists,
+        nargs="+",
+        help="Input path and filename to one or more database(s)",
+    )
+
+    summary_required_params = generate_summary.add_argument_group("Required options")
+    summary_required_params.add_argument(
+        "-i",
+        "--input",
+        required=True,
+        type=output_config.check_file_exists,
+        nargs="+",
+        help="Input path and filename to one or more database(s)",
+    )
+
+    # converter: add args from any sub-modules
    valid_out_config_args = output_config.add_args(converter)
    valid_generic_args = output_config.add_generic_args(converter)
    valid_pftrace_args = pftrace.add_args(converter)
@@ -110,51 +186,110 @@ Example usage:
    valid_otf2_args = otf2.add_args(converter)
    valid_time_window_args = time_window.add_args(converter)

+    # query: subparser args
+    valid_out_config_args = output_config.add_args(query_reporter)
+    valid_query_args = query.add_args(query_reporter)
+    valid_time_window_args = time_window.add_args(query_reporter)
+
+    # summary: subparser args
+    valid_io_args = summary.add_io_args(generate_summary)
+    valid_summary_args = summary.add_args(generate_summary)
+    valid_time_window_args = time_window.add_args(generate_summary)
+
    # parse the command line arguments
    args = parser.parse_args(argv)

-    # process the args
-    out_cfg_args = output_config.process_args(args, valid_out_config_args)
-    generic_out_cfg_args = output_config.process_generic_args(args, valid_generic_args)
-    pftrace_args = pftrace.process_args(args, valid_pftrace_args)
-    csv_args = csv.process_args(args, valid_csv_args)
-    otf2_args = otf2.process_args(args, valid_otf2_args)
-    window_args = time_window.process_args(args, valid_time_window_args)
+    if args.version:
+        for key, itr in version_info.items():
+            if key in ["major", "minor", "patch"]:
+                continue
+            print(f"    {key:>16}: {itr}")
+        return 0

-    # now start processing the data.  Import the data and merge the views
-    importData = RocpdImportData(args.input)
+    # error check the command line arguments, if no subparser command is given, print the help message
+    if args.command is None:
+        parser.print_help()
+        return

-    # adjust the time window view of the data
-    if window_args is not None:
-        time_window.apply_time_window(importData, **window_args)
+    # if the user requested converter, process the conversion
+    if args.command == "convert":
+        # process the args
+        out_cfg_args = output_config.process_args(args, valid_out_config_args)
+        generic_out_cfg_args = output_config.process_generic_args(
+            args, valid_generic_args
+        )
+        pftrace_args = pftrace.process_args(args, valid_pftrace_args)
+        csv_args = csv.process_args(args, valid_csv_args)
+        otf2_args = otf2.process_args(args, valid_otf2_args)
+        window_args = time_window.process_args(args, valid_time_window_args)

-    all_args = {
-        **out_cfg_args,
-        **generic_out_cfg_args,
-        **pftrace_args,
-        **csv_args,
-        **otf2_args,
-    }
-    # setup the config args
-    config = (
-        output_config.output_config(**all_args)
-        if config is None
-        else config.update(**all_args)
-    )
+        # now start processing the data.  Import the data and merge the views
+        importData = RocpdImportData(args.input)

-    # process each requested output format
-    format_handlers = {
-        "pftrace": pftrace.write_pftrace,
-        "csv": csv.write_csv,
-        "otf2": otf2.write_otf2,
-    }
+        # adjust the time window view of the data
+        if window_args is not None:
+            time_window.apply_time_window(importData, **window_args)

-    for out_format in args.output_format:
-        if out_format in format_handlers:
-            print(f"Converting database(s) to {out_format} format:")
-            format_handlers[out_format](importData, config)
-        else:
-            print(f"Warning: Unsupported output format '{out_format}'")
+        all_args = {
+            **out_cfg_args,
+            **generic_out_cfg_args,
+            **pftrace_args,
+            **csv_args,
+            **otf2_args,
+        }
+        # setup the config args
+        config = (
+            output_config.output_config(**all_args)
+            if config is None
+            else config.update(**all_args)
+        )
+
+        # process each requested output format
+        format_handlers = {
+            "pftrace": pftrace.write_pftrace,
+            "csv": csv.write_csv,
+            "otf2": otf2.write_otf2,
+        }
+
+        for out_format in args.output_format:
+            if out_format in format_handlers:
+                print(f"Converting database(s) to {out_format} format:")
+                format_handlers[out_format](importData, config)
+            else:
+                print(f"Warning: Unsupported output format '{out_format}'")
+
+    # if the user requested query module, execute the query
+    elif args.command == "query":
+        # query subparser args
+        query_args = query.process_args(args, valid_query_args)
+        out_cfg_args = output_config.process_args(args, valid_out_config_args)
+        window_args = time_window.process_args(args, valid_time_window_args)
+
+        all_args = {**query_args, **out_cfg_args}
+
+        query.execute(
+            args.input,
+            args,
+            window_args=window_args,
+            **all_args,
+        )
+
+    # if the user requested a summary, generate the views
+    elif args.command == "summary":
+        # summary subparser args
+        summary_args = summary.process_args(args, valid_summary_args)
+        io_args = output_config.process_args(args, valid_io_args)
+        window_args = time_window.process_args(args, valid_time_window_args)
+
+        # now start processing the data.  Import the data and merge the views
+        importData = RocpdImportData(args.input)
+
+        # adjust the time window view of the data
+        if window_args is not None:
+            time_window.apply_time_window(importData, **window_args)
+
+        all_args = {**summary_args, **io_args}
+        summary.generate_all_summaries(importData, **all_args)

    print("Done. Exiting...")

@@ -0,0 +1,560 @@
+#!/usr/bin/env python3
+###############################################################################
+# MIT License
+#
+# Copyright (c) 2025 Advanced Micro Devices, Inc.
+#
+# Permission is hereby granted, free of charge, to any person obtaining a copy
+# of this software and associated documentation files (the "Software"), to deal
+# in the Software without restriction, including without limitation the rights
+# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+# copies of the Software, and to permit persons to whom the Software is
+# furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice shall be included in
+# all copies or substantial portions of the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
+# THE SOFTWARE.
+###############################################################################
+
+import os
+import sys
+
+from typing import Union, Tuple, List, Optional
+from datetime import datetime
+
+from . import output_config
+from . import libpyrocpd
+from .importer import RocpdImportData
+from .time_window import apply_time_window
+
+
+def export_sqlite_query(
+    conn: RocpdImportData,
+    query: str,
+    params: Union[Tuple, List] = (),
+    export_format: Optional[str] = None,
+    export_path: Optional[str] = None,
+    dashboard_template_path: Optional[str] = None,
+) -> Optional[str]:
+    """
+    Execute a SQLite query and print it to console.
+    Then, if export_format is specified, write the results to a file.
+    Returns the path to the exported file (or None if nothing was exported).
+
+    Supported export_format values (case-insensitive):
+        - "csv"
+        - "html"
+        - "md"   (markdown)
+        - "pdf"
+        - "dashboard"   (templated HTML dashboard)
+        - "clipboard"
+
+    If export_format == "dashboard", you may optionally pass a
+    dashboard_template_path (a Jinja2 template file). If omitted,
+    a built-in default template is used.
+    """
+
+    try:
+        import pandas as pd
+
+        conn = conn.connection if isinstance(conn, RocpdImportData) else conn
+
+        # 1) Run the query via pandas
+        df = pd.read_sql_query(query, conn, params=params)
+
+        if df.empty:
+            sys.stderr.write(f"No results found for query: {query}\n")
+            sys.stderr.flush()
+            return None
+
+        if export_format == "console" or export_format is None:
+            # 2) Print to console
+            print(df.to_string(index=False))
+            return None
+
+        elif export_format == "clipboard":
+            df.to_clipboard(excel=False)
+            return None
+
+        export_format = export_format.lower()
+        ext = export_format
+        export_path = export_path or f"query_output.{ext}"
+        if not export_path.endswith(f".{ext}"):
+            export_path = f"{export_path}.{ext}"
+        export_path = os.path.abspath(libpyrocpd.format_path(export_path, "rocpd"))
+
+        os.makedirs(os.path.dirname(export_path), exist_ok=True)
+
+        def write_export(content):
+            with open(export_path, "w") as ofs:
+                ofs.write(f"{content}\n")
+                ofs.flush()
+
+        # 3) Export based on format
+        if export_format == "csv":
+            df.to_csv(export_path, index=False)
+
+        elif export_format == "html":
+            write_export(df.to_html(index=False))
+
+        elif export_format == "md":
+            # pandas 1.0+ has to_markdown
+            try:
+                write_export(df.to_markdown(index=False))
+            except AttributeError:
+                # fallback: manually write markdown table
+                _df_to_markdown_fallback(df, export_path)
+
+        elif export_format == "pdf":
+            _export_df_to_pdf(df, export_path)
+
+        elif export_format == "dashboard":
+            _export_dashboard(
+                df, export_path=export_path, template_path=dashboard_template_path
+            )
+
+        elif export_format == "json":
+            df.to_json(export_path, index=False, indent=2, orient="records")
+
+        else:
+            print(f"Unsupported export format: {export_format}")
+            return None
+
+        print(f"Exported to: {export_path}\n")
+        return export_path
+
+    except Exception as e:
+        print(f"Error: {e}")
+        return None
+
+
+def _df_to_markdown_fallback(df, path: str):
+    """
+    Simple fallback if pandas.DataFrame.to_markdown(...) is unavailable.
+    """
+    headers = list(df.columns)
+    with open(path, "w", encoding="utf-8") as f:
+        # Header row
+        f.write("| " + " | ".join(headers) + " |\n")
+        # Separator
+        f.write("|" + "|".join("---" for _ in headers) + "|\n")
+        # Data rows
+        for row in df.itertuples(index=False):
+            line = "| " + " | ".join(str(v) for v in row) + " |\n"
+            f.write(line)
+
+
+def _export_df_to_pdf(df, path: str):
+    """
+    Render a DataFrame into a monospaced text table inside a PDF.
+    """
+    from reportlab.lib.pagesizes import letter
+    from reportlab.pdfgen import canvas
+    from reportlab.lib.units import inch
+
+    c = canvas.Canvas(path, pagesize=letter)
+    width, height = letter
+    x = 0.5 * inch
+    y = height - 1 * inch
+    row_height = 14
+
+    c.setFont("Courier", 9)
+    headers = list(df.columns)
+    header_line = " | ".join(headers)
+    c.drawString(x, y, header_line)
+    y -= row_height
+    c.drawString(x, y, "-" * len(header_line))
+    y -= row_height
+
+    for _, row in df.iterrows():
+        row_line = " | ".join(str(v) for v in row)
+        # Clip at ~160 characters so it doesn’t overflow the page width
+        c.drawString(x, y, row_line[:160])
+        y -= row_height
+        if y < 1 * inch:
+            c.showPage()
+            c.setFont("Courier", 9)
+            y = height - 1 * inch
+
+    c.save()
+
+
+def _export_dashboard(df, export_path: str, template_path: Optional[str] = None):
+    """
+    Generate a templated HTML “dashboard” from df. If template_path is None,
+    use a built-in template. Otherwise, load the Jinja2 template from that path.
+    """
+    from jinja2 import Environment, FileSystemLoader, select_autoescape
+
+    # 1) Prepare Jinja2 environment
+    if template_path:
+        # User provided a .html (Jinja2) file
+        env = Environment(
+            loader=FileSystemLoader(os.path.dirname(template_path)),
+            autoescape=select_autoescape(["html", "xml"]),
+        )
+        template = env.get_template(os.path.basename(template_path))
+    else:
+        # Built-in default template
+        builtin_html = """
+        <!DOCTYPE html>
+        <html lang="en">
+        <head>
+            <meta charset="UTF-8" />
+            <title>Dashboard Report</title>
+            <style>
+                body { font-family: Arial, sans-serif; margin: 20px; }
+                h1 { color: #333; }
+                table { border-collapse: collapse; width: 100%; }
+                th, td { border: 1px solid #aaa; padding: 8px; text-align: left; }
+                th { background-color: #f0f0f0; }
+                tr:nth-child(even) { background-color: #fafafa; }
+            </style>
+        </head>
+        <body>
+            <h1>{{ title }}</h1>
+            <p><em>Generated on {{ timestamp }}</em></p>
+            <div>
+                {{ table_html | safe }}
+            </div>
+        </body>
+        </html>
+        """
+        env = Environment(autoescape=select_autoescape(["html", "xml"]))
+        template = env.from_string(builtin_html)
+
+    # 2) Render template with context
+    context = {
+        "title": "SQLite Query Dashboard",
+        "timestamp": datetime.now().strftime("%Y-%m-%d %H:%M:%S"),
+        "table_html": df.to_html(index=False, classes="dashboard-table"),
+    }
+    rendered = template.render(**context)
+
+    # 3) Write to export_path
+    with open(export_path, "w", encoding="utf-8") as f:
+        f.write(rendered)
+
+
+def zip_files(file_paths: List[str], zip_path: str) -> str:
+    """
+    Zip up one or more files into zip_path. Overwrites existing zip if present.
+    Returns the path to the created zip.
+    """
+    import zipfile
+
+    with zipfile.ZipFile(zip_path, "w", zipfile.ZIP_DEFLATED) as zf:
+        for fp in file_paths:
+            if os.path.isfile(fp):
+                zf.write(fp, arcname=os.path.basename(fp))
+            else:
+                raise FileNotFoundError(f"Cannot find file to zip: {fp}")
+    print(f"Created ZIP archive: {zip_path}")
+    return zip_path
+
+
+def send_report_email(
+    file_paths: List[str],
+    to: Union[str, List[str]],
+    sender: str,
+    subject: str = "rocpd query Report",
+    inline_preview: bool = False,
+    smtp_server: str = "localhost",
+    smtp_port: int = 25,
+    smtp_user: Optional[str] = None,
+    smtp_password: Optional[str] = None,
+    zip_attachments: bool = False,
+) -> None:
+    """
+    Send an email with one or more attachments, optionally zipped,
+    and optionally with an inline preview (if the primary attachment is HTML).
+
+    Args:
+        file_paths: List of file paths to attach (each must exist).
+        to: Recipient email address, or list of addresses.
+        sender: Sender email address.
+        subject: Subject line.
+        inline_preview: If True, and one of the attachments is HTML, use that
+                        HTML as the email body (and still attach files).
+        smtp_server / smtp_port / smtp_user / smtp_password: SMTP credentials.
+        zip_attachments: If True, bundle all file_paths into a single ZIP named
+                         "<timestamp>_attachments.zip" and attach that ZIP only.
+    """
+    import smtplib
+    from email.message import EmailMessage
+
+    # 1) Validate that files exist
+    for fp in file_paths:
+        if not os.path.isfile(fp):
+            raise FileNotFoundError(f"Attachment not found: {fp}")
+
+    # 2) If zip_attachments is True, zip everything into one archive
+    actual_attachments: List[str]
+    if zip_attachments:
+        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
+        zip_path = f"attachments_{timestamp}.zip"
+        zip_files(file_paths, zip_path)
+        actual_attachments = [zip_path]
+    else:
+        actual_attachments = file_paths.copy()
+
+    # 3) Build the EmailMessage
+    msg = EmailMessage()
+    msg["Subject"] = subject
+    msg["From"] = sender
+    msg["To"] = ", ".join(to) if isinstance(to, list) else to
+
+    # 4) If inline_preview is True, look for the first HTML attachment,
+    #    read its content, and set as an HTML alternative in the email body.
+    if inline_preview:
+        html_body_found = False
+        for fp in actual_attachments:
+            if fp.lower().endswith(".html"):
+                with open(fp, "r", encoding="utf-8") as f:
+                    html_content = f.read()
+                msg.set_content(
+                    "This email contains an inline HTML preview. If your mail client "
+                    "doesn’t display HTML, see the attachment."
+                )
+                msg.add_alternative(html_content, subtype="html")
+                html_body_found = True
+                break
+        if not html_body_found:
+            # No HTML attachment found; create a simple text body
+            msg.set_content("Please see attached report file(s).")
+
+    else:
+        # No inline preview desired; use a simple text body
+        msg.set_content("Please see attached report file(s).")
+
+    # 5) Attach each file (or the single ZIP)
+    for fp in actual_attachments:
+        with open(fp, "rb") as f:
+            data = f.read()
+        ctype = "application"
+        subtype = "octet-stream"
+        filename = os.path.basename(fp)
+        msg.add_attachment(data, maintype=ctype, subtype=subtype, filename=filename)
+
+    # 6) Connect to SMTP and send
+    with smtplib.SMTP(smtp_server, smtp_port) as server:
+        server.ehlo()
+        if smtp_user and smtp_password:
+            server.starttls()
+            server.login(smtp_user, smtp_password)
+        server.send_message(msg)
+
+    print(f"Email sent to {msg['To']} with subject '{subject}'")
+
+
+def add_args(parser):
+    """Add query arguments"""
+
+    query_options = parser.add_argument_group("Query Options")
+
+    # Common arguments
+    query_options.add_argument(
+        "--query", required=True, help="SQL SELECT query to execute (enclose in quotes)."
+    )
+
+    query_options.add_argument(
+        "--script",
+        required=False,
+        type=str,
+        help="Input SQL script which should be read before query (e.g. defines views)",
+    )
+
+    query_options.add_argument(
+        "--format",
+        help="Export format",
+        choices=("console", "csv", "html", "json", "md", "pdf", "dashboard", "clipboard"),
+        type=str.lower,
+    )
+
+    email_options = parser.add_argument_group("Query Email Options")
+
+    # Email options (optional)
+    email_options.add_argument(
+        "--email-to", help="Recipient email address (or comma-separated list)."
+    )
+    email_options.add_argument(
+        "--email-from", help="Sender email address (required if --email-to is used)."
+    )
+    email_options.add_argument(
+        "--email-subject",
+        default="SQLite Query Report",
+        help="Subject line for the email (default: %(default)s).",
+    )
+    email_options.add_argument(
+        "--smtp-server",
+        default="localhost",
+        help="SMTP server hostname (default: %(default)s).",
+    )
+    email_options.add_argument(
+        "--smtp-port",
+        type=int,
+        default=25,
+        help="SMTP server port (default: %(default)d).",
+    )
+    email_options.add_argument("--smtp-user", help="SMTP login username (if required).")
+    email_options.add_argument(
+        "--smtp-password", help="SMTP login password (if required)."
+    )
+    email_options.add_argument(
+        "--zip-attachments",
+        action="store_true",
+        help="Zip all attachments into a single .zip file before sending.",
+    )
+    email_options.add_argument(
+        "--inline-preview",
+        action="store_true",
+        help="Embed HTML report as inline body if an HTML attachment is present.",
+    )
+
+    dashboard_options = parser.add_argument_group("Query Dashboard Options")
+
+    dashboard_options.add_argument(
+        "--template-path", help="Path to a Jinja2 HTML template for the dashboard"
+    )
+
+    return [
+        "query",
+        "script",
+        "email_to",
+        "email_from",
+        "email_subject",
+        "smtp_server",
+        "smtp_port",
+        "smtp_user",
+        "smtp_password",
+        "inline_preview",
+        "zip_attachments",
+        "format",
+        "template_path",
+    ]
+
+
+def process_args(args, valid_args):
+    # do not add any of the arguments to the output config dict
+    ret = {}
+    return ret
+
+
+def execute(input, args, config=None, window_args=None, **kwargs):
+
+    importData = RocpdImportData(input)
+
+    apply_time_window(importData, **window_args)
+
+    config = (
+        output_config.output_config(**kwargs)
+        if config is None
+        else config.update(**kwargs)
+    )
+
+    if args.script:
+        # read script and execute statements
+        with open(args.script, "r") as ifs:
+            for itr in ifs.read().split(";"):
+                importData.execute(f"{itr}")
+
+    # Prepare parameters for export
+    query = args.query
+    db = importData
+    export_format = args.format
+    export_path = os.path.join(config.output_path, config.output_file)
+
+    # Dashboard-only extra
+    dashboard_template = kwargs.get("template_path", None)
+
+    # 1) Run and export
+    exported_file = export_sqlite_query(
+        db,
+        query=query,
+        params=(),
+        export_format=export_format,
+        export_path=export_path,
+        dashboard_template_path=dashboard_template,
+    )
+
+    # 2) If --email-to was provided and we have a file, send it
+    if args.email_to:
+        if not args.email_from:
+            raise ValueError("--email-from is required when --email-to is used.")
+        if not exported_file:
+            print("No file was exported; skipping email.")
+            return
+
+        recipients = [addr.strip() for addr in args.email_to.split(",")]
+        send_report_email(
+            file_paths=[exported_file],
+            to=recipients,
+            sender=args.email_from,
+            subject=args.email_subject,
+            inline_preview=args.inline_preview,
+            smtp_server=args.smtp_server,
+            smtp_port=args.smtp_port,
+            smtp_user=args.smtp_user,
+            smtp_password=args.smtp_password,
+            zip_attachments=args.zip_attachments,
+        )
+
+
+def main(argv=None):
+    import argparse
+    from .time_window import add_args as add_args_time_window
+    from .time_window import process_args as process_args_time_window
+    from .output_config import add_args as add_args_output_config
+    from .output_config import process_args as process_args_output_config
+    from .output_config import add_generic_args, process_generic_args
+
+    parser = argparse.ArgumentParser(
+        description="Generate report for rocpd query", allow_abbrev=False
+    )
+
+    required_params = parser.add_argument_group("Required options")
+
+    required_params.add_argument(
+        "-i",
+        "--input",
+        required=True,
+        type=output_config.check_file_exists,
+        nargs="+",
+        help="Input path and filename to one or more database(s), separated by spaces",
+    )
+
+    valid_out_config_args = add_args_output_config(parser)
+    valid_generic_args = add_generic_args(parser)
+    valid_time_window_args = add_args_time_window(parser)
+    valid_query_args = add_args(parser)
+
+    args = parser.parse_args(argv)
+
+    out_cfg_args = process_args_output_config(args, valid_out_config_args)
+    generic_out_cfg_args = process_generic_args(args, valid_generic_args)
+    window_args = process_args_time_window(args, valid_time_window_args)
+    query_args = process_args(args, valid_query_args)
+
+    all_args = {
+        **query_args,
+        **out_cfg_args,
+        **generic_out_cfg_args,
+    }
+
+    execute(
+        args.input,
+        args,
+        window_args=window_args,
+        **all_args,
+    )
+
+
+if __name__ == "__main__":
+    main()
@@ -0,0 +1,532 @@
+#!/usr/bin/env python3
+###############################################################################
+# MIT License
+#
+# Copyright (c) 2025 Advanced Micro Devices, Inc.
+#
+# Permission is hereby granted, free of charge, to any person obtaining a copy
+# of this software and associated documentation files (the "Software"), to deal
+# in the Software without restriction, including without limitation the rights
+# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+# copies of the Software, and to permit persons to whom the Software is
+# furnished to do so, subject to the following conditions:
+#
+# The above copyright notice and this permission notice shall be included in
+# all copies or substantial portions of the Software.
+#
+# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
+# THE SOFTWARE.
+###############################################################################
+
+import argparse
+import os
+
+from typing import Any, List, Tuple
+from .importer import RocpdImportData, execute_statement
+from .query import export_sqlite_query
+from . import output_config
+
+
+def get_temp_view_names(connection: RocpdImportData) -> List[str]:
+    """Return the names of all temporary views in the SQLite connection."""
+    return [
+        v[0]
+        for v in execute_statement(
+            connection, "SELECT name FROM sqlite_temp_master WHERE type='view';"
+        ).fetchall()
+    ]
+
+
+def get_temp_view_columns(connection: RocpdImportData, view_name: str) -> List[str]:
+    """Return the column names of a given temporary view."""
+    cursor = connection.cursor()
+    cursor.execute(f"PRAGMA table_xinfo('{view_name}')")
+    return [row[1] for row in cursor.fetchall()]
+
+
+def make_temp_view_query(view_name, query) -> str:
+    return "CREATE TEMPORARY VIEW IF NOT EXISTS `{}` AS {}".format(view_name, query)
+
+
+def export_view(
+    connection: RocpdImportData, view_name, output_format, output_path, filename=""
+) -> None:
+    """Write the contents of a SQL view to an output format."""
+
+    query = "SELECT * FROM `{}`".format(view_name)
+    query_one = "SELECT * FROM `{}` LIMIT 1".format(view_name)
+
+    # just return if view is empty
+    if not connection.execute(query_one).fetchone():
+        return
+
+    # prepare the output filename
+    if not filename:
+        output_filename = view_name
+    else:
+        output_filename = f"{filename}_{view_name}"
+
+    if output_format == "console":
+        print(f"\n{view_name.upper()}:")
+
+    # call query module to export.  query will append the extension
+    export_path = os.path.join(output_path, output_filename)
+    export_sqlite_query(
+        connection, query, export_format=output_format, export_path=export_path
+    )
+
+
+def generate_summary_query(
+    view_name: str,
+    name_column="name",
+    by_rank=False,
+) -> Tuple[str, str]:
+    """Generate the SQL statement to create a summary view."""
+
+    if by_rank:
+        view_suffix = "_summary_by_rank"
+        group_by_columns = "guid, {name_column}".format(name_column=name_column)
+        aggregation_group_by = "T.guid, T.nid, T.{name_column}".format(
+            name_column=name_column
+        )
+        total_duration_group_by = "guid"
+        additional_select_columns = "AD.pid AS ProcessID, P.hostname AS Hostname,"
+        additional_aggregated_columns = """
+                    T.guid,
+                    T.nid,
+                    T.pid,"""
+        join_condition = "T.guid = A.guid AND T.{name_column} = A.name".format(
+            name_column=name_column
+        )
+        total_duration_join = "JOIN total_duration TD ON AD.guid = TD.guid JOIN processes P ON AD.pid = P.pid"
+    else:
+        view_suffix = "_summary"
+        group_by_columns = name_column
+        aggregation_group_by = "T.{name_column}".format(name_column=name_column)
+        total_duration_group_by = ""
+        additional_select_columns = ""
+        additional_aggregated_columns = ""
+        join_condition = "T.{name_column} = A.name".format(name_column=name_column)
+        total_duration_join = "CROSS JOIN total_duration TD"
+
+    full_view_name = f"{view_name}{view_suffix}"
+
+    summary_query = f"""
+        WITH
+            avg_data AS (
+                SELECT
+                    {group_by_columns.replace(name_column, f"{name_column} AS name")},
+                    AVG(duration) AS avg_duration
+                FROM {view_name}
+                GROUP BY {group_by_columns}
+            ),
+            aggregated_data AS (
+                SELECT{additional_aggregated_columns}
+                    T.{name_column} as name,
+                    COUNT(*) AS calls,
+                    SUM(T.duration) AS total_duration,
+                    A.avg_duration AS average_duration,
+                    MIN(T.duration) AS min_duration,
+                    MAX(T.duration) AS max_duration,
+                    SQRT(SUM(CAST((T.duration - A.avg_duration) AS REAL) * CAST((T.duration - A.avg_duration) AS REAL)) / (COUNT(*) - 1)) AS std_dev_duration
+                FROM {view_name} T
+                JOIN avg_data A ON {join_condition}
+                GROUP BY {aggregation_group_by}
+            ),
+            total_duration AS (
+                SELECT
+                    {f"{total_duration_group_by}," if total_duration_group_by else ""}
+                    SUM(total_duration) AS grand_total_duration
+                FROM
+                    aggregated_data
+                {f"GROUP BY {total_duration_group_by}" if total_duration_group_by else ""}
+            )
+        SELECT
+            {additional_select_columns}
+            AD.name AS Name,
+            AD.calls AS Calls,
+            AD.total_duration AS "DURATION (nsec)",
+            AD.average_duration AS "AVERAGE (nsec)",
+            (CAST(AD.total_duration AS REAL) / TD.grand_total_duration) * 100 AS "PERCENT (INC)",
+            AD.min_duration AS "MIN (nsec)",
+            AD.max_duration AS "MAX (nsec)",
+            AD.std_dev_duration AS "STD_DEV"
+        FROM
+            aggregated_data AD
+            {total_duration_join}
+        ORDER BY
+            {"AD.pid," if by_rank else ""} AD.total_duration DESC;
+    """
+
+    return (full_view_name, summary_query)
+
+
+def generate_domain_query(connection: RocpdImportData, by_rank=False) -> Tuple[str, str]:
+    """Generate the SQL statement for domain summary by doing union over all summary views."""
+
+    if by_rank:
+        view_suffix = "_summary_by_rank"
+        view_name = "domain_summary_by_rank"
+        additional_group_columns = "ProcessID, Hostname,"
+        additional_select_columns = "GD.ProcessID, GD.Hostname,"
+        total_duration_group_by = "GROUP BY ProcessID"
+        join_condition = "JOIN total_duration TD ON GD.ProcessID = TD.ProcessID"
+        order_by = "ORDER BY GD.ProcessID"
+    else:
+        view_suffix = "_summary"
+        view_name = "domain_summary"
+        additional_group_columns = ""
+        additional_select_columns = ""
+        total_duration_group_by = ""
+        join_condition = "CROSS JOIN total_duration TD"
+        order_by = 'ORDER BY GD."DURATION (nsec)" DESC'
+
+    summary_views = [
+        itr for itr in get_temp_view_names(connection) if itr.endswith(view_suffix)
+    ]
+
+    if len(summary_views) < 1:
+        return view_name
+
+    union_selects = [
+        f" SELECT '{s.replace(view_suffix, '').upper()}' as domain, * FROM {s} "
+        for s in summary_views
+    ]
+
+    domain_select = f"""
+        WITH
+            all_domains AS (
+               {f" UNION ALL ".join(union_selects)}
+            ),
+            grouped_domains AS (
+                SELECT
+                    domain,
+                    {additional_group_columns}
+                    SUM(calls) AS calls,
+                    SUM("DURATION (nsec)") AS "DURATION (nsec)",
+                    SUM("AVERAGE (nsec)") AS "AVERAGE (nsec)",
+                    MIN("MIN (nsec)") AS "MIN (nsec)",
+                    MAX("MAX (nsec)") AS "MAX (nsec)",
+                    SUM("STD_DEV") AS "STD_DEV"
+                FROM all_domains
+                GROUP BY domain{", ProcessID" if by_rank else ""}
+            ),
+            total_duration AS (
+                SELECT
+                    {additional_group_columns}
+                    SUM("DURATION (nsec)") AS grand_total_duration
+                FROM grouped_domains
+                {total_duration_group_by}
+            )
+        SELECT
+            {additional_select_columns}
+            GD.domain AS Name,
+            GD.calls AS Calls,
+            GD."DURATION (nsec)",
+            GD."AVERAGE (nsec)",
+            (CAST(GD."DURATION (nsec)" AS REAL) / TD.grand_total_duration) * 100 AS "PERCENT (INC)",
+            GD."MIN (nsec)",
+            GD."MAX (nsec)",
+            GD."STD_DEV"
+        FROM
+            grouped_domains GD
+            {join_condition}
+        {order_by};
+    """
+
+    return (view_name, domain_select)
+
+
+def create_summary_views(connection: RocpdImportData, by_rank=False) -> None:
+    """Create summary views for eligible temporary views in the database."""
+
+    NAME_COLUMN_MAP = {
+        "memory_allocations": "type",
+        "scratch_memory": "operation",
+    }
+
+    avoid_view_pattern = ("rocpd", "region", "counter", "pmc")
+    required_columns = {"duration"}
+
+    views = get_temp_view_names(connection)
+
+    for view_name in views:
+        if any(pattern in view_name for pattern in avoid_view_pattern):
+            continue
+
+        columns = get_temp_view_columns(connection, view_name)
+        if not required_columns.issubset(columns):
+            continue
+
+        # Create regular summary view
+        summary_view_name, summary_query = generate_summary_query(
+            view_name, name_column=NAME_COLUMN_MAP.get(view_name, "name")
+        )
+        connection.execute(make_temp_view_query(summary_view_name, summary_query))
+
+        # Create per-rank summary
+        if by_rank:
+            per_rank_view_name, summary_by_rank_query = generate_summary_query(
+                view_name,
+                name_column=NAME_COLUMN_MAP.get(view_name, "name"),
+                by_rank=True,
+            )
+            connection.execute(
+                make_temp_view_query(per_rank_view_name, summary_by_rank_query)
+            )
+
+
+def create_summary_region_views(
+    connection: RocpdImportData, by_rank=False, region_categories=None
+) -> None:
+    """Create summary and region views"""
+
+    query = "SELECT DISTINCT(category) FROM regions_and_samples;"
+    categories = execute_statement(connection, query).fetchall()
+
+    if region_categories is None:
+        # Automatically retrieve region categories from the database
+        region_categories = set([cat[0].split("_")[0] for cat in categories])
+
+    category_map = {
+        cat.lower(): [c[0] for c in categories if c[0].startswith(cat + "_")]
+        for cat in region_categories
+        if "MARKER" not in cat.upper()
+    }
+
+    for k, v in category_map.items():
+        if len(v) > 0:
+            conditions = [f"category LIKE '{c}'" for c in v]
+            temp_region_view = f"""
+                CREATE TEMPORARY VIEW IF NOT EXISTS `{k}` AS
+                SELECT *
+                FROM regions_and_samples
+                WHERE {" OR ".join(conditions)};
+            """
+
+            connection.execute(temp_region_view)
+
+            # Create regular summary view
+            summary_view_name, summary_query = generate_summary_query(k)
+            connection.execute(make_temp_view_query(summary_view_name, summary_query))
+
+            # Create per-rank summary view
+            if by_rank:
+                per_rank_view_name, summary_by_rank_query = generate_summary_query(
+                    k, by_rank=True
+                )
+                connection.execute(
+                    make_temp_view_query(per_rank_view_name, summary_by_rank_query)
+                )
+
+    # Markers
+    if "MARKER" not in region_categories:
+        return
+
+    view_name = "markers"
+    markers_create = f"""
+        CREATE TEMPORARY VIEW IF NOT EXISTS `{view_name}` AS
+        SELECT JSON_EXTRACT(extdata, '$.message') AS marker_name, *
+        FROM regions_and_samples
+        WHERE category LIKE 'MARKER_%'
+    """
+    connection.execute(markers_create)
+
+    # Create regular summary view
+    summary_view_name, summary_query = generate_summary_query(
+        view_name, name_column="marker_name"
+    )
+    connection.execute(make_temp_view_query(summary_view_name, summary_query))
+
+    # Create per-rank summary view
+    if by_rank:
+        per_rank_view_name, summary_by_rank_query = generate_summary_query(
+            view_name, name_column="marker_name", by_rank=True
+        )
+        connection.execute(
+            make_temp_view_query(per_rank_view_name, summary_by_rank_query)
+        )
+
+
+def create_domain_view(connection: RocpdImportData, by_rank=False) -> str:
+    """Create a domain summary view by aggregating all summary views."""
+
+    view_name, domain_query = generate_domain_query(connection, by_rank=by_rank)
+
+    # Create the domain summary view
+    connection.execute(make_temp_view_query(view_name, domain_query))
+
+    return view_name
+
+
+def generate_all_summaries(connection: RocpdImportData, **kwargs: Any) -> None:
+    """Generate all summary views and write them to CSV files."""
+
+    domain_summary = kwargs.get("domain_summary", False)
+    by_rank = kwargs.get("summary_by_rank", False)
+    filename = kwargs.get("output_file", "")
+    output_path = kwargs.get("output_path", "./rocpd-output-data")
+    region_categories = kwargs.get("region_categories", None)
+    output_format = kwargs.get("format", "console")
+
+    # create the temporary summary views
+    create_summary_views(connection, by_rank)
+    create_summary_region_views(connection, by_rank, region_categories=region_categories)
+
+    if domain_summary:
+        create_domain_view(connection)
+        # Create domain summary per rank only if both domain_summary and summary_by_rank are enabled
+        if by_rank:
+            create_domain_view(connection, by_rank=True)
+
+    # Write regular summary views
+    print("\nSummary files:")
+    summary_views = [
+        itr for itr in get_temp_view_names(connection) if itr.endswith("_summary")
+    ]
+    for v in summary_views:
+        export_view(connection, v, output_format, output_path, filename)
+
+    # Write per-rank summary views if flag is set
+    if by_rank:
+        print("\nSummary files by rank:")
+        summary_by_rank_views = [
+            itr
+            for itr in get_temp_view_names(connection)
+            if itr.endswith("_summary_by_rank")
+        ]
+        for v in summary_by_rank_views:
+            export_view(connection, v, output_format, output_path, filename)
+
+
+#
+# Command-line interface functions
+#
+
+
+def add_io_args(parser):
+    """Add input/output arguments for summary."""
+    io_options = parser.add_argument_group("I/O options")
+
+    io_options.add_argument(
+        "-f",
+        "--format",
+        help="Sets the format the summaries are output to (default: console)",
+        choices=("console", "csv", "html", "json", "md", "pdf"),
+        default="console",
+        type=str,
+        required=False,
+    )
+    io_options.add_argument(
+        "-o",
+        "--output-file",
+        help="Sets the base output file name",
+        default=os.environ.get("ROCPD_OUTPUT_NAME", ""),
+        type=str,
+        required=False,
+    )
+    io_options.add_argument(
+        "-d",
+        "--output-path",
+        help="Sets the output path where the output files will be saved (default path: `./rocpd-output-data`)",
+        default=os.environ.get("ROCPD_OUTPUT_PATH", "./rocpd-output-data"),
+        type=str,
+        required=False,
+    )
+
+    return ["format", "output_file", "output_path"]
+
+
+def add_args(parser):
+    """Add arguments for summary."""
+    summary_options = parser.add_argument_group("Summary options")
+    summary_options.add_argument(
+        "--domain-summary",
+        action="store_true",
+        default=False,
+        help="Generate domain summary view",
+    )
+    summary_options.add_argument(
+        "--summary-by-rank",
+        action="store_true",
+        default=False,
+        help="Generate summary views by-rank (or Process ID)",
+    )
+    summary_options.add_argument(
+        "--region-categories",
+        nargs="+",
+        default=None,
+        help="Specify region categories to include in the summary (example: HIP, HSA, RCCL, ROCDECODE, ROCJPEG, MARKER). If not specified, categories will be automatically retrieved from the database.",
+    )
+
+    return ["domain_summary", "summary_by_rank", "region_categories"]
+
+
+def process_args(args, valid_args):
+
+    ret = {}
+    for itr in valid_args:
+        if hasattr(args, itr):
+            val = getattr(args, itr)
+            if val is not None:
+                ret[itr] = val
+    return ret
+
+
+def execute(input, window_args=None, **kwargs: Any) -> RocpdImportData:
+    from .time_window import apply_time_window
+
+    importData = RocpdImportData(input)
+
+    apply_time_window(importData, **window_args)
+
+    generate_all_summaries(importData, **kwargs)
+
+    return importData
+
+
+def main(argv=None) -> int:
+    """Main entry point for command line execution."""
+    from .time_window import add_args as add_args_time_window
+    from .time_window import process_args as process_args_time_window
+
+    parser = argparse.ArgumentParser(
+        description="Create ROCpd database summary region views"
+    )
+    required_params = parser.add_argument_group("Required options")
+
+    required_params.add_argument(
+        "-i",
+        "--input",
+        required=True,
+        type=output_config.check_file_exists,
+        nargs="+",
+        help="Input path and filename to one or more database(s), separated by spaces",
+    )
+
+    valid_io_args = add_io_args(parser)
+    valid_summary_args = add_args(parser)
+    valid_time_window_args = add_args_time_window(parser)
+
+    args = parser.parse_args(argv)
+
+    summary_args = process_args(args, valid_summary_args)
+    io_args = output_config.process_args(args, valid_io_args)
+    window_args = process_args_time_window(args, valid_time_window_args)
+
+    all_args = {**summary_args, **io_args}
+
+    execute(
+        args.input,
+        window_args=window_args,
+        **all_args,
+    )
+
+
+if __name__ == "__main__":
+    main()
@@ -38,8 +38,24 @@ __all__ = [
    "nameOsThread",
    "nameHipDevice",
    "context_decorators",
+    "version_info",
 ]

+version_info = {
+    "version": "@PROJECT_VERSION@",
+    "major": int("@PROJECT_VERSION_MAJOR@"),
+    "minor": int("@PROJECT_VERSION_MINOR@"),
+    "patch": int("@PROJECT_VERSION_PATCH@"),
+    "git_revision": "@ROCPROFILER_SDK_GIT_REVISION@",
+    "library_arch": "@CMAKE_LIBRARY_ARCHITECTURE@",
+    "system_name": "@CMAKE_SYSTEM_NAME@",
+    "system_processor": "@CMAKE_SYSTEM_PROCESSOR@",
+    "system_version": "@CMAKE_SYSTEM_VERSION@",
+    "compiler_id": "@CMAKE_CXX_COMPILER_ID@",
+    "compiler_version": "@CMAKE_CXX_COMPILER_VERSION@",
+    "rocm_version": "@rocm_version_FULL_VERSION@",
+}
+

 def mark(msg):
    return libpyroctx.roctxMark(msg) if msg is not None else None
@@ -97,7 +97,7 @@ function(rocprofiler_roctx_python_bindings _VERSION)

    foreach(_SOURCE ${roctx_PYTHON_SOURCES})
        configure_file(${CMAKE_CURRENT_LIST_DIR}/${_SOURCE}
-                       ${roctx_PYTHON_OUTPUT_DIRECTORY}/${_SOURCE} COPYONLY)
+                       ${roctx_PYTHON_OUTPUT_DIRECTORY}/${_SOURCE} @ONLY)
        install(
            FILES ${roctx_PYTHON_OUTPUT_DIRECTORY}/${_SOURCE}
            DESTINATION ${roctx_PYTHON_INSTALL_DIRECTORY}
@@ -154,12 +154,14 @@ function(rocprofiler_rocpd_python_bindings _VERSION)
        output_config.py
        otf2.py
        pftrace.py
+        query.py
        schema.py
+        summary.py
        time_window.py)

    foreach(_SOURCE ${rocpd_PYTHON_SOURCES})
        configure_file(${CMAKE_CURRENT_LIST_DIR}/${_SOURCE}
-                       ${rocpd_PYTHON_OUTPUT_DIRECTORY}/${_SOURCE} COPYONLY)
+                       ${rocpd_PYTHON_OUTPUT_DIRECTORY}/${_SOURCE} @ONLY)
        install(
            FILES ${rocpd_PYTHON_OUTPUT_DIRECTORY}/${_SOURCE}
            DESTINATION ${rocpd_PYTHON_INSTALL_DIRECTORY}
@@ -596,6 +596,7 @@ SELECT
    JSON_EXTRACT(M.extdata, '$.flags') AS alloc_flags,
    M.start,
    M.end,
+    (M.end - M.start) AS duration,
    M.size,
    M.address,
    E.correlation_id,
@@ -151,226 +151,3 @@ GROUP BY
    name
 ORDER BY
    total_duration DESC;
-
-- Kernel summary by name
-CREATE VIEW
-    `kernel_summary` AS
-WITH
-    avg_data AS (
-        SELECT
-            name,
-            AVG(duration) AS avg_duration
-        FROM
-            `kernels`
-        GROUP BY
-            name
-    ),
-    aggregated_data AS (
-        SELECT
-            K.name,
-            COUNT(*) AS calls,
-            SUM(K.duration) AS total_duration,
-            SUM(CAST(K.duration AS REAL) * CAST(K.duration AS REAL)) AS sqr_duration,
-            A.avg_duration AS average_duration,
-            MIN(K.duration) AS min_duration,
-            MAX(K.duration) AS max_duration,
-            SUM(CAST((K.duration - A.avg_duration) AS REAL) * CAST((K.duration - A.avg_duration) AS REAL)) / (COUNT(*) - 1) AS variance_duration,
-            SQRT(
-                SUM(CAST((K.duration - A.avg_duration) AS REAL) * CAST((K.duration - A.avg_duration) AS REAL)) / (COUNT(*) - 1)
-            ) AS std_dev_duration
-        FROM
-            `kernels` K
-            JOIN avg_data A ON K.name = A.name
-        GROUP BY
-            K.name
-    ),
-    total_duration AS (
-        SELECT
-            SUM(total_duration) AS grand_total_duration
-        FROM
-            aggregated_data
-    )
-SELECT
-    AD.name AS name,
-    AD.calls,
-    AD.total_duration AS "DURATION (nsec)",
-    AD.sqr_duration AS "SQR (nsec)",
-    AD.average_duration AS "AVERAGE (nsec)",
-    (CAST(AD.total_duration AS REAL) / TD.grand_total_duration) * 100 AS "PERCENT (INC)",
-    AD.min_duration AS "MIN (nsec)",
-    AD.max_duration AS "MAX (nsec)",
-    AD.variance_duration AS "VARIANCE",
-    AD.std_dev_duration AS "STD_DEV"
-FROM
-    aggregated_data AD
-    CROSS JOIN total_duration TD;
-
--
-- Kernel summary by region name
-CREATE VIEW
-    `kernel_summary_region` AS
-WITH
-    avg_data AS (
-        SELECT
-            region,
-            AVG(duration) AS avg_duration
-        FROM
-            `kernels`
-        GROUP BY
-            region
-    ),
-    aggregated_data AS (
-        SELECT
-            K.region AS name,
-            COUNT(*) AS calls,
-            SUM(K.duration) AS total_duration,
-            SUM(CAST(K.duration AS REAL) * CAST(K.duration AS REAL)) AS sqr_duration,
-            A.avg_duration AS average_duration,
-            MIN(K.duration) AS min_duration,
-            MAX(K.duration) AS max_duration,
-            SUM(CAST((K.duration - A.avg_duration) AS REAL) * CAST((K.duration - A.avg_duration) AS REAL)) / (COUNT(*) - 1) AS variance_duration,
-            SQRT(
-                SUM(CAST((K.duration - A.avg_duration) AS REAL) * CAST((K.duration - A.avg_duration) AS REAL)) / (COUNT(*) - 1)
-            ) AS std_dev_duration
-        FROM
-            `kernels` K
-            JOIN avg_data A ON K.region = A.region
-        GROUP BY
-            K.region
-    ),
-    total_duration AS (
-        SELECT
-            SUM(total_duration) AS grand_total_duration
-        FROM
-            aggregated_data
-    )
-SELECT
-    AD.name AS name,
-    AD.calls,
-    AD.total_duration AS "DURATION (nsec)",
-    AD.sqr_duration AS "SQR (nsec)",
-    AD.average_duration AS "AVERAGE (nsec)",
-    (CAST(AD.total_duration AS REAL) / TD.grand_total_duration) * 100 AS "PERCENT (INC)",
-    AD.min_duration AS "MIN (nsec)",
-    AD.max_duration AS "MAX (nsec)",
-    AD.variance_duration AS "VARIANCE",
-    AD.std_dev_duration AS "STD_DEV"
-FROM
-    aggregated_data AD
-    CROSS JOIN total_duration TD;
-
--
-- Memory copy summary
-CREATE VIEW
-    `memory_copy_summary` AS
-WITH
-    avg_data AS (
-        SELECT
-            name,
-            AVG(duration) AS avg_duration
-        FROM
-            `memory_copies`
-        GROUP BY
-            name
-    ),
-    aggregated_data AS (
-        SELECT
-            MC.name,
-            COUNT(*) AS calls,
-            SUM(MC.duration) AS total_duration,
-            SUM(CAST(MC.duration AS REAL) * CAST(MC.duration AS REAL)) AS sqr_duration,
-            A.avg_duration AS average_duration,
-            MIN(MC.duration) AS min_duration,
-            MAX(MC.duration) AS max_duration,
-            SUM(
-                CAST((MC.duration - A.avg_duration) AS REAL) * CAST((MC.duration - A.avg_duration) AS REAL)
-            ) / (COUNT(*) - 1) AS variance_duration,
-            SQRT(
-                SUM(
-                    CAST((MC.duration - A.avg_duration) AS REAL) * CAST((MC.duration - A.avg_duration) AS REAL)
-                ) / (COUNT(*) - 1)
-            ) AS std_dev_duration
-        FROM
-            `memory_copies` MC
-            JOIN avg_data A ON MC.name = A.name
-        GROUP BY
-            MC.name
-    ),
-    total_duration AS (
-        SELECT
-            SUM(total_duration) AS grand_total_duration
-        FROM
-            aggregated_data
-    )
-SELECT
-    AD.name AS name,
-    AD.calls,
-    AD.total_duration AS "DURATION (nsec)",
-    AD.sqr_duration AS "SQR (nsec)",
-    AD.average_duration AS "AVERAGE (nsec)",
-    (CAST(AD.total_duration AS REAL) / TD.grand_total_duration) * 100 AS "PERCENT (INC)",
-    AD.min_duration AS "MIN (nsec)",
-    AD.max_duration AS "MAX (nsec)",
-    AD.variance_duration AS "VARIANCE",
-    AD.std_dev_duration AS "STD_DEV"
-FROM
-    aggregated_data AD
-    CROSS JOIN total_duration TD;
-
--
-- Memory allocation summary
-CREATE VIEW
-    `memory_allocation_summary` AS
-WITH
-    avg_data AS (
-        SELECT
-            type AS name,
-            AVG(duration) AS avg_duration
-        FROM
-            `memory_allocations`
-        GROUP BY
-            type
-    ),
-    aggregated_data AS (
-        SELECT
-            MA.type AS name,
-            COUNT(*) AS calls,
-            SUM(MA.duration) AS total_duration,
-            SUM(CAST(MA.duration AS REAL) * CAST(MA.duration AS REAL)) AS sqr_duration,
-            A.avg_duration AS average_duration,
-            MIN(MA.duration) AS min_duration,
-            MAX(MA.duration) AS max_duration,
-            SUM(
-                CAST((MA.duration - A.avg_duration) AS REAL) * CAST((MA.duration - A.avg_duration) AS REAL)
-            ) / (COUNT(*) - 1) AS variance_duration,
-            SQRT(
-                SUM(
-                    CAST((MA.duration - A.avg_duration) AS REAL) * CAST((MA.duration - A.avg_duration) AS REAL)
-                ) / (COUNT(*) - 1)
-            ) AS std_dev_duration
-        FROM
-            `memory_allocations` MA
-            JOIN avg_data A ON MA.type = A.name
-        GROUP BY
-            MA.type
-    ),
-    total_duration AS (
-        SELECT
-            SUM(total_duration) AS grand_total_duration
-        FROM
-            aggregated_data
-    )
-SELECT
-    'MEMORY_ALLOCATION_' || AD.name AS name,
-    AD.calls,
-    AD.total_duration AS "DURATION (nsec)",
-    AD.sqr_duration AS "SQR (nsec)",
-    AD.average_duration AS "AVERAGE (nsec)",
-    (CAST(AD.total_duration AS REAL) / TD.grand_total_duration) * 100 AS "PERCENT (INC)",
-    AD.min_duration AS "MIN (nsec)",
-    AD.max_duration AS "MAX (nsec)",
-    AD.variance_duration AS "VARIANCE",
-    AD.std_dev_duration AS "STD_DEV"
-FROM
-    aggregated_data AD
-    CROSS JOIN total_duration TD;
@@ -22,7 +22,7 @@ set(rocpd-env
 #
 #########################################################################################

-foreach(_SUBPARSER "" "-convert")
+foreach(_SUBPARSER "" "-convert" "-query" "-summary")
    string(REPLACE "-" "" _CMD "${_SUBPARSER}")
    add_test(NAME rocpd${_SUBPARSER}-help COMMAND ${Python3_EXECUTABLE} -m rocpd ${_CMD}
                                                  --help)
@@ -34,7 +34,7 @@ foreach(_SUBPARSER "" "-convert")
                   "${ROCPROFILER_DEFAULT_FAIL_REGEX}")
 endforeach()

-foreach(_MODULE "csv" "pftrace" "otf2")
+foreach(_MODULE "csv" "pftrace" "otf2" "query" "summary")
    add_test(NAME rocpd-module-${_MODULE}-help COMMAND ${Python3_EXECUTABLE} -m
                                                       rocpd.${_MODULE} --help)

@@ -222,6 +222,58 @@ set_tests_properties(
               FIXTURES_REQUIRED
               rocprofv3-test-rocpd)

+#########################################################################################
+#
+# Summary generate
+#
+#########################################################################################
+add_test(
+    NAME rocprofv3-test-rocpd-summary-generation
+    COMMAND
+        ${Python3_EXECUTABLE} -m rocpd summary --domain-summary --summary-by-rank -f csv
+        -d ${CMAKE_CURRENT_BINARY_DIR}/rocpd-output-data/summary -i
+        ${CMAKE_CURRENT_BINARY_DIR}/rocpd-input-data/out_results.db)
+
+set_tests_properties(
+    rocprofv3-test-rocpd-summary-generation
+    PROPERTIES TIMEOUT
+               45
+               LABELS
+               "integration-tests;rocpd"
+               ENVIRONMENT
+               "${rocprofv3-rocpd-env}"
+               DEPENDS
+               "rocprofv3-test-rocpd-execute"
+               FAIL_REGULAR_EXPRESSION
+               "${ROCPROFILER_DEFAULT_FAIL_REGEX}"
+               FIXTURES_SETUP
+               rocprofv3-test-rocpd-generation
+               FIXTURES_REQUIRED
+               rocprofv3-test-rocpd)
+
+add_test(
+    NAME rocprofv3-test-rocpd-summary-generation-multiproc
+    COMMAND
+        ${Python3_EXECUTABLE} -m rocpd summary --domain-summary --summary-by-rank -f csv
+        -d ${CMAKE_CURRENT_BINARY_DIR}/rocpd-output-test/summary -o out_mp -i
+        ${CMAKE_CURRENT_BINARY_DIR}/rocpd-input-data-multiproc/out_mp_0_results.db
+        ${CMAKE_CURRENT_BINARY_DIR}/rocpd-input-data-multiproc/out_mp_1_results.db)
+
+set_tests_properties(
+    rocprofv3-test-rocpd-summary-generation-multiproc
+    PROPERTIES TIMEOUT
+               120
+               LABELS
+               "integration-tests;rocpd"
+               ENVIRONMENT
+               "${rocprofv3-rocpd-env}"
+               FAIL_REGULAR_EXPRESSION
+               "${ROCPROFILER_DEFAULT_FAIL_REGEX}"
+               DISABLED
+               "${MULTIPROC_IS_DISABLED}"
+               FIXTURES_REQUIRED
+               rocprofv3-test-rocpd-multiproc)
+
 #########################################################################################
 #
 # Validation