Source code for perun.io.text_report

"""Text report module."""

import logging
from typing import Any, Dict, List

import pandas as pd

from perun.data_model.data import DataNode, MetricType, Stats
from perun.io.util import value2MeanStdStr, value2ValueUnitStr

log = logging.getLogger(__name__)

tableMetrics = [
    MetricType.RUNTIME,
    MetricType.ENERGY,
    MetricType.POWER,
    MetricType.CPU_POWER,
    MetricType.CPU_UTIL,
    MetricType.GPU_POWER,
    MetricType.GPU_MEM,
    MetricType.DRAM_POWER,
    MetricType.DRAM_MEM,
]

regionMetrics = {
    MetricType.RUNTIME: "Avg Runtime",
    MetricType.POWER: "Avg Power",
    MetricType.CPU_UTIL: "Avg CPU Util",
    MetricType.DRAM_MEM: "Avg RAM Mem Util",
    MetricType.GPU_MEM: "Avg GPU Mem Util",
}



[docs]
def textReport(dataNode: DataNode, mr_id: str) -> str:
    """Create text report from selected MULTI_RUN node.

    Parameters
    ----------
    dataNode : DataNode
        Application data node
    mr_id : str
        Multirun id

    Returns
    -------
    str
        Report string
    """
    if not dataNode.processed:
        log.error("Data has not been processed, unable to create report.")
        raise Exception("Cannot generate report from unprocessed data node.")

    if mr_id not in dataNode.nodes:
        log.error("Non existent run id")
        raise Exception("Cannot generate report with non existent id.")

    # Report header
    report_header = (
        "PERUN REPORT\n"
        "\n"
        f"App name: {dataNode.id}\n"
        f"First run: {dataNode.metadata['creation_dt']}\n"
        f"Last run: {dataNode.metadata['last_execution_dt']}\n"
        "\n\n"
    )

    # Host and device table
    host_device_rows = []
    region_rows = []
    mr_node: DataNode = dataNode.nodes[mr_id]

    for run_number, run_node in mr_node.nodes.items():
        if run_node.regions:
            for region_name, region in run_node.regions.items():
                if region.processed:
                    row = {
                        "Round #": run_node.id,
                        "Function": region_name,
                        "Avg Calls / Rank": region.runs_per_rank.mean,
                    }
                    row.update(
                        {
                            regionMetrics[metric_type]: value2MeanStdStr(stats)
                            for metric_type, stats in region.metrics.items()
                            if metric_type in regionMetrics
                        }
                    )
                    region_rows.append(row)
        for host_name, host_node in run_node.nodes.items():
            entry = {
                "Round #": run_number,
                "Host": host_name,
            }
            for metric_type in tableMetrics:
                if metric_type in host_node.metrics:
                    m = host_node.metrics[metric_type]
                    entry[metric_type.name] = value2ValueUnitStr(m.value, m.metric_md)

            host_device_rows.append(entry)
        entry = {"Round #": run_number, "Host": "All"}
        for metric_type in tableMetrics:
            if metric_type in run_node.metrics:
                m = run_node.metrics[metric_type]
                entry[metric_type.name] = value2ValueUnitStr(m.value, m.metric_md)

        host_device_rows.append(entry)

    mr_table = pd.DataFrame.from_records(host_device_rows).sort_values(
        by=["Host", "Round #"]
    )
    mr_report_str = (
        f"RUN ID: {mr_id}\n\n"
        + mr_table.to_markdown(index=False, stralign="right")
        + "\n\n"
    )

    # Regions
    if len(region_rows) > 0:
        region_table = pd.DataFrame.from_records(region_rows).sort_values(
            by=["Function", "Round #"]
        )
        region_report_str = (
            "Monitored Functions\n\n"
            + region_table.to_markdown(index=False, stralign="right")
            + "\n\n"
        )
    else:
        region_report_str = ""

    n_runs = len(dataNode.nodes)
    if MetricType.ENERGY in dataNode.metrics and isinstance(
        dataNode.metrics[MetricType.ENERGY], Stats
    ):
        stats: Stats = dataNode.metrics[MetricType.ENERGY]  # type: ignore[assignment]

        # Application Summary
        total_energy = stats.sum
        e_kWh = total_energy / (3600 * 1e3)
        kgCO2 = dataNode.metrics[MetricType.CO2].sum / 1e3  # type: ignore[union-attr]
        money = dataNode.metrics[MetricType.MONEY].sum  # type: ignore[union-attr]
        money_icon = mr_node.metadata["post-processing.price_unit"]

        app_summary_str = f"Application Summary\n\nThe application has been run {n_runs} times. In total, it has used {e_kWh:.3f} kWh, released a total of {kgCO2:.3f} kgCO2e into the atmosphere, and you paid {money:.2f} {money_icon} in electricity for it."
    else:
        app_summary_str = f"The application has been run {n_runs} times."

    return report_header + mr_report_str + region_report_str + app_summary_str




[docs]
def sensors_table(sensors: List[Dict[str, Any]], by_rank: bool = True) -> str:
    """Create a text table from a list of sensor readings.

    Parameters
    ----------
    sensors : list[dict[str, Any]]
        List of sensor readings
    by_rank: bool, optional
        If the table should separate available sensors by rank.

    Returns
    -------
    str
        Table string
    """
    if not sensors:
        return "No sensor data available."

    result = ""
    if by_rank:
        for rank, rank_sensors in enumerate(sensors):
            result += f"RANK {rank}:\n"

            table = (
                pd.DataFrame.from_dict(
                    rank_sensors, orient="index", columns=["Source", "Device", "Unit"]
                )
                .reset_index()
                .rename(columns={"index": "Sensor"})
                .sort_values(by=["Source", "Sensor"])
                .to_markdown(index=False, stralign="right")
            )
            result += table + "\n\n"

    else:
        table = (
            pd.DataFrame.from_dict(
                sensors[0], orient="index", columns=["Source", "Device", "Unit"]
            )
            .reset_index()
            .rename(columns={"index": "Sensor"})
            .sort_values(by=["Source", "Sensor"])
            .to_markdown(index=False, stralign="right")
        )
        result += table + "\n"

    return result