Source code for ramble.test.reports

# Copyright 2022-2025 The Ramble Authors
#
# Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
# https://www.apache.org/licenses/LICENSE-2.0> or the MIT license
# <LICENSE-MIT or https://opensource.org/licenses/MIT>, at your
# option. This file may not be copied, modified, or distributed
# except according to those terms.

# Test command line args

# Test file import for JSON (done) and YAML
# - non-repeated experiments
# - repeated experiments

# Test normalization of data, and error when first value is zero

# Test that PDF is generated and contains data (size > some value?)

import os

import pandas as pd

# Possible to test that a specific chart was correctly generated? Not sure...
import pytest
from matplotlib.backends.backend_pdf import PdfPages

import ramble.reports
from ramble.util import foms

single_experiments = [
    {
        "RAMBLE_STATUS": "SUCCESS",
        "name": "single_exp_1",
        "n_nodes": 1,
        "simplified_workload_namespace": "test_app_test_workload",
        "RAMBLE_VARIABLES": {"repeat_index": "0"},
        "RAMBLE_RAW_VARIABLES": {},
        "CONTEXTS": [
            {
                "name": "null",
                "display_name": "null",
                "foms": [
                    {
                        "name": "fom_1",
                        "value": 42.0,
                        "units": "",
                        "origin": "dummy_app",
                        "origin_type": "application",
                        "fom_type": {"name": "MEASURE", "better_direction": "INDETERMINATE"},
                    },
                    {
                        "name": "fom_2",
                        "value": 50,
                        "units": "",
                        "origin": "dummy_app",
                        "origin_type": "application",
                        "fom_type": {"name": "MEASURE", "better_direction": "INDETERMINATE"},
                    },
                ],
            },
        ],
    },
    {
        "RAMBLE_STATUS": "SUCCESS",
        "name": "single_exp_2",
        "n_nodes": 2,
        "simplified_workload_namespace": "test_app_test_workload",
        "RAMBLE_VARIABLES": {"repeat_index": "0"},
        "RAMBLE_RAW_VARIABLES": {},
        "CONTEXTS": [
            {
                "name": "null",
                "display_name": "null",
                "foms": [
                    {
                        "name": "fom_1",
                        "value": 28.0,
                        "units": "",
                        "origin": "dummy_app",
                        "origin_type": "application",
                        "fom_type": {"name": "MEASURE", "better_direction": "INDETERMINATE"},
                    },
                    {
                        "name": "fom_2",
                        "value": 55,
                        "units": "",
                        "origin": "dummy_app",
                        "origin_type": "application",
                        "fom_type": {"name": "MEASURE", "better_direction": "INDETERMINATE"},
                    },
                ],
            },
        ],
    },
]

repeat_experiments = [
    {
        "RAMBLE_STATUS": "SUCCESS",
        "name": "repeat_exp_1",
        "n_nodes": 1,
        "simplified_workload_namespace": "test_app_test_workload",
        "N_REPEATS": 2,
        "RAMBLE_VARIABLES": {"repeat_index": 0},
        "RAMBLE_RAW_VARIABLES": {},
        "CONTEXTS": [
            {
                "name": "null",
                "display_name": "null",
                "foms": [
                    {
                        "value": 2,
                        "units": "repeats",
                        "origin": "dummy_app",
                        "origin_type": "summary::n_total_repeats",
                        "name": "Experiment Summary",
                        "fom_type": {"name": "MEASURE", "better_direction": "INDETERMINATE"},
                    },
                    {
                        "value": 2,
                        "units": "repeats",
                        "origin": "dummy_app",
                        "origin_type": "summary::n_successful_repeats",
                        "name": "Experiment Summary",
                        "fom_type": {"name": "MEASURE", "better_direction": "INDETERMINATE"},
                    },
                    {
                        "value": 28.0,
                        "units": "s",
                        "origin": "dummy_app",
                        "origin_type": "summary::min",
                        "name": "fom_1",
                        "fom_type": {"name": "TIME", "better_direction": "LOWER"},
                    },
                    {
                        "value": 30.0,
                        "units": "s",
                        "origin": "dummy_app",
                        "origin_type": "summary::max",
                        "name": "fom_1",
                        "fom_type": {"name": "TIME", "better_direction": "LOWER"},
                    },
                    {
                        "value": 29.0,
                        "units": "s",
                        "origin": "dummy_app",
                        "origin_type": "summary::mean",
                        "name": "fom_1",
                        "fom_type": {"name": "TIME", "better_direction": "LOWER"},
                    },
                ],
            },
        ],
    },
    {
        "RAMBLE_STATUS": "SUCCESS",
        "name": "repeat_exp_1.1",
        "n_nodes": 2,
        "simplified_workload_namespace": "test_app_test_workload",
        "N_REPEATS": 0,
        "RAMBLE_VARIABLES": {"repeat_index": 1},
        "RAMBLE_RAW_VARIABLES": {},
        "CONTEXTS": [
            {
                "name": "null",
                "display_name": "null",
                "foms": [
                    {
                        "name": "fom_1",
                        "value": 28.0,
                        "units": "",
                        "origin": "dummy_app",
                        "origin_type": "application",
                        "fom_type": {"name": "TIME", "better_direction": "LOWER"},
                    },
                    {
                        "name": "fom_2",
                        "value": 55,
                        "units": "",
                        "origin": "dummy_app",
                        "origin_type": "application",
                        "fom_type": {"name": "MEASURE", "better_direction": "INDETERMINATE"},
                    },
                ],
            },
        ],
    },
    {
        "RAMBLE_STATUS": "SUCCESS",
        "name": "repeat_exp_1.2",
        "n_nodes": 2,
        "simplified_workload_namespace": "test_app_test_workload",
        "N_REPEATS": 0,
        "RAMBLE_VARIABLES": {"repeat_index": 2},
        "RAMBLE_RAW_VARIABLES": {},
        "CONTEXTS": [
            {
                "name": "null",
                "display_name": "null",
                "foms": [
                    {
                        "name": "fom_1",
                        "value": 30.0,
                        "units": "",
                        "origin": "dummy_app",
                        "origin_type": "application",
                        "fom_type": {"name": "TIME", "better_direction": "LOWER"},
                    },
                    {
                        "name": "fom_2",
                        "value": 55,
                        "units": "",
                        "origin": "dummy_app",
                        "origin_type": "application",
                        "fom_type": {"name": "MEASURE", "better_direction": "INDETERMINATE"},
                    },
                ],
            },
        ],
    },
]

results = {"experiments": single_experiments}

all_experiments = repeat_experiments + single_experiments
repeat_results = {"experiments": all_experiments}



[docs]
def create_test_exp(
    success,
    name,
    n_nodes,
    wl_ns,
    ramble_vars,
    ramble_raw_vars,
    context,
    fom_name,
    fom_value,
    units,
    origin,
    origin_type,
    fom_type,
    better_direction,
    fv,
    ifv,
    normalized=False,
    repeat_index="0",
):
    test_exp_dict = {
        "RAMBLE_STATUS": success,
        "name": name,
        "n_nodes": n_nodes,
        "simplified_workload_namespace": wl_ns,
        "RAMBLE_VARIABLES": ramble_vars,
        "RAMBLE_RAW_VARIABLES": ramble_raw_vars,
        "context": context,
        "fom_name": fom_name,
        "fom_type": fom_type,
        "better_direction": better_direction,
        "fom_value": fom_value,
        "fom_units": units,
        "fom_origin": origin,
        "fom_origin_type": origin_type,
        "repeat_index": repeat_index,
        "series": wl_ns,
        "normalized_fom_value" if normalized else "fom_value": fv,
    }
    # ideal_perf_value is not calculated for plots without better_direction
    if ifv:
        test_exp_dict["ideal_perf_value"] = ifv
    return test_exp_dict




[docs]
@pytest.mark.parametrize(
    "values",
    [
        (ramble.reports.StrongScalingPlot, "fom_1", 42.0, 42.0, 42.0, 28.0, 28.0, 21.0, False),
        (ramble.reports.StrongScalingPlot, "fom_1", 42.0, 1.0, 1.0, 28.0, 28.0 / 42.0, 2.0, True),
        (ramble.reports.WeakScalingPlot, "fom_2", 50, 50, None, 55, 55.0, None, False),
        (ramble.reports.WeakScalingPlot, "fom_2", 50.0, 1.0, None, 55.0, 1.1, None, True),
    ],
)
def test_scaling_plots(mutable_mock_workspace_path, tmpdir_factory, values):

    report_name = "unit_test"
    report_dir_path = tmpdir_factory.mktemp(report_name)
    pdf_path = os.path.join(report_dir_path, f"{report_name}.pdf")

    plot_type, fom_name, fom1, nfv1, ideal1, fom2, nfv2, ideal2, normalize = values

    test_spec = [fom_name, "n_nodes"]

    ideal_data = []
    ideal_data.append(
        create_test_exp(
            "SUCCESS",
            "single_exp_1",
            1,
            "test_app_test_workload",
            {"repeat_index": "0"},
            {},
            "null",
            fom_name,
            fom1,
            "",
            "dummy_app",
            "application",
            foms.FomType.MEASURE,
            foms.BetterDirection.INDETERMINATE,
            nfv1,
            ideal1,
            normalized=normalize,
        )
    )
    ideal_data.append(
        create_test_exp(
            "SUCCESS",
            "single_exp_2",
            2,
            "test_app_test_workload",
            {"repeat_index": "0"},
            {},
            "null",
            fom_name,
            fom2,
            "",
            "dummy_app",
            "application",
            foms.FomType.MEASURE,
            foms.BetterDirection.INDETERMINATE,
            nfv2,
            ideal2,
            normalized=normalize,
        )
    )

    ideal_df = pd.DataFrame(ideal_data, columns=ideal_data[0].keys())

    # Update index to match
    ideal_df = ideal_df.set_index("n_nodes")

    ideal_df[["RAMBLE_VARIABLES", "RAMBLE_RAW_VARIABLES", "repeat_index", "fom_units"]] = ideal_df[
        ["RAMBLE_VARIABLES", "RAMBLE_RAW_VARIABLES", "repeat_index", "fom_units"]
    ].astype(object)

    logx = False
    logy = False
    split_by = "simplified_workload_namespace"

    where_query = None
    results_df = ramble.reports.prepare_data(results, where_query)
    plot = plot_type(test_spec, normalize, report_dir_path, results_df, logx, logy, split_by)

    with PdfPages(pdf_path) as pdf_report:
        plot.generate_plot_data(pdf_report)

        # Sort columns alphabetically, order is not important
        plot.output_df.sort_index(axis=1, inplace=True)
        ideal_df.sort_index(axis=1, inplace=True)

        assert plot.output_df.equals(ideal_df)
        assert os.path.isfile(pdf_path)




[docs]
def test_repeat_import(mutable_mock_workspace_path):
    where_query = None
    results_df = ramble.reports.prepare_data(repeat_results, where_query)

    # DF contains only summary exp and not individual repeats
    assert "repeat_exp_1" in results_df.values
    assert "repeat_exp_1.1" not in results_df.values
    assert "single_exp_1" in results_df.values

    # Summary FOMs are present in DF, types converted to objects
    row_mean = results_df.query("fom_origin_type == 'summary::mean'")
    assert row_mean["fom_value"].values == [29.0]
    assert row_mean["fom_type"].values == [foms.FomType.TIME]
    assert row_mean["better_direction"].values == [foms.BetterDirection.LOWER]

    single_exp_rows = results_df.query("name == 'single_exp_1' and fom_name == 'fom_1'")
    assert single_exp_rows["fom_value"].values == [42.0]




[docs]
def test_fom_plot(mutable_mock_workspace_path, tmpdir_factory):
    report_name = "unit_test"
    report_dir_path = tmpdir_factory.mktemp(report_name)
    pdf_path = os.path.join(report_dir_path, f"{report_name}.pdf")

    where_query = None
    for exp in results["experiments"]:
        exp.update({"simplified_experiment_namespace": "test_exp"})

    results_df = ramble.reports.prepare_data(results, where_query)

    plot = ramble.reports.FomPlot(None, False, report_dir_path, results_df, False, False, None)
    with PdfPages(pdf_path) as pdf_report:
        plot.generate_plot_data(pdf_report)

    assert os.path.isfile(pdf_path)
    assert os.path.isfile(os.path.join(report_dir_path, "foms_fom_1_by_experiments.png"))




[docs]
def test_compare_plot(mutable_mock_workspace_path, tmpdir_factory):
    report_name = "unit_test"
    report_dir_path = tmpdir_factory.mktemp(report_name)
    pdf_path = os.path.join(report_dir_path, f"{report_name}.pdf")

    where_query = None
    results_df = ramble.reports.prepare_data(results, where_query)

    spec = ["fom_1", "n_nodes"]
    plot = ramble.reports.ComparisonPlot(
        spec, False, report_dir_path, results_df, False, False, None
    )
    with PdfPages(pdf_path) as pdf_report:
        plot.generate_plot_data(pdf_report)

    assert os.path.isfile(pdf_path)
    assert os.path.isfile(os.path.join(report_dir_path, "fom_1_by_n_nodes.png"))




[docs]
def test_where_query(mutable_mock_workspace_path):
    where_query = 'fom_name == "fom_1"'
    results_df = ramble.reports.prepare_data(results, where_query)
    filtered_foms = results_df["fom_name"].tolist()

    assert "fom_1" in filtered_foms
    assert "fom_2" not in filtered_foms




[docs]
def test_multiple_groupby(mutable_mock_workspace_path, tmpdir_factory, capsys):
    report_name = "unit_test"
    report_dir_path = tmpdir_factory.mktemp(report_name)
    pdf_path = os.path.join(report_dir_path, f"{report_name}.pdf")

    in_data = [
        ("exp_1", 1, "test_wl_1", "1.0", "app_v1"),
        ("exp_2", 1, "test_wl_2", "2.0", "app_v1"),
        ("exp_3", 2, "test_wl_1", "3.0", "app_v1"),
        ("exp_4", 2, "test_wl_2", "4.0", "app_v1"),
        ("exp_5", 1, "test_wl_1", "10.0", "app_v2"),
        ("exp_6", 1, "test_wl_2", "20.0", "app_v2"),
        ("exp_7", 2, "test_wl_1", "30.0", "app_v2"),
        ("exp_8", 2, "test_wl_2", "40.0", "app_v2"),
    ]
    experiments = []
    for exp in in_data:
        name, n_nodes, wl_ns, fom_value, test_app = exp

        experiments.append(
            create_test_exp(
                success="SUCCESS",
                name=name,
                n_nodes=n_nodes,
                wl_ns=wl_ns,
                ramble_vars={"repeat_index": "0"},
                ramble_raw_vars={},
                context="null",
                fom_name="fom_1",
                fom_value=fom_value,
                units="",
                origin=test_app,
                origin_type="application",
                fom_type=foms.FomType.MEASURE,
                better_direction=foms.BetterDirection.INDETERMINATE,
                fv=fom_value,
                ifv=None,
                normalized=False,
            )
        )

    test_df = pd.DataFrame(experiments, columns=experiments[0].keys())

    test_spec = ["fom_1", "n_nodes", "simplified_workload_namespace"]
    logx = False
    logy = False
    split_by = "simplified_workload_namespace"
    plot = ramble.reports.StrongScalingPlot(
        test_spec, False, report_dir_path, test_df, logx, logy, split_by
    )

    with PdfPages(pdf_path) as pdf_report:
        with pytest.raises(SystemExit):
            plot.generate_plot_data(pdf_report)
        captured = capsys.readouterr().err
        assert "Error: Attempting to plot non-unique data." in captured

    test_spec = ["fom_1", "n_nodes", "simplified_workload_namespace", "fom_origin"]
    plot = ramble.reports.StrongScalingPlot(
        test_spec, False, report_dir_path, test_df, logx, logy, split_by
    )
    with PdfPages(pdf_path) as pdf_report:
        plot.generate_plot_data(pdf_report)

    assert os.path.isfile(pdf_path)
    assert os.path.isfile(
        os.path.join(
            report_dir_path, "strong-scaling_fom_1_vs_n_nodes_test_wl_1_x_test_wl_1_x_app_v1.png"
        )
    )