Source code for ramble.test.end_to_end.wrfv4_dry_run

# Copyright 2022-2026 The Ramble Authors
#
# Licensed under the Apache License, Version 2.0 <LICENSE-APACHE or
# https://www.apache.org/licenses/LICENSE-2.0> or the MIT license
# <LICENSE-MIT or https://opensource.org/licenses/MIT>, at your
# option. This file may not be copied, modified, or distributed
# except according to those terms.

import glob
import os
import re

import pytest

import ramble.workspace
from ramble.main import RambleCommand
from ramble.test.dry_run_helpers import search_files_for_string

# everything here uses the mock_workspace_path
pytestmark = pytest.mark.usefixtures("mutable_config", "mutable_mock_workspace_path")

workspace = RambleCommand("workspace")



[docs]
@pytest.mark.long
def test_wrfv4_spack_dry_run(mutable_config, mutable_mock_workspace_path, workspace_name):
    test_config = """
ramble:
  variants:
    package_manager: spack
  variables:
    mpi_command: 'mpirun -n {n_ranks} -ppn {processes_per_node}'
    batch_submit: 'batch_submit {execute_experiment}'
    partition: ['part1', 'part2']
    processes_per_node: ['16', '36']
    n_ranks: '{processes_per_node}*{n_nodes}'
    n_threads: '1'
  applications:
    wrfv4:
      variables:
        env_name: ['wrfv4', 'wrfv4-portable']
      workloads:
        CONUS_12km:
          experiments:
            scaling_{n_nodes}_{partition}_{env_name}:
              success_criteria:
              - name: 'timing'
                mode: 'string'
                match: '.*Timing for main.*'
                file: '{experiment_run_dir}/rsl.out.base'
              env_vars:
                set:
                  OMP_NUM_THREADS: '{n_threads}'
                  TEST_VAR: '1'
                append:
                - var-separator: ', '
                  vars:
                    TEST_VAR: 'add_var'
                - paths:
                    TEST_VAR: 'new_path'
                prepend:
                - paths:
                    TEST_VAR: 'pre_path'
                unset:
                - TEST_VAR
              variables:
                n_nodes: ['1', '2', '4', '8', '16']
                lic_path: /fake/lic/path
              matrix:
              - n_nodes
              - env_name
  software:
    packages:
      gcc:
        pkg_spec: gcc@13.2.0
      intel-mpi:
        pkg_spec: intel-oneapi-mpi@2021.11.0
        compiler: gcc
      wrfv4:
        pkg_spec: wrf@4.2 build_type=dm+sm compile_type=em_real nesting=basic ~chem ~pnetcdf
        compiler: gcc
      wrfv4-portable:
        pkg_spec: 'wrf@4.2 build_type=dm+sm compile_type=em_real
          nesting=basic ~chem ~pnetcdf target=x86_64'
        compiler: gcc
    environments:
      wrfv4:
        packages:
        - wrfv4
        - intel-mpi
      wrfv4-portable:
        packages:
        - wrfv4-portable
        - intel-mpi
"""

    test_licenses = """
licenses:
  wrfv4:
    set:
      WRF_LICENSE: port@server
      WRF_CERTIFICATE_PATH: '{lic_path}'
"""

    test_compilers = """
compilers:
- compiler:
    spec: gcc@=13.2.0
    paths:
      cc: /usr/bin/gcc
      cxx: /usr/bin/g++
      f77: null
      fc: null
    flags: {}
    operating_system: rocky8
    target: x86_64
    modules: []
    environment: {}
    extra_rpaths: []
"""

    with ramble.workspace.create(workspace_name) as ws1:
        ws1.write()

        config_path = os.path.join(ws1.config_dir, ramble.workspace.CONFIG_FILE_NAME)
        license_path = os.path.join(ws1.config_dir, "licenses.yaml")

        compilers_path = os.path.join(
            ws1.config_dir, ramble.workspace.AUXILIARY_SOFTWARE_DIR_NAME, "compilers.yaml"
        )

        aux_software_path = os.path.join(
            ws1.config_dir, ramble.workspace.AUXILIARY_SOFTWARE_DIR_NAME
        )
        aux_software_files = ["packages.yaml", "my_test.sh"]

        with open(config_path, "w+") as f:
            f.write(test_config)

        with open(license_path, "w+") as f:
            f.write(test_licenses)

        with open(compilers_path, "w+") as f:
            f.write(test_compilers)

        for file in aux_software_files:
            file_path = os.path.join(aux_software_path, file)
            with open(file_path, "w+") as f:
                f.write("")

        # Write a command template
        with open(os.path.join(ws1.config_dir, "full_command.tpl"), "w+") as f:
            f.write("{command}")

        ws1._re_read()

        workspace("setup", "--dry-run", global_args=["-w", workspace_name])

        out_files = glob.glob(os.path.join(ws1.log_dir, "**", "*.out"), recursive=True)

        assert search_files_for_string(
            out_files,
            "Would download https://www2.mmm.ucar.edu/wrf/users/benchmark/v422/v42_bench_conus12km.tar.gz",
        )

        # Test software directories
        software_dirs = ["wrfv4", "wrfv4-portable"]
        software_base_dir = ws1.software_dir
        assert os.path.exists(software_base_dir)
        for software_dir in software_dirs:
            software_path = os.path.join(software_base_dir, "spack", software_dir)
            assert os.path.exists(software_path)

            spack_file = os.path.join(software_path, "spack.yaml")
            assert os.path.exists(spack_file)
            for file in aux_software_files:
                if not file.endswith(".yaml"):
                    file_path = os.path.join(software_path, file)
                    assert os.path.exists(file_path)

        expected_experiments = [
            "scaling_1_part1_wrfv4",
            "scaling_2_part1_wrfv4",
            "scaling_4_part1_wrfv4",
            "scaling_8_part1_wrfv4",
            "scaling_16_part1_wrfv4",
            "scaling_1_part2_wrfv4",
            "scaling_2_part2_wrfv4",
            "scaling_4_part2_wrfv4",
            "scaling_8_part2_wrfv4",
            "scaling_16_part2_wrfv4",
            "scaling_1_part1_wrfv4-portable",
            "scaling_2_part1_wrfv4-portable",
            "scaling_4_part1_wrfv4-portable",
            "scaling_8_part1_wrfv4-portable",
            "scaling_16_part1_wrfv4-portable",
            "scaling_1_part2_wrfv4-portable",
            "scaling_2_part2_wrfv4-portable",
            "scaling_4_part2_wrfv4-portable",
            "scaling_8_part2_wrfv4-portable",
            "scaling_16_part2_wrfv4-portable",
        ]

        # Test experiment directories
        for exp in expected_experiments:
            exp_dir = os.path.join(ws1.root, "experiments", "wrfv4", "CONUS_12km", exp)
            assert os.path.isdir(exp_dir)
            assert os.path.exists(os.path.join(exp_dir, "execute_experiment"))
            assert os.path.exists(os.path.join(exp_dir, "full_command"))

            license_inc_path = os.path.join(ws1.root, "shared", "licenses", "wrfv4", "license.inc")
            with open(os.path.join(exp_dir, "full_command")) as f:
                data = f.read()
                # Test the license exists
                assert f". {license_inc_path}" in data

                # Test the required environment variables exist
                assert 'export OMP_NUM_THREADS="1"' in data
                assert "export TEST_VAR=1" in data
                assert "unset TEST_VAR" in data

                # Test the expected portions of the execution command exist
                assert "sed -i -e 's/ start_hour.*/ start_hour" in data
                assert "sed -i -e 's/ restart .*/ restart" in data
                assert re.search("\nmpirun", data)
                assert "wrf.exe" in data

                # Test the run script has a reference to the experiment log file
                assert os.path.join(exp_dir, f"{exp}.out") in data

            assert os.path.isdir(os.path.join(ws1.root, "shared"))
            assert os.path.isdir(os.path.join(ws1.root, "shared", "licenses"))
            assert os.path.isdir(os.path.join(ws1.root, "shared", "licenses", "wrfv4"))
            assert os.path.exists(license_inc_path)

            with open(license_inc_path) as f:
                data = f.read()
                # Test the license is added to the include file
                assert "export WRF_LICENSE=port@server" in data
                assert 'export WRF_CERTIFICATE_PATH="/fake/lic/path"' in data

            with open(os.path.join(exp_dir, "execute_experiment")) as f:
                data = f.read()

                # Test the required environment variables exist
                assert 'export OMP_NUM_THREADS="1"' in data
                assert "export TEST_VAR=1" in data
                assert "unset TEST_VAR" in data

                # Test the expected portions of the execution command exist
                assert "sed -i -e 's/ start_hour.*/ start_hour" in data
                assert "sed -i -e 's/ restart .*/ restart" in data
                assert "mpirun" in data
                assert "wrf.exe" in data

                # Test the run script has a reference to the experiment log file
                assert os.path.join(exp_dir, f"{exp}.out") in data

                # Test that spack is used
                assert "spack env activate" in data

            # Create fake figures of merit.
            with open(os.path.join(exp_dir, "rsl.out.base"), "w+") as f:
                for i in range(1, 6):
                    f.write(f"Timing for main: time 2019-11-27_00:00:00 on domain 1: {i}{i}.{i}\n")
                f.write("wrf: SUCCESS COMPLETE WRF\n")

            # Create files that match archive patterns
            new_file = os.path.join(exp_dir, "rsl.error.base")

            f = open(new_file, "w+")
            f.close()

        tmp_results_file = os.path.join(ws1.root, "temp.results.txt")
        if not os.path.exists(ws1.results_dir):
            os.makedirs(ws1.results_dir)
        symlink_results_file = os.path.join(ws1.results_dir, "results.latest.txt")
        # Temporarily store some temp data in the "latest" result and check it
        # gets updated
        with open(tmp_results_file, "w+") as f:
            f.write("Dummy data...")
        os.symlink(tmp_results_file, symlink_results_file)

        workspace("analyze", "-f", "text", "json", "yaml", global_args=["-w", workspace_name])

        text_results_files = glob.glob(os.path.join(ws1.results_dir, "results*.txt"))
        json_results_files = glob.glob(os.path.join(ws1.results_dir, "results*.json"))
        yaml_results_files = glob.glob(os.path.join(ws1.results_dir, "results*.yaml"))

        # Match both the file and the symlink
        assert len(text_results_files) == 2
        assert len(json_results_files) == 2
        assert len(yaml_results_files) == 2

        for text_result in text_results_files:
            with open(text_result) as f:
                data = f.read()
                assert "Tags =" in data
                assert "Average Timestep Time = 33.3 s" in data
                assert "Cumulative Timestep Time = 166.5 s" in data
                assert "Minimum Timestep Time = 11.1 s" in data
                assert "Maximum Timestep Time = 55.5 s" in data
                assert "Avg. Max Ratio Time = 0.6" in data
                assert "Number of timesteps = 5" in data
                assert "Software definitions:" in data
                assert "spack packages:" in data

        workspace("archive", global_args=["-w", workspace_name])

        assert ws1.latest_archive
        assert os.path.exists(ws1.latest_archive_path)

        for exp in expected_experiments:
            exp_dir = os.path.join(
                ws1.latest_archive_path, "experiments", "wrfv4", "CONUS_12km", exp
            )
            assert os.path.isdir(exp_dir)
            assert os.path.exists(os.path.join(exp_dir, "execute_experiment"))
            assert os.path.exists(os.path.join(exp_dir, "full_command"))
            assert os.path.exists(os.path.join(exp_dir, "rsl.out.base"))
            assert os.path.exists(os.path.join(exp_dir, "rsl.error.base"))




[docs]
@pytest.mark.maybeslow
def test_wrfv4_no_pkg_man_dry_run(mutable_config, mutable_mock_workspace_path, workspace_name):
    test_config = """
ramble:
  variables:
    mpi_command: 'mpirun -n {n_ranks} -ppn {processes_per_node}'
    batch_submit: 'batch_submit {execute_experiment}'
    partition: ['part1', 'part2']
    processes_per_node: ['16', '36']
    n_ranks: '{processes_per_node}*{n_nodes}'
    n_threads: '1'
  applications:
    wrfv4:
      variables:
        env_name: ['wrfv4', 'wrfv4-portable']
      workloads:
        CONUS_12km:
          experiments:
            scaling_{n_nodes}_{partition}_{env_name}:
              success_criteria:
              - name: 'timing'
                mode: 'string'
                match: '.*Timing for main.*'
                file: '{experiment_run_dir}/rsl.out.base'
              env_vars:
                set:
                  OMP_NUM_THREADS: '{n_threads}'
                  TEST_VAR: '1'
                append:
                - var-separator: ', '
                  vars:
                    TEST_VAR: 'add_var'
                - paths:
                    TEST_VAR: 'new_path'
                prepend:
                - paths:
                    TEST_VAR: 'pre_path'
                unset:
                - TEST_VAR
              variables:
                wrf_path: '/not/a/real/path'
                n_nodes: ['1', '2', '4', '8', '16']
              matrix:
              - n_nodes
              - env_name
"""

    test_licenses = """
licenses:
  wrfv4:
    set:
      WRF_LICENSE: port@server
"""

    with ramble.workspace.create(workspace_name) as ws1:
        ws1.write()

        config_path = os.path.join(ws1.config_dir, ramble.workspace.CONFIG_FILE_NAME)
        license_path = os.path.join(ws1.config_dir, "licenses.yaml")

        aux_software_path = os.path.join(
            ws1.config_dir, ramble.workspace.AUXILIARY_SOFTWARE_DIR_NAME
        )
        aux_software_files = ["packages.yaml", "my_test.sh"]

        with open(config_path, "w+") as f:
            f.write(test_config)

        with open(license_path, "w+") as f:
            f.write(test_licenses)

        for file in aux_software_files:
            file_path = os.path.join(aux_software_path, file)
            with open(file_path, "w+") as f:
                f.write("")

        # Write a command template
        with open(os.path.join(ws1.config_dir, "full_command.tpl"), "w+") as f:
            f.write("{command}")

        ws1._re_read()

        workspace("setup", "--dry-run", global_args=["-w", workspace_name])

        out_files = glob.glob(os.path.join(ws1.log_dir, "**", "*.out"), recursive=True)

        assert search_files_for_string(
            out_files,
            "Would download https://www2.mmm.ucar.edu/wrf/users/benchmark/v422/v42_bench_conus12km.tar.gz",
        )

        expected_experiments = [
            "scaling_1_part1_wrfv4",
            "scaling_2_part1_wrfv4",
            "scaling_4_part1_wrfv4",
            "scaling_8_part1_wrfv4",
            "scaling_16_part1_wrfv4",
            "scaling_1_part2_wrfv4",
            "scaling_2_part2_wrfv4",
            "scaling_4_part2_wrfv4",
            "scaling_8_part2_wrfv4",
            "scaling_16_part2_wrfv4",
            "scaling_1_part1_wrfv4-portable",
            "scaling_2_part1_wrfv4-portable",
            "scaling_4_part1_wrfv4-portable",
            "scaling_8_part1_wrfv4-portable",
            "scaling_16_part1_wrfv4-portable",
            "scaling_1_part2_wrfv4-portable",
            "scaling_2_part2_wrfv4-portable",
            "scaling_4_part2_wrfv4-portable",
            "scaling_8_part2_wrfv4-portable",
            "scaling_16_part2_wrfv4-portable",
        ]

        # Test experiment directories
        for exp in expected_experiments:
            exp_dir = os.path.join(ws1.root, "experiments", "wrfv4", "CONUS_12km", exp)
            assert os.path.isdir(exp_dir)
            assert os.path.exists(os.path.join(exp_dir, "execute_experiment"))
            assert os.path.exists(os.path.join(exp_dir, "full_command"))

            license_inc_path = os.path.join(ws1.root, "shared", "licenses", "wrfv4", "license.inc")
            with open(os.path.join(exp_dir, "full_command")) as f:
                data = f.read()
                # Test the license exists
                assert f". {license_inc_path}" in data

                # Test the required environment variables exist
                assert 'export OMP_NUM_THREADS="1"' in data
                assert "export TEST_VAR=1" in data
                assert "unset TEST_VAR" in data

                # Test the expected portions of the execution command exist
                assert "sed -i -e 's/ start_hour.*/ start_hour" in data
                assert "sed -i -e 's/ restart .*/ restart" in data
                assert "mpirun" in data
                assert "wrf.exe" in data

                # Test the run script has a reference to the experiment log file
                assert os.path.join(exp_dir, f"{exp}.out") in data

            assert os.path.isdir(os.path.join(ws1.root, "shared"))
            assert os.path.isdir(os.path.join(ws1.root, "shared", "licenses"))
            assert os.path.isdir(os.path.join(ws1.root, "shared", "licenses", "wrfv4"))
            assert os.path.exists(license_inc_path)

            with open(license_inc_path) as f:
                data = f.read()
                # Test the license is added to the include file
                assert "export WRF_LICENSE=port@server" in data

            with open(os.path.join(exp_dir, "execute_experiment")) as f:
                data = f.read()

                # Test the required environment variables exist
                assert 'export OMP_NUM_THREADS="1"' in data
                assert "export TEST_VAR=1" in data
                assert "unset TEST_VAR" in data

                # Test the expected portions of the execution command exist
                assert "sed -i -e 's/ start_hour.*/ start_hour" in data
                assert "sed -i -e 's/ restart .*/ restart" in data
                assert "mpirun" in data
                assert "wrf.exe" in data

                # Test the run script has a reference to the experiment log file
                assert os.path.join(exp_dir, f"{exp}.out") in data

            # Create fake figures of merit.
            with open(os.path.join(exp_dir, "rsl.out.base"), "w+") as f:
                for i in range(1, 6):
                    f.write(f"Timing for main: time 2019-11-27_00:00:00 on domain 1: {i}{i}.{i}\n")
                f.write("wrf: SUCCESS COMPLETE WRF\n")

            # Create files that match archive patterns
            new_file = os.path.join(exp_dir, "rsl.error.base")

            f = open(new_file, "w+")
            f.close()

        tmp_results_file = os.path.join(ws1.root, "temp.results.txt")
        if not os.path.exists(ws1.results_dir):
            os.makedirs(ws1.results_dir)
        symlink_results_file = os.path.join(ws1.results_dir, "results.latest.txt")
        # Temporarily store some temp data in the "latest" result and check it
        # gets updated
        with open(tmp_results_file, "w+") as f:
            f.write("Dummy data...")
        os.symlink(tmp_results_file, symlink_results_file)

        workspace("analyze", "-f", "text", "json", "yaml", global_args=["-w", workspace_name])

        text_results_files = glob.glob(os.path.join(ws1.results_dir, "results*.txt"))
        json_results_files = glob.glob(os.path.join(ws1.results_dir, "results*.json"))
        yaml_results_files = glob.glob(os.path.join(ws1.results_dir, "results*.yaml"))

        # Match both the file and the symlink
        assert len(text_results_files) == 2
        assert len(json_results_files) == 2
        assert len(yaml_results_files) == 2

        for text_result in text_results_files:
            with open(text_result) as f:
                data = f.read()
                assert "Tags =" in data
                assert "Average Timestep Time = 33.3 s" in data
                assert "Cumulative Timestep Time = 166.5 s" in data
                assert "Minimum Timestep Time = 11.1 s" in data
                assert "Maximum Timestep Time = 55.5 s" in data
                assert "Avg. Max Ratio Time = 0.6" in data
                assert "Number of timesteps = 5" in data

        workspace("archive", global_args=["-w", workspace_name])

        assert ws1.latest_archive
        assert os.path.exists(ws1.latest_archive_path)

        for exp in expected_experiments:
            exp_dir = os.path.join(
                ws1.latest_archive_path, "experiments", "wrfv4", "CONUS_12km", exp
            )
            assert os.path.isdir(exp_dir)
            assert os.path.exists(os.path.join(exp_dir, "execute_experiment"))
            assert os.path.exists(os.path.join(exp_dir, "full_command"))
            assert os.path.exists(os.path.join(exp_dir, "rsl.out.base"))
            assert os.path.exists(os.path.join(exp_dir, "rsl.error.base"))