Usage#

We’ve designed the package so it is easy to write scripts that run MOBO for a particular JETTO problem. To do so, you need to:

Define your inputs
Define your objective functions
Write the main evaluation script

In this section, we run through the ecrh_q_optimisation example from theo-brown/jetto-mobo; this formed the basis of our SOFE2023 poster, looking at MOBO of the ECRH input to find good q-profiles.

1. Define inputs#

First, we define the ECRH parameterisation to use. As ECRH is a plasma profile, we decorate it with @jetto_mobo.inputs.plasma_profile, which tells the optimiser to expect a function of the form f(xrho, parameters).

examples/ecrh_q_optimisation/ecrh_inputs.py#

from typing import Union

import numpy as np
from scipy.interpolate import CubicSpline
from scipy.special import comb

from jetto_mobo.inputs import plasma_profile


@plasma_profile
def marsden_piecewise_linear(xrho: np.ndarray, parameters: np.ndarray) -> np.ndarray:
    """
    12-parameter piecewise linear profile, originally designed for ECRH profiles by Stephen Marsden.

    The parameters are converted into nine (xrho, power) knots, which are joined
    by straight-line segments. Points of ``xrho`` that no segment covers with a
    positive value are left at zero.

    Parameters
    ----------
    xrho : np.ndarray
        Normalised radial position.
    parameters : np.ndarray
        Profile parameters:
        - parameters[0]: on-axis peak power
        - parameters[1]: on-axis descent end power, as a fraction of the on-axis peak power
        - parameters[2]: on-axis descent end xrho
        - parameters[3]: minimum power fraction (weighting of the minimum power against the
          on-axis descent end power at the point midway between them)
        - parameters[4]: minimum power
        - parameters[5]: minimum xrho
        - parameters[6]: off-axis shaper 1 fraction
        - parameters[7]: off-axis shaper 2 fraction
        - parameters[8]: off-axis peak power
        - parameters[9]: off-axis peak xrho, as an offset from the minimum xrho
        - parameters[10]: turn-off shaper fraction (of the off-axis peak power)
        - parameters[11]: turn-off xrho, as an offset from the off-axis peak xrho

    Returns
    -------
    np.ndarray
        Profile evaluated at each point of ``xrho``.

    Raises
    ------
    ValueError
        If the number of parameters is not 12, or if any parameter lies outside its bounds.
    """
    if len(parameters) != 12:
        raise ValueError(f"Expected 12 parameters, got {len(parameters)}.")

    lower_bounds = np.array([0, 0.05, 0.01, 0.1, 0, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1])
    upper_bounds = np.array([1, 1, 0.09, 1, 1, 0.29, 0.9, 0.9, 1, 0.75, 0.9, 0.45])
    is_outside_bounds = (parameters < lower_bounds) | (parameters > upper_bounds)
    if np.any(is_outside_bounds):
        raise ValueError(
            f"Parameter(s) outside of bounds at indices {np.nonzero(is_outside_bounds)}"
        )

    # Power (y) coordinate of each knot
    on_axis_peak_power = parameters[0]
    on_axis_descent_end_power = parameters[1] * on_axis_peak_power
    minimum_power = parameters[4]
    minimum_shaper_power = (
        parameters[3] * minimum_power + (1 - parameters[3]) * on_axis_descent_end_power
    )
    off_axis_peak_power = parameters[8]
    off_axis_shaper_2_power = (
        parameters[7] * off_axis_peak_power + (1 - parameters[7]) * minimum_power
    )
    off_axis_shaper_1_power = (
        parameters[6] * off_axis_shaper_2_power + (1 - parameters[6]) * minimum_power
    )
    turn_off_shaper_power = parameters[10] * off_axis_peak_power
    turn_off_power = 0

    # Radial (x) coordinate of each knot
    on_axis_peak_xrho = 0
    on_axis_descent_end_xrho = parameters[2]
    minimum_xrho = parameters[5]
    minimum_shaper_xrho = (minimum_xrho + on_axis_descent_end_xrho) / 2
    off_axis_peak_xrho = minimum_xrho + parameters[9]
    turn_off_xrho = off_axis_peak_xrho + parameters[11]
    off_axis_shaper_1_xrho = 2 / 3 * minimum_xrho + 1 / 3 * off_axis_peak_xrho
    off_axis_shaper_2_xrho = 1 / 3 * minimum_xrho + 2 / 3 * off_axis_peak_xrho
    turn_off_shaper_xrho = 1 / 2 * off_axis_peak_xrho + 1 / 2 * turn_off_xrho

    xdata = [
        on_axis_peak_xrho,
        on_axis_descent_end_xrho,
        minimum_shaper_xrho,
        minimum_xrho,
        off_axis_shaper_1_xrho,
        off_axis_shaper_2_xrho,
        off_axis_peak_xrho,
        turn_off_shaper_xrho,
        turn_off_xrho,
    ]
    ydata = [
        on_axis_peak_power,
        on_axis_descent_end_power,
        minimum_shaper_power,
        minimum_power,
        off_axis_shaper_1_power,
        off_axis_shaper_2_power,
        off_axis_peak_power,
        turn_off_shaper_power,
        turn_off_power,
    ]

    # Linearly interpolate between each consecutive pair of knots.
    qece = np.zeros(len(xrho))
    knots = list(zip(xdata, ydata))
    for (x_start, y_start), (x_end, y_end) in zip(knots[:-1], knots[1:]):
        # A two-point spline with zero second derivative at both ends is a straight line.
        # extrapolate=False makes it NaN outside [x_start, x_end].
        segment = CubicSpline(
            [x_start, x_end],
            [y_start, y_end],
            bc_type=[(2, 0), (2, 0)],
            extrapolate=False,
        )
        values = segment(xrho)
        # Keep the existing profile value wherever this segment is NaN or non-positive.
        qece = np.where(values > 0, values, qece)

    return qece

We also need to define the bounds on the parameter values.

examples/ecrh_q_optimisation/ecrh_inputs.py#

# Bounds on the 12 parameters of marsden_piecewise_linear.
# Row 0 holds the lower bounds and row 1 the upper bounds; the values are the
# same as the lower_bounds / upper_bounds arrays checked inside that function.
marsden_piecewise_linear_bounds = np.array(
    [
        [0, 0.05, 0.01, 0.1, 0, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1, 0.1],
        [1, 1, 0.09, 1, 1, 0.29, 0.9, 0.9, 1, 0.75, 0.9, 0.45],
    ]
)


def bernstein(i: Union[int, np.ndarray], n: int, t: np.ndarray) -> np.ndarray:
    r"""
    Evaluate the Bernstein basis polynomials of degree n at t.

    $$
    b_{i,n}(t) = \binom{n}{i} t^i (1-t)^{n-i}
    $$

    Parameters
    ----------
    i : Union[int, np.ndarray]
        Index (or array of indices) of the basis polynomial(s) to evaluate.
    n : int
        Degree of the basis.
    t : np.ndarray
        Points at which to evaluate the basis polynomials.

    Returns
    -------
    np.ndarray
        Basis polynomial values. The outer product is taken over t and i, so for
        1D arrays t (length M) and i (length K) the result has shape (M, K).
    """
    return comb(n, i) * np.power.outer(t, i) * np.power.outer(1 - t, n - i)


def bezier_parametric(t: np.ndarray, control_points: np.ndarray) -> np.ndarray:
    """
    Evaluate a Bezier curve at the given parametric coordinates.

    Parameters
    ----------
    t : np.ndarray
        Array of parametric coordinate values, length M.
    control_points : np.ndarray
        Array of shape (N, 2), giving N control points in the form [[x1, y1], ..., [xN, yN]].

    Returns
    -------
    np.ndarray
        Bezier curve defined by the control points, evaluated at t. Shape (M, 2), where [:, 0] is x and [:, 1] y coordinates.

    Raises
    ------
    ValueError
        If control_points is not a 2D array with exactly two columns.
    """
    # Reject anything that is not an (N, 2) array
    if control_points.ndim != 2 or control_points.shape[1] != 2:
        raise ValueError(
            f"control_points must be an array of shape (N, 2) (got {control_points.shape})."
        )

    # N control points define a curve of degree N - 1
    n_points = len(control_points)
    weights = bernstein(np.arange(n_points), n_points - 1, t)

    # Each curve point is the basis-weighted sum of the control points
    return weights @ control_points


def bezier_x(
    x: np.ndarray, control_points: np.ndarray, parametric_resolution: int = int(1e3)
) -> np.ndarray:
    """
    Evaluate the y coordinate of a Bezier curve at the given x coordinates.

    The curve is first sampled on a uniform grid of the parametric coordinate t.
    The sampled x values are then used to interpolate the value of t that
    corresponds to each requested x, and the curve is re-evaluated at those t.

    Parameters
    ----------
    x : np.ndarray
        Array of x coordinates to evaluate the bezier curve at.
    control_points : np.ndarray
        Array of shape (N, 2), giving N control points in the form [[x1, y1], ..., [xN, yN]].
    parametric_resolution : int, default int(1e3)
        Number of points to evaluate the bezier curve at to obtain the implicit/parametric coordinates.

    Returns
    -------
    np.ndarray
        Array of y coordinates, evaluated at x.
    """
    t = np.linspace(0, 1, parametric_resolution)
    implicit_points_x = bezier_parametric(t, control_points)[:, 0]

    # t_x is the implicit/parametric value corresponding to each x.
    # NOTE(review): np.interp requires its sample x-coordinates to be increasing, and
    # this is not checked here; control points whose curve doubles back in x will
    # give meaningless results.
    t_x = np.interp(x, implicit_points_x, t)

    # Only the y coordinate of the curve at t_x is needed.
    return bezier_parametric(t_x, control_points)[:, 1]


# Hyperparameters of constrained_bezier_profile:
# - on_axis_smoothness is the x coordinate of the second control point, which shares
#   the first control point's y value;
# - off_axis_smoothness is the x distance between the last two control points,
#   both of which have y = 0.
on_axis_smoothness = 0.05
off_axis_smoothness = 0.05


@plasma_profile
def constrained_bezier_profile(xrho: np.ndarray, parameters: np.ndarray) -> np.ndarray:
    """
    Bezier profile with extra fixed control points that shape both ends of the curve.

    Parameters are of the form [y0, x1, y1, ..., xn].
    Control points are [[0, y0], [on_axis_smoothness, y0], [x1 * xn, y1], ..., [xn - off_axis_smoothness, 0], [xn, 0]].

    Raises
    ------
    ValueError
        If the x and y control point arrays end up with different shapes.
    """
    y0, xn = parameters[0], parameters[-1]
    # Interior x parameters are used as given (not sorted or cumulatively
    # multiplied), only scaled by xn.
    interior_x = parameters[1:-1:2] * xn
    interior_y = parameters[2:-1:2]

    control_points_x = np.concatenate(
        [[0, on_axis_smoothness], interior_x, [xn - off_axis_smoothness, xn]]
    )
    control_points_y = np.concatenate([[y0, y0], interior_y, [0, 0]])
    if control_points_x.shape != control_points_y.shape:
        raise ValueError(
            f"control_points_x and control_points_y must have the same shape (got {control_points_x.shape} and {control_points_y.shape})."
        )

    # Pair the coordinates up into an (N, 2) array of control points
    control_points = np.array([control_points_x, control_points_y]).T
    return bezier_x(xrho, control_points, parametric_resolution=int(1e3))


@plasma_profile
def bezier_profile(xrho: np.ndarray, parameters: np.ndarray) -> np.ndarray:
    """
    Bezier profile that starts at (0, y0) and ends at (xn, 0).

    Parameters are of the form [y0, x1, y1, ..., xn].
    Control points are [[0, y0], [x1 * xn, y1], ..., [xn, 0]].

    Raises
    ------
    ValueError
        If the x and y control point arrays end up with different shapes.
    """
    y0, xn = parameters[0], parameters[-1]
    # Interior x parameters are scaled by xn
    interior_x = parameters[1:-1:2] * xn
    interior_y = parameters[2:-1:2]

    control_points_x = np.concatenate([[0], interior_x, [xn]])
    control_points_y = np.concatenate([[y0], interior_y, [0]])
    if control_points_x.shape != control_points_y.shape:
        raise ValueError(
            f"control_points_x and control_points_y must have the same shape (got {control_points_x.shape} and {control_points_y.shape})."
        )

    # Pair the coordinates up into an (N, 2) array of control points
    control_points = np.array([control_points_x, control_points_y]).T
    return bezier_x(xrho, control_points, parametric_resolution=int(1e3))

2. Define objective functions#

Next, we define the objective functions. For our q-profile optimisation problem, we want to do multi-objective optimisation. Each of the objectives can be computed from the JETTO profiles and timetraces datasets:

examples/ecrh_q_optimisation/q_objectives.py#

from typing import Union

import numpy as np
from jetto_tools.results import JettoResults
from netCDF4 import Dataset

from jetto_mobo.objectives import objective


def soft_hat(
    x: Union[float, np.ndarray],
    x_lower: float = 0,
    y_lower: float = 1e-3,
    x_plateau_start: float = 0,
    x_plateau_end: float = 0,
    x_upper: float = 0,
    y_upper: float = 1e-3,
) -> np.ndarray:
    """
    Smooth tophat function.

    Passes through (x_lower, y_lower), (x_plateau_start, 1), (x_plateau_end, 1), (x_upper, y_upper).
    Squared exponential decay below x_plateau_start and above x_plateau_end, with rate of decay such that y=y_lower at x=x_lower and y=y_upper at x=x_upper.

    Note that x_lower must differ from x_plateau_start, and x_upper from x_plateau_end;
    otherwise the corresponding decay rate involves a division by zero.

    Parameters
    ----------
    x : Union[float, np.ndarray]
        Input value
    x_lower : float, optional
        x-value at which y=y_lower (default: 0)
    y_lower : float, optional
        y-value at x=x_lower (default: 1e-3)
    x_plateau_start : float, optional
        x-value at which the plateau starts (default: 0)
    x_plateau_end : float, optional
        x-value at which the plateau ends (default: 0)
    x_upper : float, optional
        x-value at which y=y_upper (default: 0)
    y_upper : float, optional
        y-value at x=x_upper (default: 1e-3)

    Returns
    -------
    np.ndarray
        Smooth objective value
    """
    # np.piecewise allocates its output with the dtype of x, so integer input
    # would truncate every value to 0 or 1; work in floating point instead.
    x = np.asarray(x, dtype=float)

    # Decay rates chosen so the curve passes through (x_lower, y_lower) and (x_upper, y_upper)
    k_lower = -np.log(y_lower) / np.power(x_lower - x_plateau_start, 2)
    k_upper = -np.log(y_upper) / np.power(x_upper - x_plateau_end, 2)
    return np.piecewise(
        x,
        [
            x < x_plateau_start,
            (x >= x_plateau_start) & (x <= x_plateau_end),
            x > x_plateau_end,
        ],
        [
            lambda x: np.exp(-k_lower * np.power(x - x_plateau_start, 2)),
            1,
            lambda x: np.exp(-k_upper * np.power(x - x_plateau_end, 2)),
        ],
    )

We can then use @jetto_mobo.objectives.objective to decorate a function that takes a JettoResults object and returns the vector of objective values:

examples/ecrh_q_optimisation/q_objectives.py#

def softmax(x: np.ndarray) -> np.ndarray:
    """
    Softmax of x, normalised over all of its elements.

    Parameters
    ----------
    x : np.ndarray
        Input values.

    Returns
    -------
    np.ndarray
        exp(x) / sum(exp(x)), with the same shape as x.
    """
    x = np.asarray(x)
    if x.size == 0:
        # Nothing to normalise; the maximum of an empty array is undefined.
        return np.exp(x)
    # Subtracting the maximum leaves the result unchanged mathematically but
    # stops exp() overflowing to inf (and the ratio becoming NaN) for large inputs.
    exp = np.exp(x - np.max(x))
    return exp / np.sum(exp)


def q0_close_to_qmin(profiles: Dataset, timetraces: Dataset) -> np.ndarray:
    """
    Score the distance between the last Q0 and QMIN timetrace values.

    1 if q0 = qmin, decaying to 0.5 at |q0 - qmin| = 2.
    """
    q0 = timetraces["Q0"][-1].data
    qmin = timetraces["QMIN"][-1].data
    return soft_hat(
        np.abs(q0 - qmin),
        # The lower branch is never reached, because the distance is non-negative
        x_lower=-1,
        y_lower=1e-3,
        # Zero-width plateau at a distance of 0
        x_plateau_start=0,
        x_plateau_end=0,
        x_upper=2,
        y_upper=0.5,
    )


def qmin_close_to_centre(profiles: Dataset, timetraces: Dataset) -> np.ndarray:
    """
    Score the last value of the ROQM timetrace (position of the minimum of q).

    1 if argmin(q) = 0, decaying to 1e-3 at argmin(q) = 1.
    """
    radius_of_qmin = timetraces["ROQM"][-1].data
    return soft_hat(
        radius_of_qmin,
        # The lower branch is not used, as 0 < x < 1
        x_lower=-1,
        y_lower=1e-3,
        # Zero-width plateau at the centre
        x_plateau_start=0,
        x_plateau_end=0,
        x_upper=1,
        y_upper=1e-3,
    )


def qmin_in_safe_region(profiles: Dataset, timetraces: Dataset) -> float:
    """1 if qmin between 2.2 and 2.5, decaying to 0.5 at 2 and 3"""

If instead we wanted to do single-objective optimisation, we can use jetto_mobo.objectives.objective(weights=True) to decorate a scalar weighted version of the vector objective function:

examples/ecrh_q_optimisation/q_objectives.py#

        x_lower=2.2,
        y_lower=0.5,
        x_plateau_start=2.2,
        x_plateau_end=2.5,
        x_upper=3,
        y_upper=0.5,
    )


def q_increasing(profiles: Dataset, timetraces: Dataset) -> np.ndarray:
    """
    Score the fraction of the last Q profile over which q is increasing.

    1 if q is increasing at every radial point, decaying to 1e-3 if q is non-increasing at every radial point.
    """
    q_gradient = np.gradient(profiles["Q"][-1].data)
    # Fraction of curve where q is increasing
    fraction_increasing = np.mean(q_gradient > 0)
    return soft_hat(
        fraction_increasing,
        x_lower=0,
        y_lower=1e-3,
        # Zero-width plateau at a fraction of 1
        x_plateau_start=1,
        x_plateau_end=1,
        # The upper branch is not used, as 0 < x < 1
        x_upper=2,
        y_upper=1e-3,
    )


def maximise_radius_at_which_q_is_value(
    profiles: Dataset, timetraces: Dataset, value: float
) -> np.ndarray:
    """
    Score the radius at which q first reaches ``value`` outside the minimum of q.

    1 if q=value at r>0.8 decaying to 0.5 if q=value at r=0.5

    Note that this excludes points where q=value but r < argmin(q).

    Raises
    ------
    IndexError
        If no radial point has q >= value at or beyond the ROQM radius.
    """
    xrho = profiles["XRHO"][-1].data
    q_reaches_value = profiles["Q"][-1].data >= value
    beyond_qmin = xrho >= timetraces["ROQM"][-1].data
    # First radial index that satisfies both conditions
    first_index = np.where(q_reaches_value & beyond_qmin)[0][0]
    return soft_hat(
        xrho[first_index],
        x_lower=0.5,
        y_lower=0.5,
        x_plateau_start=0.8,
        x_plateau_end=1,
        # The upper branch is not used, as 0 < x < 1
        x_upper=2,
        y_upper=2,
    )


@objective
def q_vector_objective(results: JettoResults) -> np.ndarray:
    """
    Six objective values describing the shape of the q-profile.

    Loads the profiles and timetraces from ``results`` and passes them to
    ``q_vector_objective_from_cdf``.

    Returns
    -------
    np.ndarray
        Vector of objective values:
        - Reduced 'height' of reversed shear at axis (q0 close to qmin)
        - Reduced 'width' of reversed shear at axis (qmin close to r=0)
        - Monotonic q (q increasing at every radial point)
        - qmin in safe region (2 < qmin < 3)
        - Maximise radius at which q=3
        - Maximise radius at which q=4
    """
    return q_vector_objective_from_cdf(
        results.load_profiles(), results.load_timetraces()
    )


def q_vector_objective_from_cdf(profiles: Dataset, timetraces: Dataset) -> np.ndarray:
    """Evaluate the six q-profile objectives from the profiles and timetraces datasets."""
    # Objectives that take only the two datasets
    shape_objectives = [
        objective_function(profiles, timetraces)
        for objective_function in (
            q0_close_to_qmin,
            qmin_close_to_centre,
            q_increasing,
            qmin_in_safe_region,
        )
    ]
    # Radius objectives for q=3 and q=4
    radius_objectives = [
        maximise_radius_at_which_q_is_value(profiles, timetraces, q_value)
        for q_value in (3, 4)
    ]
    return np.array(shape_objectives + radius_objectives)


def q_constraints(results: JettoResults) -> np.ndarray:
    """Constraint values for the q profile, computed from a JettoResults object.

    Constraint functions are of the form ``g(x) <= 0`` (i.e. negative if the constraint is satisfied).

    Returns
    -------
    np.ndarray
        Vector of constraint values:
        - qmin > 2
        - qmin < 3
    """
    profiles = results.load_profiles()
    timetraces = results.load_timetraces()
    return q_constraints_from_cdf(profiles, timetraces)


def q_constraints_from_cdf(profiles: Dataset, timetraces: Dataset) -> np.ndarray:
    """Return [2 - qmin, qmin - 3] using the last value of the QMIN timetrace."""
    qmin = timetraces["QMIN"][-1].data
    lower_violation = 2 - qmin  # negative when qmin > 2
    upper_violation = qmin - 3  # negative when qmin < 3
    return np.array([lower_violation, upper_violation])


@objective(weights=True)
def q_scalar_objective(results: JettoResults, weights: np.ndarray) -> np.ndarray:
    """
    Scalar objective: q_vector_objective(results) combined with ``weights`` via ``@``.
    """
    return q_vector_objective(results) @ weights


def q_scalar_objective_from_cdf(
    profiles: Dataset, timetraces: Dataset, weights: np.ndarray
) -> np.ndarray:
    """Weighted sum of q_vector_objective_from_cdf, taken directly from the datasets."""
    return q_vector_objective_from_cdf(profiles, timetraces) @ weights

3. Write the main evaluation script#

As the evaluation of the objective functions depends on the particular problem at hand, we haven’t yet implemented a general framework to run the MOBO loop. (If you think it would be useful, do get in touch!)

Consequently, you’ll have to write the evaluation by hand, using our pre-built wrappers.

3.1 Evaluation helper function#

We define a helper function that takes a set of parameters, creates a JETTO config, sends the config off to be run, and returns the relevant values (input, output, objective) on completion.

3.2 Data storage#

We also define a helper function to save our results to a file. Use your team’s preferred data format!

3.3 Argument parsing#

Because we want it to be easy to use our final script for multiple different runs, we use argparse to parse the command line arguments:

examples/ecrh_q_optimisation/main.py#

import argparse
import asyncio
import logging
import sys
from os import sched_getaffinity
from pathlib import Path
from typing import Tuple

import h5py
import jetto_tools
import numpy as np
import torch
from ecrh_inputs import (
    bezier_profile,
    constrained_bezier_profile,
    marsden_piecewise_linear,
    marsden_piecewise_linear_bounds,
)
from q_objectives import q_vector_objective
from utils import write_to_file

from jetto_mobo import acquisition, simulation, surrogate, utils

# Module-level logger: messages of level DEBUG and above are written to stdout.
logger = logging.getLogger(__name__)
logger.setLevel(logging.DEBUG)
logger.addHandler(logging.StreamHandler(sys.stdout))

3.4 Initialisation#

Important

Parameter bounds must be a tensor! If you initialised them as a numpy array, cast them to a tensor before continuing. We do this with:

examples/ecrh_q_optimisation/main.py#

parser.add_argument(

Before starting, we need to generate some initial candidates.

examples/ecrh_q_optimisation/main.py#

)
def _parse_torch_dtype(name: str) -> torch.dtype:
    """Convert a command-line string such as ``float64`` or ``torch.float64`` into a torch dtype."""
    dtype = getattr(torch, name.split(".")[-1], None)
    if not isinstance(dtype, torch.dtype):
        raise argparse.ArgumentTypeError(f"{name!r} is not a valid torch dtype")
    return dtype


parser.add_argument("--jetto_timelimit", type=int, default=10400)
parser.add_argument("--jetto_fail_value", type=float, default=0)
parser.add_argument("--discard_failures", action="store_true")
parser.add_argument("--sobol_only", action="store_true")
parser.add_argument("--n_xrho_points", type=int, default=150)
parser.add_argument("--batch_size", type=int, default=10)
parser.add_argument("--initial_batch_size", type=int, default=30)
parser.add_argument("--n_iterations", type=int, default=16)
parser.add_argument("--reference_values", type=float, nargs="+", default=None)
parser.add_argument(
    "--device",
    type=str,
    default=torch.device("cuda") if torch.cuda.is_available() else torch.device("cpu"),
)
# torch.dtype cannot be called with a string, so passing it as ``type`` made
# every explicit --dtype value fail; look the name up on the torch module instead.
parser.add_argument("--dtype", type=_parse_torch_dtype, default=torch.float64)
parser.add_argument(
    "--output_dir", type=Path, default=Path("data/piecewise_linear_mobo")
)
parser.add_argument(
    "--parameterisation",
    choices=["piecewise_linear", "bezier", "bezier2"],
    default="piecewise_linear",
)
parser.add_argument("--n_parameters", type=int, default=12)
parser.add_argument("--alpha", type=float, default=0.0)
parser.add_argument("--seed", type=int, default=0)
parser.add_argument("--resume", action="store_true")
args = parser.parse_args()

# Seed torch's random number generator
torch.manual_seed(args.seed)

# Number of objective values
n_objectives = 6

# Choose the ECRH profile function and the bounds on its parameters
if args.parameterisation == "piecewise_linear":
    ecrh_function = marsden_piecewise_linear
    parameter_bounds = torch.tensor(marsden_piecewise_linear_bounds)
elif args.parameterisation in ("bezier", "bezier2"):
    # Both Bezier variants take every parameter in [0, 1]
    ecrh_function = (
        constrained_bezier_profile
        if args.parameterisation == "bezier"
        else bezier_profile
    )
    parameter_bounds = torch.tensor([[0] * args.n_parameters, [1] * args.n_parameters])


# Reference values
if args.reference_values is None:
    reference_values = torch.tensor([0.0] * n_objectives)

3.5 Main loop#

Now we can bring it all together in the main loop.

examples/ecrh_q_optimisation/main.py#

    reference_values = torch.tensor(args.reference_values)
else:
    raise ValueError(
        f"Length of reference values ({len(args.reference_values)}) does not match number of objectives ({n_objectives})."
    )

# Failure behaviour
# Unless failed runs are discarded, NaN objective values are replaced in the
# optimisation loop by this fill value (taken from --jetto_fail_value).
if not args.discard_failures:
    failure_objective_value = args.jetto_fail_value


def _failed_outputs() -> Tuple[np.ndarray, np.ndarray, np.ndarray]:
    """NaN placeholders (ECRH profile, q profile, objective values) for a failed candidate."""
    return (
        np.full(args.n_xrho_points, np.nan),
        np.full(args.n_xrho_points, np.nan),
        np.full(n_objectives, np.nan),
    )


def evaluate(
    ecrh_parameters_batch: np.ndarray,
    batch_directory: Path,
) -> Tuple[np.ndarray, np.ndarray, np.ndarray]:
    """
    Evaluate a batch of ECRH parameters.

    Runs JETTO in parallel for each set of ECRH parameters, and returns the converged ECRH profiles and objective values.

    Parameters
    ----------
    ecrh_parameters_batch: np.ndarray
        One set of ECRH parameters per candidate (iterated over its first axis).
    batch_directory: Path
        Directory under which a ``candidate_{i}`` run directory is created for each candidate.

    Returns
    -------
    Tuple[np.ndarray, np.ndarray, np.ndarray]
        ``(converged_ecrh, converged_q, objective_values)``, each with one entry per
        result returned by the simulation. Entries for runs that failed, or whose
        profiles could not be loaded, are filled with NaN.
    """
    configs = {}

    for i, ecrh_parameters in enumerate(ecrh_parameters_batch):
        # Initialise config object
        config_directory = Path(f"{batch_directory}/candidate_{i}")
        config_object = simulation.create_config(
            template=args.jetto_template, directory=config_directory
        )

        # Set the ECRH function
        exfile = jetto_tools.binary.read_binary_file(config_object.exfile)
        exfile["QECE"][0] = ecrh_function(
            xrho=exfile["XRHO"][0], parameters=ecrh_parameters
        )
        jetto_tools.binary.write_binary_exfile(exfile, config_object.exfile)

        # Store in dict
        # Currently this is necessary as the JettoTools RunConfig does not store the directory path
        configs[config_object] = config_directory

    # Run asynchronously in parallel
    batch_output = asyncio.run(
        simulation.run_many(
            jetto_image=args.jetto_image,
            run_configs=configs,
            timelimit=args.jetto_timelimit,
        )
    )

    # Parse outputs
    converged_ecrh = []
    converged_q = []
    objective_values = []
    for results in batch_output:
        if results is None:
            logger.warning("JETTO failed to converge.")
            ecrh, q, objectives = _failed_outputs()
        else:
            try:
                profiles = results.load_profiles()
            except Exception:
                # Catch Exception rather than everything, so that KeyboardInterrupt and
                # SystemExit still propagate; keep the traceback in the log.
                logger.warning(
                    "Failed to load profiles. Maybe the file was corrupted?",
                    exc_info=True,
                )
                ecrh, q, objectives = _failed_outputs()
            else:
                ecrh = profiles["QECE"][-1]
                q = profiles["Q"][-1]
                objectives = q_vector_objective(results)
        converged_ecrh.append(ecrh)
        converged_q.append(q)
        objective_values.append(objectives)

    # Compress outputs
    for config_directory in configs.values():
        simulation.compress_jetto_dir(config_directory, delete=True)

    return (
        np.array(converged_ecrh),
        np.array(converged_q),
        np.array(objective_values),
    )


# Obtain the starting data set: either reload everything already stored in
# results.h5 (--resume), or generate and evaluate a fresh set of initial candidates.
# Both branches leave `ecrh_parameters`, `objective_values` and
# `completed_optimisation_steps` defined for the optimisation loop.
if args.resume:
    # TODO: Update to permit batched initialisation data
    logger.info("Resuming from file...")
    with h5py.File(args.output_dir / "results.h5", "r") as f:
        # Read initialisation data
        ecrh_parameters = [torch.tensor(f["initialisation/ecrh_parameters"][:])]
        objective_values = [torch.tensor(f["initialisation/objective_values"][:])]
        # Read any additional optimisation steps
        # Every top-level group other than "initialisation" is counted as one completed step
        completed_optimisation_steps = len(f.keys()) - 1
        if completed_optimisation_steps > 0:
            for i in range(1, completed_optimisation_steps + 1):
                logger.info(f"Loading data from optimisation step {i}...")
                ecrh_parameters.append(
                    torch.tensor(f[f"optimisation_step_{i}/ecrh_parameters"][:])
                )
                objective_values.append(
                    torch.tensor(f[f"optimisation_step_{i}/objective_values"][:])
                )

        # Concatenate
        ecrh_parameters = torch.cat(ecrh_parameters).to(
            device=args.device, dtype=args.dtype
        )
        objective_values = torch.cat(objective_values).to(
            device=args.device, dtype=args.dtype
        )

else:
    # Generate initial data
    logger.info("Generating initial data...")

    # Get number of cores
    n_cores = len(sched_getaffinity(0))
    # NOTE(review): integer division rounds the number of initial evaluations down to a
    # multiple of n_cores; if n_cores > initial_batch_size, n_batches is 0 and no
    # initial candidates are evaluated -- confirm this is intended.
    n_batches = args.initial_batch_size // n_cores

    # Evaluate initial candidates in batches of size n_cores
    for batch_index in range(n_batches):
        # Sobol sampling for initial candidates
        ecrh_parameters = acquisition.generate_initial_candidates(
            bounds=parameter_bounds,
            n=n_cores,
            device=args.device,
            dtype=args.dtype,
        )

        logger.info(f"Evaluating initial candidates (batch {batch_index})...")
        # Save initial candidates to file
        # The input profile is evaluated on a uniform xrho grid of n_xrho_points points in [0, 1]
        write_to_file(
            output_file=args.output_dir / "results.h5",
            root_label=f"initialisation/batch_{batch_index}",
            ecrh_parameters_batch=ecrh_parameters.detach().cpu().numpy(),
            preconverged_ecrh=np.array(
                [
                    ecrh_function(
                        xrho=np.linspace(0, 1, args.n_xrho_points), parameters=p
                    )
                    for p in ecrh_parameters.detach().cpu().numpy()
                ]
            ),
        )
        (
            converged_ecrh,
            converged_q,
            objective_values,
        ) = evaluate(
            ecrh_parameters_batch=ecrh_parameters.detach().cpu().numpy(),
            batch_directory=args.output_dir / f"0_initialisation_batch_{batch_index}",
        )
        # Save evaluated results to file
        write_to_file(
            output_file=args.output_dir / "results.h5",
            root_label=f"initialisation/batch_{batch_index}",
            converged_ecrh=converged_ecrh,
            converged_q=converged_q,
            objective_values=objective_values,
        )

    # Rearrange the file structure
    # The per-batch groups are merged into single datasets directly under
    # "initialisation", which is the layout read back by the --resume branch.
    with h5py.File(args.output_dir / "results.h5", "a") as h5file:
        n_evaluations = n_cores * n_batches
        # Create new datasets
        h5file.create_dataset(
            "initialisation/converged_ecrh",
            (n_evaluations, args.n_xrho_points),
        )
        h5file.create_dataset(
            "initialisation/converged_q", (n_evaluations, args.n_xrho_points)
        )
        h5file.create_dataset(
            "initialisation/ecrh_parameters",
            (n_evaluations, args.n_parameters),
        )
        h5file.create_dataset(
            "initialisation/objective_values",
            (n_evaluations, n_objectives),
        )
        h5file.create_dataset(
            "initialisation/preconverged_ecrh",
            (n_evaluations, args.n_xrho_points),
        )

        # Copy data across
        for batch_index in range(n_batches):
            # Rows [lower_index, upper_index) of the merged datasets belong to this batch
            lower_index = batch_index * n_cores
            upper_index = lower_index + n_cores
            h5file["initialisation/converged_ecrh"][lower_index:upper_index] = h5file[
                f"initialisation/batch_{batch_index}/converged_ecrh"
            ]
            h5file["initialisation/converged_q"][lower_index:upper_index] = h5file[
                f"initialisation/batch_{batch_index}/converged_q"
            ]
            h5file["initialisation/ecrh_parameters"][lower_index:upper_index] = h5file[
                f"initialisation/batch_{batch_index}/ecrh_parameters"
            ]
            h5file["initialisation/objective_values"][lower_index:upper_index] = h5file[
                f"initialisation/batch_{batch_index}/objective_values"
            ]
            h5file["initialisation/preconverged_ecrh"][
                lower_index:upper_index
            ] = h5file[f"initialisation/batch_{batch_index}/preconverged_ecrh"]

            # Remove the per-batch group once its contents have been copied
            del h5file[f"initialisation/batch_{batch_index}"]

        # Load back into a tensor
        ecrh_parameters = torch.tensor(
            h5file["initialisation/ecrh_parameters"][:],
            device=args.device,
            dtype=args.dtype,
        )
        objective_values = torch.tensor(
            h5file["initialisation/objective_values"][:],
            device=args.device,
            dtype=args.dtype,
        )

        # Compute the log hypervolume and store it as an attribute of the initialisation group
        log_hypervolume = utils.compute_pareto_loghypervolume(
            objective_values=objective_values,
            reference_point=reference_values,
        )
        h5file["initialisation"].attrs["log_hypervolume"] = log_hypervolume

    # Initialise optimisation step
    completed_optimisation_steps = 0


# Main optimisation loop: runs n_iterations further steps, numbered from the
# first step that has not yet been completed. Each step cleans the observed data,
# proposes a batch of candidates, evaluates them and appends the results to both
# the in-memory tensors and results.h5.
for optimisation_step in range(
    completed_optimisation_steps + 1,
    completed_optimisation_steps + 1 + args.n_iterations,
):
    logger.info(f"Optimisation step {optimisation_step}")

    # Drop any NaNs
    logger.info("Handling NaNs...")
    if args.discard_failures:
        # Keep only the rows in which every objective value is finite-or-inf (i.e. not NaN)
        mask = ~torch.isnan(objective_values).any(dim=1)
        ecrh_parameters = ecrh_parameters[mask]
        objective_values = objective_values[mask]
    else:
        # Replace NaNs with failure values
        objective_values[torch.isnan(objective_values)] = failure_objective_value

    # Generate trial candidates
    # Fall back to Sobol sampling when requested, or when there is no observed data to fit to
    if args.sobol_only or objective_values.nelement() == 0:
        # Use quasirandom Sobol sampling to generate trial candidates
        logger.info("Generating trial candidates using Sobol sampling...")
        new_ecrh_parameters = acquisition.generate_initial_candidates(
            bounds=parameter_bounds,
            n=args.batch_size,
            device=args.device,
            dtype=args.dtype,
        )
    else:
        logger.info("Fitting surrogate model...")
        model = surrogate.fit_surrogate_model(
            inputs=ecrh_parameters,
            input_bounds=parameter_bounds,
            objective_values=objective_values,
            device=args.device,
            dtype=args.dtype,
        )

        # Use qNEHVI to generate trial candidates
        logger.info("Generating trial candidates using qNEHVI...")
        new_ecrh_parameters = acquisition.generate_trial_candidates(
            observed_inputs=ecrh_parameters,
            bounds=parameter_bounds,
            model=model,
            acquisition_function=acquisition.qNoisyExpectedHypervolumeImprovement,
            n_constraints=0,
            device=args.device,
            dtype=args.dtype,
            batch_size=args.batch_size,
            # Batches of more than 5 candidates use the "sequential" mode, smaller ones "joint"
            mode="sequential" if args.batch_size > 5 else "joint",
            acqf_kwargs={
                "ref_point": reference_values,
                "alpha": args.alpha,
                "prune_baseline": True,
            },
        )
    # Save the candidates, and the input profiles they define, before running JETTO
    write_to_file(
        output_file=args.output_dir / "results.h5",
        root_label=f"optimisation_step_{optimisation_step}",
        ecrh_parameters_batch=new_ecrh_parameters.detach().cpu().numpy(),
        preconverged_ecrh=np.array(
            [
                ecrh_function(xrho=np.linspace(0, 1, args.n_xrho_points), parameters=p)
                for p in new_ecrh_parameters.detach().cpu().numpy()
            ]
        ),
    )

    # Evaluate candidates
    logger.info("Evaluating trial candidates...")
    (
        converged_ecrh,
        converged_q,
        new_objective_values,
    ) = evaluate(
        ecrh_parameters_batch=new_ecrh_parameters.detach().cpu().numpy(),
        batch_directory=args.output_dir / str(optimisation_step),
    )
    # Save the evaluated results under the same group as the candidates
    write_to_file(
        output_file=args.output_dir / "results.h5",
        root_label=f"optimisation_step_{optimisation_step}",
        converged_ecrh=converged_ecrh,
        converged_q=converged_q,
        objective_values=new_objective_values,
    )

    # Concatenate new data
    ecrh_parameters = torch.cat([ecrh_parameters, new_ecrh_parameters])
    # Have to convert new_objective_values to tensor, because it is a np.ndarray output from reading JettoResults
    objective_values = torch.cat(
        [
            objective_values,
            torch.tensor(
                new_objective_values,
                device=args.device,
                dtype=args.dtype,
            ),
        ]
    )

    # Compute and save the log hypervolume of all data observed so far.
    # NOTE(review): new NaN objective values are only handled at the start of the next
    # step, so they are still present in objective_values here -- confirm that
    # compute_pareto_loghypervolume tolerates them.
    log_hypervolume = utils.compute_pareto_loghypervolume(
        objective_values=objective_values,
        reference_point=reference_values,
    )
    write_to_file(
        output_file=args.output_dir / "results.h5",
        root_label=f"optimisation_step_{optimisation_step}",
        log_hypervolume=log_hypervolume,
    )