import torch
import numpy as np
import torch.distributions as tdist
import time
from pandas import DataFrame
from ccvm_simulators.solvers.ccvm_solver import CCVMSolver
from ccvm_simulators.solvers.algorithms import AdamParameters
from ccvm_simulators.solution import Solution
from ccvm_simulators.post_processor.factory import PostProcessorFactory
MF_SCALING_MULTIPLIER = 0.05
"""The value used by the MFSolver when calculating a scaling value in
super.get_scaling_factor()"""
class MFSolver(CCVMSolver):
"""Constructor method"""
def __init__(
self,
device,
problem_category="boxqp",
batch_size=1000,
):
"""
Args:
device (str): The device to use for the solver. Can be "cpu" or "cuda".
problem_category (str): The category of problem to solve. Can be one
of "boxqp". Defaults to "boxqp".
batch_size (int): The number of times to solve a problem instance
simultaneously. Defaults to 1000.
Raises:
ValueError: If the problem category is not supported by the solver.
Returns:
            MFSolver: The MFSolver object.
"""
super().__init__(device)
self.batch_size = batch_size
self._default_optics_machine_parameters = {
"laser_clock": 100e-12,
"FPGA_clock": 3.33e-9,
"FPGA_fixed": 34,
"FPGA_var_fac": 0.1,
"FPGA_power": {
20: 15.74,
30: 16.97,
40: 18.54,
50: 20.25,
60: 22.08,
70: 24.01,
},
"buffer_time": 3.33e-9,
"laser_power": 1000e-6,
"postprocessing_power": {
20: 4.87,
30: 5.14,
40: 5.11,
50: 5.08,
60: 5.09,
70: 5.3,
},
}
self._scaling_multiplier = MF_SCALING_MULTIPLIER
# Use the method selector to choose the problem-specific methods to use
self._method_selector(problem_category)
@property
def parameter_key(self):
"""The parameters that will be used by the solver when solving the problem.
Note:
Setting this parameter after calling tune() will overwrite tuned parameters.
The parameter_key must match the following format:
* key: problem size (the number of variables in the problem).
* value: dict with these keys:
* pump (float)
* feedback_scale (float)
* j (float)
* The measurement strength
* S (float or vector of float with size 'problem_size')
* The enforced saturation value
* dt (float)
* The time step or the learning rate (old name was lr)
                * iterations (int)
                    * The number of iterations to run the solver
With values, the parameter key might look like this::
{
20:
{
"pump": 2.5,
"feedback_scale": 400,
"j": 399,
"S": 20.0,
"dt": 0.0025,
"iterations": 15000
},
30:
{
"pump": 3.0,
"feedback_scale": 250,
"j": 399,
"S": 20.0,
"dt": 0.0025,
"iterations": 15000
},
}
Raises:
ValueError: If the parameter key does not contain the solver-specific
combination of keys described above.
"""
return self._parameter_key
@parameter_key.setter
def parameter_key(self, parameters):
expected_mfparameter_key_set = set(
["pump", "feedback_scale", "j", "S", "dt", "iterations"]
)
parameter_key_list = parameters.values()
# Iterate over the parameters for each given problem size
for parameter_key in parameter_key_list:
if parameter_key.keys() != expected_mfparameter_key_set:
# The parameter key is not valid for this solver
raise ValueError(
"The parameter key is not valid for this solver. Expected keys: "
+ str(expected_mfparameter_key_set)
+ " Given keys: "
+ str(parameter_key.keys())
)
# If we get here, the parameter key is valid
self._parameter_key = parameters
self._is_tuned = False
def _calculate_drift_boxqp(
self,
mu,
mu_tilde,
sigma,
pump,
j,
g,
S,
fs,
lower_limit=0,
upper_limit=1,
):
"""We treat the SDE that simulates the CIM of NTT as drift
calculation.
Args:
mu (torch.Tensor): Mean-field amplitudes
mu_tilde (torch.Tensor): Mean-field measured amplitudes
sigma (torch.Tensor): Variance of the in-phase position operator
pump (float): Instantaneous pump value
j (float): The measurement strength
g (float): The nonlinearity coefficient
S (float): The enforced saturation value
fs (float): The coefficient of the feedback term
lower_limit (float): The lower bound of the box constraint
upper_limit (float): The upper bound of the box constraint
Returns:
tuple: The gradients of the mean-field amplitudes and the variance.
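
        Example (a hedged sketch with illustrative, untuned values; `solver` is an
        MFSolver whose q_matrix and v_vector are already set, and mu, mu_tilde,
        and sigma each have shape (batch_size, problem_size))::

            drift_mu, drift_sigma = solver._calculate_drift_boxqp(
                mu, mu_tilde, sigma, pump=2.5, j=399, g=0.01, S=20.0, fs=400
            )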
"""
mu_pow = torch.pow(mu, 2)
mu_term1 = (-(1 + j) + pump - g**2 * mu_pow) * mu
mu_term2_1 = (
-(1 / 4)
* (
torch.einsum(
"bi,ij -> bj",
mu_tilde * (upper_limit - lower_limit) / S
+ (upper_limit + lower_limit),
self.q_matrix,
)
)
* (upper_limit - lower_limit)
/ S
)
mu_term2_2 = -self.v_vector * (upper_limit - lower_limit) / (2 * S)
sigma_term1 = 2 * (-(1 + j) + pump - 3 * g**2 * mu_pow) * sigma
sigma_term2 = -2 * j * (sigma - 0.5).pow(2)
sigma_term3 = (1 + j) + 2 * g**2 * mu_pow
drift_mu = mu_term1 + fs * (mu_term2_1 + mu_term2_2)
drift_sigma = sigma_term1 + sigma_term2 + sigma_term3
return drift_mu, drift_sigma
def _calculate_grads_boxqp(self, mu_tilde, S, fs, lower_limit=0, upper_limit=1):
"""We treat the SDE that simulates the CIM of NTT as gradient
calculation. Original SDE considers only quadratic part of the objective
function. Therefore, we need to modify and add linear part of the QP to
the SDE.
Args:
mu_tilde (torch.Tensor): Mean-field measured amplitudes
S (float): The enforced saturation value
fs (float): The coefficient of the feedback term
lower_limit (float): The lower bound of the box constraints
upper_limit (float): The upper bound of the box constraints
Returns:
tensor: The gradients of the mean-field amplitude.
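
        Example (a hedged sketch with illustrative, untuned values; mu_tilde has
        shape (batch_size, problem_size))::

            grads_mu = solver._calculate_grads_boxqp(mu_tilde, S=20.0, fs=400)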
"""
mu_term2_1 = (
-(1 / 4)
* (
torch.einsum(
"bi,ij -> bj",
mu_tilde * (upper_limit - lower_limit) / S
+ (upper_limit + lower_limit),
self.q_matrix,
)
)
* (upper_limit - lower_limit)
/ S
)
mu_term2_2 = -self.v_vector * (upper_limit - lower_limit) / (2 * S)
grads_mu = fs * (mu_term2_1 + mu_term2_2)
return grads_mu
def _change_variables_boxqp(
self, problem_variables, lower_limit=0, upper_limit=1, S=1
):
"""Perform a change of variables to enforce the box constraints.
Args:
problem_variables (torch.Tensor): The variables to change.
lower_limit (float): The lower bound of the box constraints. Defaults to 0.
upper_limit (float): The upper bound of the box constraints. Defaults to 1.
            S (float or torch.tensor): The enforced saturation value. Defaults to 1.
Returns:
torch.Tensor: The changed variables.
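
        Example (a hedged numeric check of the mapping from [-S, S] onto
        [lower_limit, upper_limit])::

            x = torch.tensor([-20.0, 0.0, 20.0])
            solver._change_variables_boxqp(x, 0, 1, S=20)
            # -> tensor([0.0000, 0.5000, 1.0000])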
"""
return 0.5 * problem_variables / S * (upper_limit - lower_limit) + 0.5 * (
upper_limit + lower_limit
)
def _fit_to_constraints_boxqp(self, mu_tilde, lower_clamp, upper_clamp):
"""Clamps the values of mu_tilde to be within the box constraints
Args:
mu_tilde (torch.Tensor): The mean-field measured amplitudes.
lower_clamp (float or torch.tensor): The lower bound of the box constraints.
upper_clamp (float or torch.tensor): The upper bound of the box constraints.
Returns:
torch.Tensor: The clamped values of mu_tilde, now within the box constraints.
"""
mu_tilde_clamped = torch.clamp(mu_tilde, lower_clamp, upper_clamp)
return mu_tilde_clamped
def _append_samples_to_file(self, mu_sample, sigma_sample, evolution_file_object):
"""Saves samples of the mean-field amplitudes and the variance of the in-phase
position operator to a file. The end file will contain the values of the
mu_sample followed by the sigma_sample. Each line corresponds to a row in the
        tensor, with tab-delimited values.
Args:
mu_sample (torch.Tensor): The sample of mean-field amplitudes to add to the
file. Expected Dimensions: problem_size x num_samples.
sigma_sample (torch.Tensor): The sample of the variance of the in-phase
position operator to add to the file. Expected Dimensions: problem_size
x num_samples.
evolution_file_object (io.TextIOWrapper): The file object of the file to
save the samples to.
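
        Example (sketch of the resulting file layout for 2 variables and 3 samples;
        each row is tab-delimited, with the mu rows first, then the sigma rows)::

            mu[0,0]     mu[0,1]     mu[0,2]
            mu[1,0]     mu[1,1]     mu[1,2]
            sigma[0,0]  sigma[0,1]  sigma[0,2]
            sigma[1,0]  sigma[1,1]  sigma[1,2]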
"""
# Save the mu samples to the file
mu_rows = mu_sample.shape[0] # problem_size
mu_columns = mu_sample.shape[1] # num_samples
for nn in range(mu_rows):
for ii in range(mu_columns):
evolution_file_object.write(str(round(mu_sample[nn, ii].item(), 4)))
if ii != mu_columns - 1:
evolution_file_object.write("\t")
evolution_file_object.write("\n")
# Save the sigma samples to the file
sigma_rows = sigma_sample.shape[0] # problem_size
sigma_columns = sigma_sample.shape[1] # num_samples
for nn in range(sigma_rows):
for ii in range(sigma_columns):
evolution_file_object.write(str(round(sigma_sample[nn, ii].item(), 4)))
if ii != sigma_columns - 1:
evolution_file_object.write("\t")
evolution_file_object.write("\n")
def _is_valid_optics_machine_parameters(self, machine_parameters):
"""Validates that the given optics machine parameters are valid for this solver.
Args:
machine_parameters (dict): The machine parameters to validate.
Raises:
ValueError: If the given machine parameters are invalid.
"""
required_keys = [
"laser_clock",
"FPGA_clock",
"FPGA_fixed",
"FPGA_var_fac",
"FPGA_power",
"buffer_time",
"laser_power",
"postprocessing_power",
]
# Check that all required keys are present
missing_keys = [key for key in required_keys if key not in machine_parameters]
if missing_keys:
raise ValueError(
f"Invalid optics_machine_parameters: Missing required keys - {missing_keys}"
)
    def tune(self, instances, post_processor=None, g=0.01):
        """Determines the best parameters for the solver to use by adjusting each
        parameter over a number of iterations on the problems in the given set of
        problem instances. The `parameter_key` attribute of the solver will be
        updated with the best parameters found.
Args:
instances (list): A list of problem instances to tune the solver on.
post_processor (str): The name of the post processor to use to process the
results of the solver. None if no post processing is desired.
Defaults to None.
g (float): The nonlinearity coefficient. Defaults to 0.01.
"""
# TODO: This implementation is a placeholder; full implementation is a
# future consideration
        self._is_tuned = True
def _optics_machine_energy(
self,
machine_parameters=None,
):
"""The wrapper function of calculating the average energy consumption of the
solver, as if the solving process was to be performed on an optical DL-CCVM
machine.
Args:
machine_parameters (dict, optional): Parameters of the machine. Defaults to
None.
Raises:
ValueError: when the given machine parameters are not valid.
ValueError: when the given dataframe does not contain the required columns.
Returns:
Callable: A callable function that takes in a dataframe and problem size and
returns the average energy consumption of the solver.
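
        Example (a hedged usage sketch; `df` is assumed to be a results DataFrame
        with 'iterations' and 'pp_time' columns for a problem size covered by the
        solver's parameter_key)::

            energy_fn = solver._optics_machine_energy()
            avg_energy = energy_fn(df, problem_size=20)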
"""
if machine_parameters is None:
machine_parameters = self._default_optics_machine_parameters
else:
self._is_valid_optics_machine_parameters(machine_parameters)
def _optics_machine_energy_callable(
dataframe: DataFrame,
problem_size: int,
):
"""Calculate the average energy consumption of the solver simulating on a
MF-CCVM machine.
Args:
dataframe (DataFrame): The necessary data to calculate the average
energy.
problem_size (int): The size of the problem.
Raises:
ValueError: when the given dataframe does not contain the required
columns.
Returns:
float: The average energy consumption of the solver.
"""
self._validate_machine_energy_dataframe_columns(dataframe)
try:
pump = self.parameter_key[problem_size]["pump"]
measure_strength = self.parameter_key[problem_size]["j"]
except KeyError as e:
raise KeyError(
f"The parameter '{e.args[0]}' for the given instance size: {problem_size} is not defined."
) from e
iterations = np.mean(dataframe["iterations"].values)
postprocessing_time = np.mean(dataframe["pp_time"].values)
roundtrip_time = (
(
machine_parameters["FPGA_fixed"]
+ machine_parameters["FPGA_var_fac"] * float(problem_size)
)
* machine_parameters["FPGA_clock"]
+ float(problem_size) * machine_parameters["laser_clock"]
+ machine_parameters["buffer_time"]
)
optics_power = machine_parameters["FPGA_power"][
problem_size
] + machine_parameters["laser_power"] * (pump + 1 + measure_strength)
optics_energy = (
roundtrip_time * optics_power
- machine_parameters["FPGA_power"][problem_size]
* machine_parameters["buffer_time"]
) * iterations
postprocessing_energy = (
machine_parameters["postprocessing_power"][problem_size]
* postprocessing_time
)
machine_energy = optics_energy + postprocessing_energy
return machine_energy
return _optics_machine_energy_callable
def _optics_machine_time(self, machine_parameters: dict = None):
"""The wrapper function of calculating the average time spent by the
solver on a single instance, as if the solving process was to be performed on
an optical MF-CCVM machine.
Args:
machine_parameters (dict, optional): Parameters of the optical MF-CCVM
machine. Defaults to None.
Raises:
ValueError: when the given machine parameters are not valid.
            KeyError: when the given dataframe does not contain the required columns.
Returns:
Callable: A callable function that takes in a dataframe and problem size and
returns the average time spent by the solver on a single instance.
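
        Example (a hedged usage sketch; `df` is assumed to be a results DataFrame
        with 'iterations' and 'pp_time' columns)::

            time_fn = solver._optics_machine_time()
            avg_time = time_fn(df, problem_size=20)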
"""
if machine_parameters is None:
machine_parameters = self._default_optics_machine_parameters
else:
self._is_valid_optics_machine_parameters(machine_parameters)
def _optics_machine_time_callable(dataframe: DataFrame, problem_size: int):
"""Calculate the average time spent by the solver on a single instance,
            as if run on an MF-CCVM machine.
Args:
dataframe (DataFrame): The necessary data to calculate the average
time.
problem_size (int): The size of the problem.
Raises:
                KeyError: when the given dataframe does not contain the required
                    columns.
Returns:
float: The average time spent by the solver on a single instance.
"""
try:
iterations = np.mean(dataframe["iterations"].values)
postprocessing_time = np.mean(dataframe["pp_time"].values)
            except KeyError as e:
                missing_column = e.args[0]
                raise KeyError(
                    f"The given dataframe is missing the {missing_column} column."
                    " Required columns are: ['iterations', 'pp_time']."
                ) from e
roundtrip_time = (
(
machine_parameters["FPGA_fixed"]
+ machine_parameters["FPGA_var_fac"] * float(problem_size)
)
* machine_parameters["FPGA_clock"]
+ float(problem_size) * machine_parameters["laser_clock"]
+ machine_parameters["buffer_time"]
)
machine_time = roundtrip_time * iterations + postprocessing_time
return machine_time
return _optics_machine_time_callable
def _solve(
self,
problem_size,
batch_size,
device,
S,
pump,
dt,
iterations,
j,
feedback_scale,
pump_rate_flag,
g,
evolution_step_size,
samples_taken,
):
"""Solves the given problem instance using the original MF-CCVM solver with
tuned or specified parameters in the parameter key.
Args:
problem_size (int): instance size.
batch_size (int): The number of times to solve a problem instance
device (str): The device to use for the solver. Can be "cpu" or "cuda".
S (float): Saturation bound.
pump (float): Pump field strength.
dt (float): Simulation time step.
            iterations (int): The number of iterations to run the solver.
            j (float): The measurement strength.
            feedback_scale (float): The coefficient of the feedback term.
            pump_rate_flag (bool): Whether or not to scale the pump rate based on the
                iteration number.
            g (float): The nonlinearity coefficient.
            evolution_step_size (int): If set, the mu/sigma values will be sampled
                once per number of iterations equivalent to the value of this
                variable. At the end of the solve process, the best batch of sampled
                values will be written to a file that can be specified by setting the
                evolution_file parameter.
            samples_taken (int): The index of the next sample slice to record when
                evolution values are being saved.
        Returns:
            tuple: The final values of the mu, mu_tilde, and sigma tensors.
"""
# Initialize tensor variables on the device that will be used to perform
# the calculations
mu = torch.zeros((batch_size, problem_size), dtype=torch.float, device=device)
sigma = torch.ones(
(batch_size, problem_size), dtype=torch.float, device=device
) * (1 / 2)
wiener_dist = tdist.Normal(
torch.tensor([0.0] * batch_size, device=device),
torch.tensor([1.0] * batch_size, device=device),
)
# Perform the solve over the specified number of iterations
pump_rate = 1
for i in range(iterations):
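            # Time-dependent measurement strength: decays from roughly j at the
            # first iteration to j * e^(-3) at the last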
j_i = j * np.exp(-(i + 1) / iterations * 3.0)
wiener = wiener_dist.sample((problem_size,)).transpose(0, 1)
wiener_increment = wiener / np.sqrt(dt)
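            # Measured amplitudes: the mean-field value plus the Wiener increment
            # scaled by sqrt(1 / (4 * j_i))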
mu_tilde = mu + np.sqrt(1 / (4 * j_i)) * wiener_increment
mu_tilde_c = self.fit_to_constraints(mu_tilde, -S, S)
if pump_rate_flag:
pump_rate = (i + 1) / iterations
instantaneous_pump = pump * pump_rate + 1 + j_i
(drift_mu, drift_sigma) = self.calculate_drift(
mu,
mu_tilde_c,
sigma,
instantaneous_pump,
j_i,
g,
S,
feedback_scale,
self.solution_bounds[0],
self.solution_bounds[1],
)
            # mu_term3 -> mu_diffusion: diffusion term of the mean-field amplitudes
mu_diffusion = np.sqrt(j_i) * (sigma - 0.5) * wiener_increment
mu += dt * (drift_mu + mu_diffusion)
sigma += dt * drift_sigma
# If evolution_step_size is specified, save the values if this iteration
# aligns with the step size or if this is the last iteration
if evolution_step_size and (
i % evolution_step_size == 0 or i + 1 >= iterations
):
# Update the record of the sample values with the values found at
# this iteration
self.mu_sample[:, :, samples_taken] = mu
self.sigma_sample[:, :, samples_taken] = sigma
samples_taken += 1
mu_tilde = self.fit_to_constraints(mu_tilde, -S, S)
return mu, mu_tilde, sigma
def _solve_adam(
self,
problem_size,
batch_size,
device,
S,
pump,
dt,
iterations,
j,
feedback_scale,
pump_rate_flag,
g,
evolution_step_size,
samples_taken,
hyperparameters,
):
"""Solves the given problem instance using the MF-CCVM solver with Adam
algorithm tuned or specified parameters in the parameter key.
Args:
problem_size (int): instance size.
batch_size (int): The number of times to solve a problem instance
device (str): The device to use for the solver. Can be "cpu" or "cuda".
S (float): Saturation bound.
pump (float): Pump field strength.
dt (float): Simulation time step.
            iterations (int): The number of iterations to run the solver.
            j (float): The measurement strength.
            feedback_scale (float): The coefficient of the feedback term.
            pump_rate_flag (bool): Whether or not to scale the pump rate based on the
                iteration number.
            g (float): The nonlinearity coefficient.
            evolution_step_size (int): If set, the mu/sigma values will be sampled
                once per number of iterations equivalent to the value of this
                variable. At the end of the solve process, the best batch of sampled
                values will be written to a file that can be specified by setting the
                evolution_file parameter.
            samples_taken (int): The index of the next sample slice to record when
                evolution values are being saved.
            hyperparameters (dict): Hyperparameters for the Adam algorithm.
        Returns:
            tuple: The final values of the mu, mu_tilde, and sigma tensors.
"""
# Initialize tensor variables on the device that will be used to perform
# the calculations
mu = torch.zeros((batch_size, problem_size), dtype=torch.float, device=device)
sigma = torch.ones(
(batch_size, problem_size), dtype=torch.float, device=device
) * (1 / 2)
wiener_dist = tdist.Normal(
torch.tensor([0.0] * batch_size, device=device),
torch.tensor([1.0] * batch_size, device=device),
)
# Pump rate update selection: time-dependent
pump_rate_i = lambda i: (i + 1) / iterations
pump_rate_c = lambda i: 1.0
if pump_rate_flag:
pump_rate = pump_rate_i
else:
pump_rate = pump_rate_c
alpha = hyperparameters["alpha"]
beta1 = hyperparameters["beta1"]
beta2 = hyperparameters["beta2"]
epsilon = 1e-8
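        # For reference, the Adam update implemented below (per element, step t):
        #   m_t    = beta1 * m_{t-1} + (1 - beta1) * g_t
        #   mhat_t = m_t / (1 - beta1**t)
        #   v_t    = beta2 * v_{t-1} + (1 - beta2) * g_t**2
        #   vhat_t = v_t / (1 - beta2**t)
        #   update = alpha * mhat_t / (sqrt(vhat_t) + epsilon)
        # With beta2 == 1.0 the second moment is skipped (update = alpha * mhat_t),
        # and the add_assign variant adds the update to the raw gradients instead.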
# Compute bias corrected grads using 1st and 2nd moments
# with element-wise division
def update_grads_with_moment2_assign(grads, mhat, vhat):
return alpha * torch.div(mhat, torch.sqrt(vhat) + epsilon)
def update_grads_with_moment2_addassign(grads, mhat, vhat):
return grads + alpha * torch.div(mhat, torch.sqrt(vhat) + epsilon)
# Compute bias corrected grads using only 1st moment
def update_grads_without_moment2_assign(grads, mhat):
return alpha * mhat
def update_grads_without_moment2_addassign(grads, mhat):
return grads + alpha * mhat
# Choose desired update method.
if hyperparameters["add_assign"]:
update_grads_with_moment2 = update_grads_with_moment2_addassign
update_grads_without_moment2 = update_grads_without_moment2_addassign
else:
update_grads_with_moment2 = update_grads_with_moment2_assign
update_grads_without_moment2 = update_grads_without_moment2_assign
# Initialize first moment vector
m_mu = torch.zeros((batch_size, problem_size), dtype=torch.float, device=device)
# Initialize second moment vector conditionally
if not beta2 == 1.0:
v_mu = torch.zeros(
(batch_size, problem_size), dtype=torch.float, device=device
)
else:
v_mu = None
# Perform the solve over the specified number of iterations
for i in range(iterations):
j_i = j * np.exp(-(i + 1) / iterations * 3.0)
wiener = wiener_dist.sample((problem_size,)).transpose(0, 1)
wiener_increment = wiener / np.sqrt(dt)
mu_tilde = mu + np.sqrt(1 / (4 * j_i)) * wiener_increment
mu_tilde_c = self.fit_to_constraints(mu_tilde, -S, S)
rate = pump_rate(i) # t/T
pump_i = pump * rate + 1 + j_i
grads_mu = self.calculate_grads(
mu_tilde_c,
S,
feedback_scale,
self.solution_bounds[0],
self.solution_bounds[1],
)
# Update biased first moment estimate
m_mu = beta1 * m_mu + (1.0 - beta1) * grads_mu
# Compute bias correction in 1st moment
beta1i = 1.0 - beta1 ** (i + 1)
mhat_mu = m_mu / beta1i
# Conditional second moment estimation
if not beta2 == 1.0:
# Update biased 2nd moment estimate
v_mu = beta2 * v_mu + (1.0 - beta2) * torch.pow(grads_mu, 2)
# Compute bias correction in 2nd moment
beta2i = 1.0 - beta2 ** (i + 1)
vhat_mu = v_mu / beta2i
# Compute bias corrected grad using 1st and 2nd moments
# in the form of element-wise division
grads_mu = update_grads_with_moment2(grads_mu, mhat_mu, vhat_mu)
else:
# Compute bias corrected grad only with 1st moment
grads_mu = update_grads_without_moment2(grads_mu, mhat_mu)
# Calculate drift and diffusion terms of mf-ccvm
mu_pow = torch.pow(mu, 2)
mu_drift = (-(1 + j_i) + pump_i - g**2 * mu_pow) * mu
mu_drift += np.sqrt(j_i) * (sigma - 0.5) * wiener_increment
mu += dt * (grads_mu + mu_drift)
sigma_drift = 2 * (-(1 + j_i) + pump_i - 3 * g**2 * mu_pow) * sigma
sigma_drift += -2 * j_i * (sigma - 0.5).pow(2)
sigma_drift += (1 + j_i) + 2 * g**2 * mu_pow
sigma += dt * sigma_drift
# If evolution_step_size is specified, save the values if this iteration
# aligns with the step size or if this is the last iteration
if evolution_step_size and (
i % evolution_step_size == 0 or i + 1 >= iterations
):
# Update the record of the sample values with the values found at
# this iteration
self.mu_sample[:, :, samples_taken] = mu
self.sigma_sample[:, :, samples_taken] = sigma
samples_taken += 1
mu_tilde = self.fit_to_constraints(mu_tilde, -S, S)
return mu, mu_tilde, sigma
def __call__(
self,
instance,
post_processor=None,
g=0.01,
pump_rate_flag=True,
evolution_step_size=None,
evolution_file=None,
algorithm_parameters=None,
):
"""Solves the given problem instance by choosing one of the available
MF-CCVM solvers tuned or specified parameters in the parameter key.
Args:
instance (boxqp.boxqp.ProblemInstance): The problem to solve.
post_processor (str): The name of the post processor to use to process
the results of the solver. None if no post processing is desired.
g (float, optional): The nonlinearity coefficient. Defaults to 0.01
pump_rate_flag (bool, optional): Whether or not to scale the pump rate
based on the iteration number. If False, the pump rate will be 1.0.
Defaults to True.
evolution_step_size (int): If set, the mu/sigma values will be sampled once
per number of iterations equivalent to the value of this variable. At
the end of the solve process, the best batch of sampled values will be
written to a file that can be specified by setting the evolution_file
                parameter. Defaults to None, meaning no problem variables will be written
to the file.
evolution_file (str): The file to save the best set of mu/sigma samples to.
                Only relevant when evolution_step_size is set. If a file already exists
with the same name, it will be overwritten. Defaults to None, which
generates a filename based on the problem instance name.
algorithm_parameters (None, AdamParameters): Specify for the solver to use a
specialized algorithm by passing in an instance of the algorithm's
parameters class. Options include: AdamParameters. Defaults to None,
which uses the original MF solver.
Returns:
solution (Solution): The solution to the problem instance.
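
        Example (a hedged end-to-end sketch; `instance` is assumed to be a loaded
        boxqp ProblemInstance on the same device, and the parameter values below
        are illustrative rather than tuned)::

            solver = MFSolver(device="cpu", batch_size=100)
            solver.parameter_key = {
                20: {
                    "pump": 2.5,
                    "feedback_scale": 400,
                    "j": 399,
                    "S": 20.0,
                    "dt": 0.0025,
                    "iterations": 15000,
                }
            }
            solution = solver(instance, post_processor=None)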
"""
# If the instance and the solver don't specify the same device type, raise an
# error
if instance.device != self.device:
raise ValueError(
f"The device type of the instance ({instance.device}) and the solver"
f" ({self.device}) must match."
)
# Get problem from problem instance
problem_size = instance.problem_size
self.q_matrix = instance.q_matrix
self.v_vector = instance.v_vector
self.solution_bounds = instance.solution_bounds
# Get solver setup variables
batch_size = self.batch_size
device = self.device
# Get parameters from parameter_key
try:
pump = self.parameter_key[problem_size]["pump"]
dt = self.parameter_key[problem_size]["dt"]
iterations = self.parameter_key[problem_size]["iterations"]
j = self.parameter_key[problem_size]["j"]
feedback_scale = self.parameter_key[problem_size]["feedback_scale"]
S = self.parameter_key[problem_size]["S"]
            # If S is a 1-D tensor, convert it to a 2-D tensor
if torch.is_tensor(S) and S.ndim == 1:
# Dimension indexing in pytorch starts at 0
if S.size(dim=0) == problem_size:
S = torch.outer(torch.ones(batch_size), S)
else:
raise ValueError("Tensor S size should be equal to problem size.")
except KeyError as e:
raise KeyError(
f"The parameter '{e.args[0]}' for the given instance size is not"
" defined."
) from e
# Start timing the solve process
solve_time_start = time.time()
samples_taken = None
self.mu_sample = None
self.sigma_sample = None
if evolution_step_size:
# Check that the value is valid
if evolution_step_size < 1:
raise ValueError(
f"The evolution step size must be greater than or equal to 1."
)
# Generate evolution file name
if evolution_file is None:
evolution_file = f"./{instance.name}_evolution.txt"
# Get the number of samples to save
# Find the number of full steps that will be taken
num_steps = int(iterations / evolution_step_size)
# We will also capture the first iteration through
num_samples = num_steps + 1
# And capture the last iteration if the step size doesn't evenly divide
if iterations % evolution_step_size != 0:
num_samples += 1
# Initialize tensors
# Store on CPU to keep the memory usage lower on the GPU
self.mu_sample = torch.zeros(
(batch_size, problem_size, num_samples), device="cpu"
)
self.sigma_sample = torch.zeros(
(batch_size, problem_size, num_samples), device="cpu"
)
samples_taken = 0
if algorithm_parameters is None:
# Use the original MF solver
mu, mu_tilde, sigma = self._solve(
problem_size,
batch_size,
device,
S,
pump,
dt,
iterations,
j,
feedback_scale,
pump_rate_flag,
g,
evolution_step_size,
samples_taken,
)
elif isinstance(algorithm_parameters, AdamParameters):
# Use the MF solver with Adam algorithm
mu, mu_tilde, sigma = self._solve_adam(
problem_size,
batch_size,
device,
S,
pump,
dt,
iterations,
j,
feedback_scale,
pump_rate_flag,
g,
evolution_step_size,
samples_taken,
algorithm_parameters.to_dict(),
)
else:
raise ValueError(
f"Solver option type {type(algorithm_parameters)} is not supported."
)
        # Stop the timer for the solve and compute the per-instance solution time.
        # Due to the division by batch_size, solve_time improves for larger batches
        # when the solver is run on a GPU; this is expected, since the GPU
        # parallelizes the work of solving a single instance across the batch.
solve_time = (time.time() - solve_time_start) / batch_size
# Run the post processor on the results, if specified
if post_processor:
post_processor_object = PostProcessorFactory.create_postprocessor(
post_processor
)
problem_variables = post_processor_object.postprocess(
self.change_variables(
mu_tilde, self.solution_bounds[0], self.solution_bounds[1], S
),
self.q_matrix,
self.v_vector,
)
# Post-processing time for solving an instance once
pp_time = post_processor_object.pp_time / batch_size
else:
problem_variables = self.change_variables(
mu_tilde, self.solution_bounds[0], self.solution_bounds[1], S
)
pp_time = 0.0
objval = instance.compute_energy(problem_variables)
if evolution_step_size:
            # Find the index of the batch entry with the best sampled objective
            # value; its mu and sigma samples will be saved to the file
            batch_index = torch.argmax(-objval)
            # Write the samples to the evolution file, overwriting any existing file
            with open(evolution_file, "w") as evolution_file_obj:
self._append_samples_to_file(
mu_sample=self.mu_sample[batch_index],
sigma_sample=self.sigma_sample[batch_index],
evolution_file_object=evolution_file_obj,
)
solution = Solution(
problem_size=instance.problem_size,
batch_size=batch_size,
instance_name=instance.name,
iterations=iterations,
objective_values=objval,
solve_time=solve_time,
pp_time=pp_time,
optimal_value=instance.optimal_sol,
best_value=instance.best_sol,
num_frac_values=instance.num_frac_values,
solution_vector=instance.solution_vector,
variables={
"problem_variables": problem_variables,
"mu": mu,
"sigma": sigma,
},
device=device,
)
# Add evolution filename to solution if it was generated
if evolution_step_size:
solution.evolution_file = evolution_file
return solution