Source code for TrainingFuncs

import pennylane as qml
from pennylane import numpy as np
import sklearn
from sklearn.preprocessing import MinMaxScaler
from matplotlib import pyplot as plt
from tqdm import tqdm
import pickle
import jax
from jax import numpy as jnp
import os



[docs]
def split_train_test(
    data, n_qubits: int, train_ratio: float = 2 / 3, random: bool = False, seed: int = 0
):
    """
    Splits data into two sub-datsets: one for training and one for testing.

            Parameters:
                    data (numpy.array): 1-D data to be split
                    n_qubits (int): number of qubits in the circuit
                    train_ratio (float): fraction of full data to be used for training. Must be less than 1.
                    random (bool): if False (default), the data is split chronologically e.g., the first 2/3 of the data are used for training and the last 1/3 are used for testing. If True, the data is split randomly.
                    seed (int): seed for np.random
            Returns:
                    train (numpy.ndarray): 2-D array containing the training data. The shape of the data is (train_size//n_qubits, n_qubits)
                    test (numpy.ndarray): 2-D array containing the testing data. The shape of the data is (test_size//n_qubits, n_qubits)
                    train_size: the total number of values in train divided by n_qubits (i.e., the number of n_qubits-sized "groups" in train)
                    test_size: the total number of values in test divided by n_qubits (i.e., the number of n_qubits-sized "groups" in test)
                    train_ratio: fraction of full data to be used for training. Must be less than 1.
                    indices: gives the index of each "group" in the original data. If random is False, indices is just the range of integers from 0 to the number of groups.
    """

    # This transforms the data, creating subgroups of n_qubits consecutive elements each. The first group contains the first n_qubits elements, the second contains the second n_qubits elements, and so on.
    # For example, if the data is [1,2,3,4,5,6] and n_qubits is 3, this returns [[1,2,3],[2,3,4],[3,4,5],[4,5,6]]
    grouped_data = np.zeros((len(data) - n_qubits + 1, n_qubits))
    for i in range(len(data) - n_qubits + 1):
        grouped_data[i] = (np.array(data[i : i + n_qubits])).squeeze()

    indices = np.arange(0, len(grouped_data))
    if random == True:
        np.random.seed(seed)
        np.random.shuffle(indices)
    shuffled_grouped_data = grouped_data[indices]

    train = shuffled_grouped_data[: int(train_ratio * (len(shuffled_grouped_data)))]
    test = shuffled_grouped_data[int(train_ratio * (len(shuffled_grouped_data))) :]
    train_size = len(train)
    test_size = len(test)

    return train, test, train_size, test_size, train_ratio, indices




[docs]
def scale_data(
    train,
    test,
    train_size: int,
    test_size: int,
    n_qubits: int,
    scaler_min: float = 0.2,
    scaler_max: float = 0.8,
):
    """
    Scales the data for embedding in the circuit. By default, scales all values to be between 0.2 and 0.8.

            Parameters:
                    train (numpy.ndarray): 2-D array containing the training data. The shape of the data is (train_size, n_qubits)
                    test (numpy.ndarray): 2-D array containing the testing data. The shape of the data is (test_size, n_qubits)
                    train_size (int): the length of the training set
                    test_size (int): the length of the training set
                    n_qubits (int): number of qubits in the circuit
                    scaler_min (float)= the target minimum value for all values in the full dataset
                    scaler_max (float)= the target maximum value for all values in the full dataset
            Returns:
                    final_train (numpy.ndarray): 2-D array containing the scaled training data. The shape of the data is (train_size, n_qubits)
                    final_test (numpy.ndarray): 2-D array containing the scaled testing data. The shape of the data is (test_size, n_qubits)
                    scaler: The initialized and fitted scaler
    """
    init_scaler = MinMaxScaler((scaler_min, scaler_max))
    train_1d = train.reshape(train_size * n_qubits, 1)
    test_1d = test.reshape(test_size * n_qubits, 1)
    train_test_1d = np.concatenate((train_1d, test_1d))
    scaler = init_scaler.fit(train_test_1d)
    scaled_train_1d = scaler.transform(train_1d)
    scaled_test_1d = scaler.transform(test_1d)
    scaled_train = scaled_train_1d.reshape(train_size, n_qubits)
    scaled_test = scaled_test_1d.reshape(test_size, n_qubits)

    final_train = scaled_train
    final_test = scaled_test

    return final_train, final_test, scaler




[docs]
def train_model(
    train,
    test,
    weights,
    circuit,
    n_qubits: int,
    max_steps: int,
    epochs: int,
    loss_function="mean square error",
    learning_rate=0.1,
    bool_plot=False,
    save_plot: str = None,
):
    """
    Trains the circuit using the "train" dataset and according to the specified hyperparameters.

            Parameters:
                    train (numpy.ndarray): 2-D array containing the scaled training data. Used to train the model and update weights.
                    test (numpy.ndarray): 2-D array containing the scaled testing data. Used to check progress of training.
                    weights: parameters of the circuit updated by the optimizer to change output.
                    circuit (pennylane.qnode.QNode): The circuit which encodes the training data and, according to its parameters, returns an output to be compared with "target" data
                    n_qubits (int): The number of qubits in the quantum circuit
                    max_steps (int): The number of times the weights should be updated before the entire dataset has been evaluated.
                    max_epochs (int): The maximum number of times the full dataset should be evaluated.
                    loss_function: the function to evaluate the performance of the model i.e., the function to be minimized
                    optimizer: The algorithm that adjusts the weights in the circuit.
                    learning_rate: the learning rate of the optimizer.
                    bool_plot (bool): If True, will plot the loss as a function of epochs once training is completed
                    save_plot (str): If None, the plot will not be saved, otherwise it will be saved as the string entered
            Returns:
                    weights: the most-recently updated weights that were obtained when training is complete
                    x_t: input values for testing
                    target_y_t: target values for training
    """

    def input_target_split(data):
        """
        For a 2-D array, moves along axis = 0 and splits each array of size N into an "input" array of size N-1 and a "target" array of size N.

                Parameters:
                        data (numpy.ndarray): The 2-D array to be split
                Returns:
                        x (numpy.ndarray): A 2-D "input" array. x[i] is a 1-D array containing data[i][:-1]
                        target_y (numpy.ndarray): A 2-D "target" array. target_y[i]  is a 1-D array of containing data[i][-1]
        """
        data_size = len(data)
        x = np.zeros((data_size, n_qubits - 1))
        target_y = np.zeros((data_size, 1))
        for i in range(data_size):
            x[i] = data[i][:-1]
            target_y[i] = data[i][-1]
        return x, target_y

    valid_loss_functions = ["mean square error"]
    if loss_function not in valid_loss_functions:
        raise ValueError(
            "Invalid loss function! Only currently supported loss function is 'mean square error'"
        )
    elif loss_function == "mean square error":

        def square_loss(targets, predictions):
            """
            Calculate the mean squared error (MSE) between target values and predicted values.

                    Parameters:
                            targets: The true target values.
                            predictions: The predicted values.

                    Returns:
                            DynamicJaxprTracer: The calculated mean squared error between targets and predictions.
            """
            reshaped_predictions = predictions.reshape(len(predictions), 1)
            return jnp.mean((targets - reshaped_predictions) ** 2)

        def not_jit_cost(weights, x, y):
            """
            Calculate the cost function by evaluating the mean squared error between predicted values and target values.

            This function calculates predictions using the vmapped function 'circuit' and computes
            the mean squared error between the predictions and true target values.

                    Parameters:
                            weights: Quantum circuit parameters.
                            x (Jax tensor): Input data for making predictions.
                            y (Jax tensor): True target values.

                    Returns:
                            DynamicJaxprTracer: Mean squared error between predicted values and true target values.
            """
            predictions = circuit(weights, x)
            return square_loss(y, predictions)

        # Create a jitted version of the cost function for just-in-time compilation
        cost = jax.jit(not_jit_cost)

    x, target_y = input_target_split(train)
    x_t, target_y_t = input_target_split(test)

    train_size = len(train)
    batch_size = train_size // max_steps
    cst = []
    cst.append(cost(weights, x, target_y))
    cst_t = []
    cst_t.append(cost(weights, x_t, target_y_t))

    for i in tqdm(range(epochs)):
        for step in range(max_steps):
            # Select batch of data
            batch_index = np.random.randint(0, max_steps, batch_size)
            x_batch = x[batch_index]
            y_batch = target_y[batch_index]
            # Convert arrays into Jax tensors for vmapped circuit
            jax_x_batch = jnp.array(x_batch)
            jax_y_batch = jnp.array(y_batch)
            # Update the weights by one optimizer step
            gradient = jax.grad(cost)(weights, jax_x_batch, jax_y_batch)
            weights -= learning_rate * gradient
        c = cost(
            weights, x, target_y
        )  # Calculating the cost using the whole train data
        c_t = cost(weights, x_t, target_y_t)
        cst.append(c)
        cst_t.append(c_t)

    if bool_plot == True or save_plot != None:
        plt.figure()
        plt.semilogy(range(len(cst)), cst, "b", label="train")
        plt.semilogy(cst_t, "r", label="test")
        plt.ylabel("Cost")
        plt.xlabel("Step")
        plt.title("Loss")
        plt.legend()
        plt.figtext(
            x=0,
            y=0,
            s="initial train cost" + str(cst[0]) + "; final train cost:" + str(cst[-1]),
        )
        if save_plot != None:
            if not os.path.exists(save_plot):
                os.makedirs(save_plot)
            plt.savefig(save_plot + "loss")
        if bool_plot == True:
            plt.show()

    return (weights, x_t, target_y_t)




[docs]
def save_results_params(results_and_params, path: str):
    """
    Saves a dictionary containing n_qubits, indices, scaler, weights, inputs, and targets to the specified path

            Parameters:
                    results_and_params (dict): A dictionary containing n_qubits, indices, scaler, weights, inputs, and targets
                    path (str): path to which the dictionary will be saved as "dict"
    """
    if not os.path.exists(path):
        os.makedirs(path)
    with open(path + "dict", "wb") as fp:
        pickle.dump(results_and_params, fp)




[docs]
def import_circuit(circuit: str):
    if circuit == "MPS":
        from Circuits.MPS import initialize_MPS_circuit

        return initialize_MPS_circuit
    if circuit == "Ising":
        from Circuits.Ising import initialize_Ising_circuit

        return initialize_Ising_circuit
    else:
        raise ValueError(
            "Invalid circuit. Only currently supported circuits are 'MPS' and 'Ising': use one of these or add a circuit to the Circuits library."
        )