# Source code for neurophox.ml.linear

from typing import Optional, Callable, List, Union

import numpy as np
import tensorflow as tf
import pickle

from ..config import TF_COMPLEX, NP_COMPLEX
from ..helpers import random_gaussian_batch
from ..tensorflow import MeshLayer, SVD


def complex_mse(y_true: tf.Tensor, y_pred: tf.Tensor):
    r"""
    Complex mean squared error, averaged over the real and imaginary parts.

    Args:
        y_true: The true labels, :math:`V \in \mathbb{C}^{B \times N}`
        y_pred: The predicted labels, :math:`\widehat{V} \in \mathbb{C}^{B \times N}`

    Returns:
        The mean of the real-part and imaginary-part mean squared errors.
        Assuming ``tf.losses.mse`` averages over the last axis (TODO confirm for the
        TensorFlow version in use), this is :math:`\boldsymbol{e} \in \mathbb{R}^B`
        with :math:`e_i = \frac{\|V_i - \widehat{V}_i\|^2}{2N}`.

    """
    # Evaluate the same real-valued MSE on each component of the complex tensors.
    real_part_error, imag_part_error = (
        tf.losses.mse(component(y_true), component(y_pred))
        for component in (tf.math.real, tf.math.imag)
    )
    # Halving averages the two component losses.
    return (real_part_error + imag_part_error) / 2


def normalized_fidelity(u: tf.Tensor, u_hat: tf.Tensor):
    r"""
    Squared, normalized Frobenius overlap between a target and an estimated matrix.

    Args:
        u: The true (target) unitary, :math:`U \in \mathrm{U}(N)`
        u_hat: The estimated unitary (not necessarily unitary), :math:`\widehat{U}`

    Returns:
        The normalized fidelity

        .. math::
            \frac{|\mathrm{tr}(\widehat{U}^\dagger U)|^2}
                 {\mathrm{tr}(\widehat{U}^\dagger \widehat{U}) \, \mathrm{tr}(U^\dagger U)},

        which is independent of the norm of :math:`\widehat{U}`. When both matrices are
        unitary this equals :math:`|\mathrm{tr}(\widehat{U}^\dagger U) / N|^2`.

    """

    def frobenius_inner(x: tf.Tensor, y: tf.Tensor):
        # tr(x^dagger y): the Frobenius inner product of two 2-D matrices.
        return tf.linalg.trace(tf.transpose(tf.math.conj(x)) @ y)

    overlap = frobenius_inner(u_hat, u)
    overlap_sq = tf.math.real(overlap) ** 2 + tf.math.imag(overlap) ** 2

    # Dividing by |tr(u_hat^dagger u_hat)|^2 (the previous denominator) makes the
    # result scale as 1/|c|^2 under u_hat -> c * u_hat. Using the product of the two
    # squared Frobenius norms cancels the scale of u_hat exactly, and yields the same
    # value as before whenever ||u_hat||_F^2 == ||u||_F^2 (e.g. both unitary).
    norm_product = tf.math.real(frobenius_inner(u_hat, u_hat)) * tf.math.real(frobenius_inner(u, u))
    return overlap_sq / norm_product


class LinearMultiModelRunner:
    """
    Complex mean square error linear optimization experiment that can run and track multiple model optimizations in parallel.

    Args:
        experiment_name: Name of the experiment
        layer_names: List of layer names
        layers: List of transformer layers
        optimizer: Optimizer for all layers or list (or tuple) of optimizers for each layer
        batch_size: Batch size for the optimization
        iterations_per_epoch: Iterations per epoch
        iterations_per_tb_update: Iterations per update of TensorBoard
        logdir: Logging directory for TensorBoard to track losses of each layer (default to `None` for no logging),
            e.g., ``/data/tensorboard/neurophox/``
        train_on_test: Use same training and testing set
        store_params: Store params during the training for visualization later

    Raises:
        ValueError: If `layer_names`, `layers` and the optimizers do not all have the same length.
    """
    def __init__(self, experiment_name: str, layer_names: List[str],
                 layers: List[MeshLayer], optimizer: Union[tf.keras.optimizers.Optimizer, List[tf.keras.optimizers.Optimizer]],
                 batch_size: int, iterations_per_epoch: int=50, iterations_per_tb_update: int=5,
                 logdir: Optional[str]=None, train_on_test: bool=False, store_params: bool=True):
        # Per-layer histories, keyed by layer name.
        self.losses = {name: [] for name in layer_names}
        self.results = {name: [] for name in layer_names}
        self.layer_names = layer_names
        self.layers = layers
        # A single optimizer instance is shared by every layer; a sequence is used as given.
        self.optimizers = optimizer if isinstance(optimizer, (list, tuple)) else [optimizer for _ in layer_names]
        if not (len(layer_names) == len(layers) and len(layers) == len(self.optimizers)):
            raise ValueError("layer_names, layers, and optimizers must all be the same length")
        self.batch_size = batch_size
        self.iters = 0
        self.iterations_per_epoch = iterations_per_epoch
        self.iterations_per_tb_update = iterations_per_tb_update
        self.experiment_name = experiment_name
        self.logdir = logdir
        self.train_on_test = train_on_test
        self.store_params = store_params
        if self.logdir:
            # One TensorBoard writer per layer, under <logdir>/<experiment_name>/<layer name>/.
            self.summary_writers = {name: tf.summary.create_file_writer(
                f'{self.logdir}/{experiment_name}/{name}/'
            ) for name in layer_names}

    def iterate(self, target_unitary: np.ndarray, cost_fn: Callable = complex_mse):
        """
        Run gradient update toward a target unitary :math:`U`.

        Every layer takes one optimizer step on the same batch. After the step, the loss of
        the layer's response to the identity against the target is appended to ``self.losses``.
        That loss is written to TensorBoard every `iterations_per_tb_update` iterations (when
        `logdir` is set), and a parameter snapshot is stored every `iterations_per_epoch`
        iterations (when `store_params` is set and the layer is not an `SVD`).

        Args:
            target_unitary: Target unitary, :math:`U`.
            cost_fn: Cost function for linear model (default to complex mean square error)

        """
        if self.train_on_test:
            # Train on the identity so the batch is the same as the evaluation set.
            x_train = tf.eye(self.layers[0].units, dtype=TF_COMPLEX)
            y_train = tf.convert_to_tensor(target_unitary, dtype=TF_COMPLEX)
        else:
            x_train, y_train = generate_keras_batch(self.layers[0].units, target_unitary, self.batch_size)

        # These depend only on the iteration, not on the layer, so compute them once.
        eval_target = tf.convert_to_tensor(target_unitary.astype(NP_COMPLEX))
        # Log on multiples of iterations_per_tb_update. The previous truthiness test on the
        # remainder logged on every iteration *except* those multiples.
        log_now = bool(self.logdir) and self.iters % self.iterations_per_tb_update == 0
        store_now = self.store_params and self.iters % self.iterations_per_epoch == 0

        for name, layer, optimizer in zip(self.layer_names, self.layers, self.optimizers):
            with tf.GradientTape() as tape:
                # NOTE: cost_fn is called as (prediction, target), the reverse of complex_mse's
                # (y_true, y_pred) parameter order. That is harmless for the symmetric default
                # and is kept so existing custom cost functions see the same arguments.
                loss = cost_fn(layer(x_train), y_train)
            grads = tape.gradient(loss, layer.trainable_variables)
            optimizer.apply_gradients(grads_and_vars=zip(grads, layer.trainable_variables))

            # One forward pass on the identity after the update, used for both the tracked
            # loss and the stored snapshot below.
            estimate = layer(tf.eye(layer.units, dtype=TF_COMPLEX))
            self.losses[name].append(tf.reduce_sum(cost_fn(estimate, eval_target)).numpy())

            if log_now:
                self.update_tensorboard(name)
            if store_now and not isinstance(layer, SVD):
                phases = layer.phases
                mask = layer.mesh.model.mask
                estimate_np = estimate.numpy()
                self.results[name].append({
                    "theta_list": phases.theta.param_list(mask),
                    "phi_list": phases.phi.param_list(mask),
                    "theta_checkerboard": phases.theta.checkerboard_arrangement,
                    "phi_checkerboard": phases.phi.checkerboard_arrangement,
                    "gamma": phases.gamma,
                    "estimate_mag": np.abs(estimate_np),
                    "error_mag": np.abs(estimate_np - target_unitary)
                })

        self.iters += 1

    def update_tensorboard(self, name: str):
        """
        Update TensorBoard variables.

        Writes the most recent loss of the named layer at step ``self.iters``. This uses
        ``self.summary_writers``, which is only created when `logdir` was provided.

        Args:
            name: Layer name corresponding to variables that are updated

        """
        with self.summary_writers[name].as_default():
            tf.summary.scalar(f'loss-{self.experiment_name}', self.losses[name][-1], step=self.iters)

    def run(self, num_epochs: int, target_unitary: np.ndarray, pbar: Optional[Callable]=None,
            cost_fn: Callable = complex_mse):
        """
        Run ``num_epochs * iterations_per_epoch`` calls to :code:`iterate`.

        Args:
            num_epochs: Number of epochs (defined in terms of `iterations_per_epoch`)
            target_unitary: Target unitary, :math:`U`.
            pbar: Progress bar (tqdm recommended)
            cost_fn: Cost function forwarded to every iteration (default to complex mean square error)

        """
        steps = range(num_epochs * self.iterations_per_epoch)
        for _ in (pbar(steps) if pbar else steps):
            self.iterate(target_unitary, cost_fn)

    def save(self, savepath: str):
        """
        Save results for the multi-model runner to pickle file.

        The file is written to ``<savepath>/<experiment_name>.p`` and holds a dictionary with
        the keys ``"losses"`` and ``"results"``.

        Args:
            savepath: Path to save results.
        """
        with open(f"{savepath}/{self.experiment_name}.p", "wb") as f:
            pickle.dump({"losses": self.losses, "results": self.results}, f)


def generate_keras_batch(units, target_unitary, batch_size):
    """
    Build one (input, target) training batch for fitting a linear layer to a target matrix.

    Args:
        units: Passed to `random_gaussian_batch` as `units` (presumably the input dimension -- confirm against helpers)
        target_unitary: Matrix that the sampled inputs are right-multiplied by to form the targets
        batch_size: Passed to `random_gaussian_batch` as `batch_size`

    Returns:
        A tuple ``(x, y)`` of tensors with dtype `TF_COMPLEX`, where ``y = x @ target_unitary``.
    """
    inputs = random_gaussian_batch(batch_size=batch_size, units=units)
    # Targets follow the row-vector convention: each sample is multiplied from the left.
    targets = inputs @ target_unitary
    input_tensor = tf.convert_to_tensor(inputs, dtype=TF_COMPLEX)
    target_tensor = tf.convert_to_tensor(targets, dtype=TF_COMPLEX)
    return input_tensor, target_tensor