Source code for neuroptica.layers

'''The layers submodule contains functionality for implementing a logical "layer" in the simulated optical neural
network. The API for this module is based loosely on Keras.'''

import numpy as np

from neuroptica.component_layers import MZILayer, OpticalMesh, PhaseShifterLayer
from neuroptica.nonlinearities import Nonlinearity
from neuroptica.settings import NP_COMPLEX


[docs]class NetworkLayer:
    '''Represents a logical layer in a simulated optical neural network. A NetworkLayer is different from a
    ComponentLayer, but it may contain a ComponentLayer or an OpticalMesh to compute the forward and backward logic.'''

[docs]    def __init__(self, input_size: int, output_size: int, initializer=None):
        '''
        Initialize the NetworkLayer
        :param input_size: number of input ports
        :param output_size: number of output ports (usually the same as input_size, unless DropMask is used)
        :param initializer: optional initializer method (WIP)
        '''
        self.input_size = input_size
        self.output_size = output_size
        self.initializer = initializer
        self.input_prev: np.ndarray = None
        self.output_prev: np.ndarray = None

[docs]    def forward_pass(self, X: np.ndarray) -> np.ndarray:
        '''
        Compute the forward pass of input fields into the network layer
        :param X: input fields to the NetworkLayer
        :return: transformed output fields to feed into the next layer of the ONN
        '''
        raise NotImplementedError('forward_pass() must be overridden in child class!')

[docs]    def backward_pass(self, delta: np.ndarray) -> np.ndarray:
        '''
        Compute the backward (adjoint) pass, given a backward-propagating field shined into the layer from the outputs
        :param delta: backward-propagating field shining into the NetworkLayer outputs
        :return: transformed "input" fields to feed to the previous layer of the ONN
        '''
        raise NotImplementedError('backward_pass() must be overridden in child class!')


[docs]class DropMask(NetworkLayer):
    '''Drop specified ports entirely, reducing the size of the network for the next layer.'''

[docs]    def __init__(self, N: int, keep_ports=None, drop_ports=None):
        '''
        :param N: number of input ports to the DropMask layer
        :param keep_ports: list or iterable of which ports to keep (drop_ports must be None if keep_ports is specified)
        :param drop_ports: list or iterable of which ports to drop (keep_ports must be None if drop_ports is specified)
        '''
        if (keep_ports is not None and drop_ports is not None) or (keep_ports is None and drop_ports is None):
            raise ValueError("specify exactly one of keep_ports or drop_ports")
        if keep_ports:
            if isinstance(keep_ports, range):
                keep_ports = list(keep_ports)
            elif isinstance(keep_ports, int):
                keep_ports = [keep_ports]
            self.ports = keep_ports
        elif drop_ports:
            ports = list(range(N))
            for port in drop_ports:
                ports.remove(port)
            self.ports = ports
        super().__init__(N, len(self.ports))

[docs]    def forward_pass(self, X: np.ndarray):
        return X[self.ports]

[docs]    def backward_pass(self, delta: np.ndarray) -> np.ndarray:
        n_features, n_samples = delta.shape
        delta_back = np.zeros((self.input_size, n_samples), dtype=NP_COMPLEX)
        for i in range(n_features):
            delta_back[self.ports[i]] = delta[i]
        return delta_back


[docs]class StaticMatrix(NetworkLayer):
    '''Multiplies inputs by a static matrix (this is an aphysical layer)'''

    # TODO: make less hacky

[docs]    def __init__(self, matrix: np.ndarray):
        '''
        :param matrix: matrix to multiply inputs by
        '''
        N_out, N_in = matrix.shape
        super().__init__(N_in, N_out)
        self.matrix = matrix

[docs]    def forward_pass(self, X: np.ndarray):
        return self.matrix @ X

[docs]    def backward_pass(self, delta: np.ndarray):
        return self.matrix.T @ delta


[docs]class Activation(NetworkLayer):
    '''Represents a (nonlinear) activation layer. Note that in this layer, the usage of X and Z are reversed!
    (Z is input, X is output, input for next linear layer)
    '''

[docs]    def __init__(self, nonlinearity: Nonlinearity):
        '''
        Initialize the activation layer
        :param nonlinearity: a Nonlinearity instance
        '''
        super().__init__(nonlinearity.N, nonlinearity.N)
        self.nonlinearity = nonlinearity

[docs]    def forward_pass(self, Z: np.ndarray) -> np.ndarray:
        self.input_prev = Z
        self.output_prev = self.nonlinearity.forward_pass(Z)
        return self.output_prev

[docs]    def backward_pass(self, gamma: np.ndarray) -> np.ndarray:
        return self.nonlinearity.backward_pass(gamma, self.input_prev)


[docs]class OpticalMeshNetworkLayer(NetworkLayer):
    '''Base class for any network layer consisting of an optical mesh of phase shifters and MZIs'''

[docs]    def __init__(self, input_size: int, output_size: int, initializer=None):
        '''
        Initialize the OpticalMeshNetworkLayer
        :param input_size: number of input waveguides
        :param output_size: number of output waveguides
        :param initializer: optional initializer method (WIP)
        '''
        super().__init__(input_size, output_size, initializer=initializer)
        self.mesh: OpticalMesh = None

[docs]    def forward_pass(self, X: np.ndarray, cache_fields=False, use_partial_vectors=False) -> np.ndarray:
        raise NotImplementedError('forward_pass() must be overridden in child class!')

[docs]    def backward_pass(self, delta: np.ndarray, cache_fields=False, use_partial_vectors=False) -> np.ndarray:
        raise NotImplementedError('backward_pass() must be overridden in child class!')


[docs]class ClementsLayer(OpticalMeshNetworkLayer):
    '''Performs a unitary NxM operator with MZIs arranged in a Clements decomposition. If M=N then the layer can
    perform any arbitrary unitary operator
    '''

[docs]    def __init__(self, N: int, M=None, include_phase_shifter_layer=True, initializer=None):
        '''
        Initialize the ClementsLayer
        :param N: number of input and output waveguides
        :param M: number of MZI columns; equal to N by default
        :param include_phase_shifter_layer: if true, include a layer of single-mode phase shifters at the beginning of
        the mesh (required to implement arbitrary unitary)
        :param initializer: optional initializer method (WIP)
        '''
        super().__init__(N, N, initializer=initializer)

        layers = []
        if include_phase_shifter_layer:
            layers.append(PhaseShifterLayer(N))

        if M is None:
            M = N

        for layer_index in range(M):
            if N % 2 == 0:  # even number of waveguides
                if layer_index % 2 == 0:
                    layers.append(MZILayer.from_waveguide_indices(N, list(range(0, N))))
                else:
                    layers.append(MZILayer.from_waveguide_indices(N, list(range(1, N - 1))))
            else:  # odd number of waveguides
                if layer_index % 2 == 0:
                    layers.append(MZILayer.from_waveguide_indices(N, list(range(0, N - 1))))
                else:
                    layers.append(MZILayer.from_waveguide_indices(N, list(range(1, N))))

        self.mesh = OpticalMesh(N, layers)

[docs]    def forward_pass(self, X: np.ndarray, cache_fields=False, use_partial_vectors=False) -> np.ndarray:
        '''
        Compute the forward pass
        :param X: input electric fields
        :param cache_fields: if true, fields are cached
        :param use_partial_vectors: if true, use partial vector method to speed up transfer matrix computations
        :return: output fields for next ONN layer
        '''
        self.input_prev = X
        if cache_fields:
            self.mesh.forward_fields = self.mesh.compute_phase_shifter_fields(
                X, align="right", use_partial_vectors=use_partial_vectors)
            self.output_prev = np.copy(self.mesh.forward_fields[-1][-1])
        else:
            self.output_prev = np.dot(self.mesh.get_transfer_matrix(), X)

        return self.output_prev

[docs]    def backward_pass(self, delta: np.ndarray, cache_fields=False, use_partial_vectors=False) -> np.ndarray:
        '''
        Compute the backward pass
        :param delta: adjoint "output" electric fields backpropagated from the next ONN layer
        :param cache_fields: if true, fields are cached
        :param use_partial_vectors: if true, use partial vector method to speed up transfer matrix computations
        :return: adjoint "input" fields for previous ONN layer
        '''
        if cache_fields:
            self.mesh.adjoint_fields = self.mesh.compute_adjoint_phase_shifter_fields(
                delta, align="right", use_partial_vectors=use_partial_vectors)
            if isinstance(self.mesh.layers[0], PhaseShifterLayer):
                return np.dot(self.mesh.layers[0].get_transfer_matrix().T, self.mesh.adjoint_fields[-1][-1])
            else:
                raise ValueError("Field_store will not work in this case, please set to False")
        else:
            return np.dot(self.mesh.get_transfer_matrix().T, delta)


[docs]class ReckLayer(OpticalMeshNetworkLayer):
    '''Performs a unitary NxN operator with MZIs arranged in a Reck decomposition'''

[docs]    def __init__(self, N: int, include_phase_shifter_layer=True, initializer=None):
        '''
        Initialize the ReckLayer
        :param N: number of input and output waveguides
        :param include_phase_shifter_layer: if true, include a layer of single-mode phase shifters at the beginning of
        the mesh (required to implement arbitrary unitary)
        :param initializer: optional initializer method (WIP)
        '''
        super().__init__(N, N, initializer=initializer)

        layers = []
        if include_phase_shifter_layer:
            layers.append(PhaseShifterLayer(N))

        mzi_limits_upper = [i for i in range(1, N)] + [i for i in range(N - 2, 1 - 1, -1)]
        mzi_limits_lower = [(i + 1) % 2 for i in mzi_limits_upper]

        for start, end in zip(mzi_limits_lower, mzi_limits_upper):
            layers.append(MZILayer.from_waveguide_indices(N, list(range(start, end + 1))))

        self.mesh = OpticalMesh(N, layers)

[docs]    def forward_pass(self, X: np.ndarray) -> np.ndarray:
        self.input_prev = X
        self.output_prev = np.dot(self.mesh.get_transfer_matrix(), X)
        return self.output_prev

[docs]    def backward_pass(self, delta: np.ndarray) -> np.ndarray:
        return np.dot(self.mesh.get_transfer_matrix().T, delta)