Source code for neuroptica.models

'''This module contains classes to implement Keras-style Models, which combine several NetworkLayers to simulate a full
optical neural network. Currently, only sequential models are supported, but more may be added in the future.'''

from typing import Dict, List

import numpy as np

from neuroptica.layers import NetworkLayer, OpticalMeshNetworkLayer


class BaseModel:
    '''Base class for all models'''

    def forward_pass(self, X: np.ndarray) -> np.ndarray:
        raise NotImplementedError

    def backward_pass(self, d_loss: np.ndarray) -> Dict[str, np.ndarray]:
        raise NotImplementedError


class Model(BaseModel):
    '''
    Functional model class similar to the Keras Model class, simulating an optical neural network with multiple layers
    '''

    def __init__(self):
        # TODO
        pass


class Sequential(BaseModel):
    '''Feed-forward model class similar to the Keras Sequential() model class'''

    def __init__(self, layers: List[NetworkLayer]):
        '''
        Initialize the model
        :param layers: list of NetworkLayers contained in the optical neural network
        '''
        self.layers = layers
        self.input_cache = {}
        self.output_cache = {}
        for i, layer in enumerate(self.layers):
            layer.__name__ = "Layer{}_{}".format(i, layer.__class__.__name__)
            self.input_cache[layer.__name__] = []
            self.output_cache[layer.__name__] = []

    def __repr__(self):
        return "<Sequential Model: {}>".format([layer.__name__ for layer in self.layers])

    def forward_pass(self, X: np.ndarray, cache_fields=False, use_partial_vectors=False) -> np.ndarray:
        '''
        Propagate an input field through the entire network
        :param X: input electric fields
        :param cache_fields: if true, fields will be cached internally
        :param use_partial_vectors: if true, use the partial vectors method to speed up transfer matrix computation
        :return: output electric fields (to be fed into a loss function)
        '''
        X_out = X
        for layer in self.layers:
            if isinstance(layer, OpticalMeshNetworkLayer):
                X_out = layer.forward_pass(X_out, cache_fields=cache_fields, use_partial_vectors=use_partial_vectors)
            else:
                X_out = layer.forward_pass(X_out)
        return X_out

    def backward_pass(self, d_loss: np.ndarray, cache_fields=False, use_partial_vectors=False) -> Dict[str, np.ndarray]:
        '''
        Compute the gradients for each layer by backpropagating the loss derivative d_loss through the network
        :param d_loss: derivative of the loss function with respect to the outputs
        :param cache_fields: if true, fields will be cached internally
        :param use_partial_vectors: if true, use the partial vectors method to speed up transfer matrix computation
        :return: dictionary of {layer: gradients}
        '''
        backprop_signal = d_loss
        gradients = {"output": d_loss}
        for layer in reversed(self.layers):
            if isinstance(layer, OpticalMeshNetworkLayer):
                backprop_signal = layer.backward_pass(backprop_signal, cache_fields=cache_fields,
                                                      use_partial_vectors=use_partial_vectors)
            else:
                backprop_signal = layer.backward_pass(backprop_signal)
            gradients[layer.__name__] = backprop_signal
        return gradients
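
A minimal usage sketch (not part of the module source): the IdentityLayer below is a stand-in written only to illustrate the forward_pass/backward_pass interface that Sequential drives; a real network would be built from the concrete layer classes provided in neuroptica.layers.

    import numpy as np

    from neuroptica.models import Sequential


    class IdentityLayer:
        '''Illustrative stand-in exposing the interface Sequential calls on each layer'''

        def forward_pass(self, X):
            return X  # pass the input fields through unchanged

        def backward_pass(self, delta):
            return delta  # the adjoint of the identity is the identity


    model = Sequential([IdentityLayer(), IdentityLayer()])
    print(model)  # <Sequential Model: ['Layer0_IdentityLayer', 'Layer1_IdentityLayer']>

    X = np.ones((4, 3), dtype=complex)       # example input fields
    Y = model.forward_pass(X)                # propagate through every layer in order
    d_loss = np.zeros_like(Y)                # placeholder derivative of the loss at the output
    gradients = model.backward_pass(d_loss)  # keys: 'output', 'Layer1_IdentityLayer', 'Layer0_IdentityLayer'

Because IdentityLayer is not an OpticalMeshNetworkLayer, Sequential calls its forward_pass and backward_pass without the cache_fields and use_partial_vectors arguments; mesh layers receive both flags as shown in the methods above.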