NeuroRNN.py


import torch
import torch.nn as nn
import numpy as np


# There are two ways of initializing recurrent weight matrices:
# 1)  Pass in the recurrent dimensions:
#         model = RateModel(N_recurrent=N, ...)
#     In this case, do not pass in recurrent_weight.
#     The spectral radius of the recurrent weight matrix can optionally be passed as rho_recurrent
#
# 2)  Pass in the weight matrix itself:
#         model = RateModel(recurrent_weight=J, ...)
#     In this case, do not pass in N_recurrent. It will be inferred from the matrix.
#     rho_recurrent will be ignored in this case.
#
# The input and output weight matrices are defined similarly, except there is an option to have
# no input and/or no output layer by not passing anything in (keep N and weight as None)
# In this case, the input and/or output layer will be an identity function.
#
# Example:
#     model = RateModel(recurrent_weight=J, N_input=100, rho_input=0.5)
# creates a model with recurrent weight matrix J, a new random matrix for the
# 100-dimensional input, and no readout matrix (so the output is the hidden state)
#
# TO DO:
#    - Implement network types (or just layers) EchoR and EchoZ which feed output back into input. Requires Readout==True
#    - Implement multiple RNN layers (maybe in separate function?)
#    - Check to make sure initial state is consistent with z and r.
#    - Check that forward Euler actually makes sense wrt init condition. Maybe range(1,Nt) with init before that?
class RateModel(nn.Module):

    def __init__(self, recurrent, readin=None, readout=None, f='tanh', eta=1, rho_recurrent=1, rho_input=1, rho_output=1, bias_recurrent=True, bias_output=True, Network_Type='R'):
        super(RateModel, self).__init__()

        # Step size for RNN dynamics
        self.eta = eta

        self.Network_Type = Network_Type
        if Network_Type not in ('R','Z'):
            raise Exception("Network_Type must be 'R' or 'Z'.")

        # Bias True or False for each linear component.
        # Bias in input and recurrent would be redundant, so bias=False for input.
        self.bias_recurrent = bias_recurrent
        self.bias_output = bias_output

        # If recurrent is an int, then generate a matrix with that size.
        # If it's a matrix, use that matrix for the weights.
        if isinstance(recurrent, int):
            self.N_recurrent = recurrent
            self.rho_recurrent = rho_recurrent
            self.recurrent_layer = nn.Linear(self.N_recurrent, self.N_recurrent, bias=bias_recurrent)
            self.recurrent_layer.weight.data = rho_recurrent * torch.randn(self.N_recurrent, self.N_recurrent) / torch.sqrt(torch.tensor(self.N_recurrent))
        elif torch.is_tensor(recurrent) and len(recurrent.shape)==2:
            self.N_recurrent = recurrent.shape[0]
            self.rho_recurrent = None
            self.recurrent_layer = nn.Linear(self.N_recurrent, self.N_recurrent, bias=bias_recurrent)
            self.recurrent_layer.weight = nn.Parameter(recurrent)
        else:
            raise Exception('argument recurrent should be an int or a square, 2-dimensional tensor.')

        # Do the same for readin, except also allow readin==None, which means that there is no
        # readin layer, e.g., the readin layer is an identity function.
        if isinstance(readin, int):
            self.N_input = readin
            self.rho_input = rho_input
            self.input_layer = nn.Linear(self.N_input, self.N_recurrent, bias=False)
            self.input_layer.weight.data = rho_input * torch.randn(self.N_recurrent, self.N_input) / torch.sqrt(torch.tensor(self.N_input))
            self.readin = True
        elif torch.is_tensor(readin) and len(readin.shape)==2:
            self.N_input = readin.shape[1]
            self.rho_input = None
            self.input_layer = nn.Linear(self.N_input, self.N_recurrent, bias=False)
            self.input_layer.weight.data = readin
            self.readin = True
        elif (readin is None) or (readin is False):
            self.readin = False
            self.N_input = self.N_recurrent
            self.rho_input = None
            self.input_layer = nn.Identity()
        else:
            raise Exception('readin should be an int, a 2-dim tensor, False, or None')

        # Same as readin above.
        if isinstance(readout, int):
            self.N_output = readout
            self.rho_output = rho_output
            self.output_layer = nn.Linear(self.N_recurrent, self.N_output, bias=bias_output)
            self.output_layer.weight.data = rho_output * torch.randn(self.N_output, self.N_recurrent) / torch.sqrt(torch.tensor(self.N_output))
            self.Readout = True
        elif torch.is_tensor(readout) and len(readout.shape)==2:
            self.N_output = readout.shape[0]
            self.rho_output = None
            self.output_layer = nn.Linear(self.N_recurrent, self.N_output, bias=bias_output)
            self.output_layer.weight.data = readout
            self.Readout = True
        elif (readout is None) or (readout is False):
            self.Readout = False
            self.N_output = self.N_recurrent
            self.rho_output = None
            self.output_layer = nn.Identity()
        else:
            raise Exception('readout should be an int, a 2-dim tensor, False, or None')

        # # Same as readin above.
        # if (echo is True):
        #     self.rho_echo = rho_echo
        #     self.echo_layer = nn.Linear(self.N_output, self.N_recurrent, bias=bias_echo)
        #     self.echo_layer.weight.data = rho_echo * torch.randn(self.N_recurrent, self.N_output) / torch.sqrt(torch.tensor(self.N_output))
        #     self.echo = True
        # elif torch.is_tensor(echo) and len(echo.shape)==2:
        #     self.rho_echo = None
        #     self.echo_layer = nn.Linear(self.N_output, self.N_recurrent, bias=bias_echo)
        #     self.echo_layer.weight.data = echo
        #     self.echo = True
        # elif (echo is None) or (echo is False):
        #     self.echo = False
        #     self.rho_echo = None
        #     self.echo_layer = (lambda x: 0)
        # else:
        #     raise Exception('echo should be True, a 2-dim tensor, False, or None')


        # activation == fI curve, f, can be a string for relu, tanh, or identity
        # OR it can be any function
        if f == 'relu':
            self.f = torch.relu
        elif f == 'tanh':
            self.f = torch.tanh
        elif f == 'id':
            self.f = (lambda x: x)
        elif callable(f):
            self.f = f
        else:
            raise Exception("f should be 'tanh', 'relu', 'id', or a callable function.")

        # Initialize recurrent state
        self.hidden_state = None
        self.hidden_state_history = None


    # Forward pass.
    # If Nt==None then the second dimension of x is assumed to be time.
    # If Nt is an integer, then x is interpreted to be constant in time and Nt is the number of time steps.
    def forward(self, x, Nt = None, initial_state = 'zero', return_time_series = True, store_hidden_history = True):

        # Get batch size, device, and requires_grad
        batch_size = x.shape[0]
        this_device = x.device
        this_req_grad = self.recurrent_layer.weight.requires_grad

        # Check that last dim of input is correct
        if x.shape[-1]!=self.N_input:
            raise Exception('last dim of x should be N_input ='+str(self.N_input)+'but got'+str(x.shape[-1]))

        # If x is 3-dimensional then Nt should be None (or equal to second dim of x) and input is dynamical.
        # Otherwise, x should be 2-dimensional and Nt needs to be passed in as an int, and input is time-constant.
        if len(x.shape)==3 and ((Nt is None) or Nt==x.shape[1]) :
            Nt = x.shape[1]
            dynamical_input = True
        elif (Nt is not None) and len(x.shape)==2:
            dynamical_input = False
        else:
            raise Exception('x should be 3 dim (in which case Nt should be None) or x should be 2 dim in which case you need to pass Nt.')

        # If initial_state is 'zero' initialize to zeros
        # If initial_state is 'keep' then keep old initial state
        # If initial_state is a tensor, intialize to that state
        if initial_state == 'zero':
            self.hidden_state = torch.zeros(batch_size, self.N_recurrent, requires_grad=this_req_grad).to(this_device)
        elif initial_state == 'keep':
            if (not torch.is_tensor(self.hidden_state)) or (not (self.hidden_state.shape[0]==batch_size)):
                #print("initial_state = 'keep' but old state is not consistent type or shape. Using zero initial state instead.")
                self.hidden_state = torch.zeros(batch_size, self.N_recurrent, requires_grad=this_req_grad).to(this_device)
        elif torch.is_tensor(initial_state):
            self.hidden_state = initial_state
        else:
            raise Exception("initial_state should be 'zero', 'keep', or an initial state tensor.")
        self.hidden_state.to(this_device)

        # If we return time series, then initialize a variable for it.
        if return_time_series or store_hidden_history:
            hidden_state_history = torch.zeros(batch_size, Nt, self.N_recurrent).to(this_device)
        else:
            hidden_state_history = None

        # Rate type network
        if self.Network_Type == 'R':
            if dynamical_input:
                for i in range(Nt):
                    self.hidden_state = self.hidden_state + self.eta * (-self.hidden_state + self.f(self.recurrent_layer(self.hidden_state) + self.input_layer(x[:, i, :])))
                    if return_time_series or store_hidden_history:
                        hidden_state_history[:, i, :] = self.hidden_state
            else:
                JxX = self.input_layer(x)
                for i in range(Nt):
                    self.hidden_state = self.hidden_state + self.eta * (-self.hidden_state + self.f(self.recurrent_layer(self.hidden_state) + JxX))
                    if return_time_series or store_hidden_history:
                        hidden_state_history[:, i, :] = self.hidden_state

            if store_hidden_history:
                self.hidden_state_history = hidden_state_history
            else:
                self.hidden_state_history = None

            if return_time_series:
                return self.output_layer(hidden_state_history)
            else:
                return self.output_layer(self.hidden_state)


        # Z type network
        elif self.Network_Type == 'Z':
            if dynamical_input:
                for i in range(Nt):
                    self.hidden_state = self.hidden_state + self.eta * (-self.hidden_state + self.recurrent_layer(self.f(self.hidden_state)) + self.input_layer(x[:, i, :]))
                    if return_time_series or store_hidden_history:
                        hidden_state_history[:, i, :] = self.hidden_state
            else:
                JxX = self.input_layer(x)
                for i in range(Nt):
                    self.hidden_state = self.hidden_state + self.eta * (-self.hidden_state + self.recurrent_layer(self.f(self.hidden_state)) + JxX)
                    if return_time_series or store_hidden_history:
                        hidden_state_history[:, i, :] = self.hidden_state

            if store_hidden_history:
                self.hidden_state_history = hidden_state_history
            else:
                self.hidden_state_history = None

            if return_time_series:
                return self.output_layer(self.f(hidden_state_history))
            else:
                return self.output_layer(self.f(self.hidden_state))

        else:
            raise Exception("Network_Type must be 'R' or 'Z'.")


class Conv2dRateModel(nn.Module):

    def __init__(self, rec_channels, rec_kernel_size, in_channels=None, readin_kernel_size=None, readout_type = 'id', out_channels=None, readout_kernel_size=None,  f='tanh', eta=1,
                 bias_recurrent=False, bias_output=False, readin_padding='same', readin_stride=1, readout_padding='same', readout_stride=1, Network_Type='R'):
        super(Conv2dRateModel, self).__init__()

        # Step size for RNN dynamics
        self.eta = eta

        self.Network_Type = Network_Type
        if Network_Type not in ('R','Z'):
            raise Exception("Network_Type must be 'R' or 'Z'.")

        # Bias True or False for each linear component.
        # Bias in input and recurrent would be redundant, so bias=False for input.
        self.bias_recurrent = bias_recurrent
        self.bias_output = bias_output
        self.rec_channels = rec_channels

        # Build recurrent conv layer
        self.recurrent_layer = nn.Conv2d(rec_channels, rec_channels, rec_kernel_size, bias=bias_recurrent, padding = 'same')

        # If in_channels is None then the number of channels in the input should be rec_channels
        # and input is fed directly to the recurrent layer. Otherwise, we use a readin layer
        if in_channels is None:
            self.input_layer = nn.Identity()
            self.readin = False
            self.in_channels = rec_channels
        else:
            self.input_layer = nn.Conv2d(in_channels, rec_channels, readin_kernel_size, bias=False,
                                         padding=readin_padding, stride=readin_stride)
            self.readin = True
            self.in_channels = in_channels

        #  Define readout layer based on type of layer specified
        if readout_type == 'id':
            self.output_layer = nn.Identity()
            self.out_channels = rec_channels
            self.readout = 'id'
        elif readout_type == 'flatten':
            self.output_layer = nn.Flatten()
            self.out_channels = rec_channels
            self.readout = 'flatten'
        elif readout_type == 'conv':
            self.output_layer = nn.Conv2d(rec_channels, out_channels, readout_kernel_size, bias=bias_output,
                                         padding=readout_padding, stride=readout_stride)
            self.readout = 'conv'
            self.out_channels = out_channels
        elif readout_type == 'conv_flatten':
            self.output_layer = nn.Sequential(nn.Conv2d(rec_channels, out_channels, readout_kernel_size,
                                                        bias=bias_output,padding=readout_padding,stride=readout_stride),
                                              nn.Flatten())
            self.readout = 'conv_flatten'
            self.out_channels = out_channels
        elif readout_type == 'full':
            self.output_layer = nn.Sequential(nn.Flatten(),nn.LazyLinear(out_channels,bias=bias_output))
            self.readout = 'full'
            self.out_channels = out_channels
        else:
            raise Exception("readout_type should be 'id', 'flatten', 'conv', 'conv_flatten', or 'full'")

        # activation == fI curve, f, can be a string for relu, tanh, or identity
        # OR it can be any function
        if f == 'relu':
            self.f = torch.relu
        elif f == 'tanh':
            self.f = torch.tanh
        elif f == 'id':
            self.f = (lambda x: x)
        elif callable(f):
            self.f = f
        else:
            raise Exception("f should be 'tanh', 'relu', 'id', or a callable function.")

        # Initialize recurrent state
        self.hidden_state = None
        self.hidden_state_history = None


    # Forward pass.
    # input, x, should be (batch_size)x(in_channels)x(Nt)x(width)x(height)
    # where Nt is number of time steps. In this case, Nt will be inferred from x and
    # should not be passed in.
    # OR if x is constant in time, it should be (batch_size)x(in_channels)x(width)x(height)
    # and you must pass in Nt.
    def forward(self, x, Nt = None, initial_state = 'zero', return_time_series = True, store_hidden_history = True):

        # Get batch size, device, and requires_grad
        batch_size = x.shape[0]
        this_device = x.device
        this_req_grad = self.recurrent_layer.weight.requires_grad

        # Check that last dim of input is correct
        if x.shape[1]!=self.in_channels:
            raise Exception(
                'x should have' + str(self.in_channels) + 'channels, but got' + str(x.shape[1]))

        # If x is 4-dimensional then Nt should be None (or equal to 3rd dim of x) and input is dynamical.
        # Otherwise, x should be 3-dimensional and Nt needs to be passed in as an int, and input is time-constant.
        if len(x.shape)==5 and ((Nt is None) or Nt==x.shape[2]) :
            Nt = x.shape[2]
            dynamical_input = True
        elif (Nt is not None) and len(x.shape)==4:
            dynamical_input = False
        else:
            raise Exception('x should be 5 dim (in which case Nt should be None) or x should be 4 dim in which case you need to pass Nt.')

        # If initial_state is 'zero' initialize to zeros
        # If initial_state is 'keep' then keep old initial state
        # If initial_state is a tensor, intialize to that state
        if initial_state == 'zero':
            if dynamical_input:
                self.hidden_state = torch.zeros_like(self.input_layer(x[:,:,0,:,:]), requires_grad=this_req_grad).to(this_device)
            else:
                self.hidden_state = torch.zeros_like(self.input_layer(x), requires_grad=this_req_grad).to(this_device)
        elif initial_state == 'keep':
            if (not torch.is_tensor(self.hidden_state)) or (not (self.hidden_state.shape[0]==batch_size)):
                #print("initial_state = 'keep' but old state is not consistent type or shape. Using zero initial state instead.")
                self.hidden_state = torch.zeros(batch_size, self.N_recurrent, requires_grad=this_req_grad).to(this_device)
        elif torch.is_tensor(initial_state):
            self.hidden_state = initial_state
        else:
            raise Exception("initial_state should be 'zero', 'keep', or an initial state tensor.")
        self.hidden_state.to(this_device)

        # If we return time series, then initialize a variable for it.
        if return_time_series or store_hidden_history:
            hidden_state_history = torch.zeros(batch_size, self.rec_channels, Nt, self.hidden_state.shape[2], self.hidden_state.shape[3]).to(this_device)
        else:
            hidden_state_history = None

        # Rate type network
        if self.Network_Type == 'R':
            if dynamical_input:
                for i in range(Nt):
                    self.hidden_state = self.hidden_state + self.eta * (-self.hidden_state + self.f(self.recurrent_layer(self.hidden_state) + self.input_layer(x[:, :, i, :, :])))
                    if return_time_series or store_hidden_history:
                        hidden_state_history[:, :, i, :, :] = self.hidden_state
            else:
                JxX = self.input_layer(x)
                for i in range(Nt):
                    self.hidden_state = self.hidden_state + self.eta * (-self.hidden_state + self.f(self.recurrent_layer(self.hidden_state) + JxX))
                    if return_time_series or store_hidden_history:
                        hidden_state_history[:, :, i, :, :] = self.hidden_state

            if store_hidden_history:
                self.hidden_state_history = hidden_state_history
            else:
                self.hidden_state_history = None

            if return_time_series:
                return self.output_layer(hidden_state_history)
            else:
                return self.output_layer(self.hidden_state)


        # Z type network
        elif self.Network_Type == 'Z':
            if dynamical_input:
                for i in range(Nt):
                    self.hidden_state = self.hidden_state + self.eta * (-self.hidden_state + self.recurrent_layer(self.f(self.hidden_state)) + self.input_layer(x[:, :, i, :, :]))
                    if return_time_series or store_hidden_history:
                        hidden_state_history[:, :, i, :, :] = self.hidden_state
            else:
                JxX = self.input_layer(x)
                for i in range(Nt):
                    self.hidden_state = self.hidden_state + self.eta * (-self.hidden_state + self.recurrent_layer(self.f(self.hidden_state)) + JxX)
                    if return_time_series or store_hidden_history:
                        hidden_state_history[:, :, i, :, :] = self.hidden_state

            if store_hidden_history:
                self.hidden_state_history = hidden_state_history
            else:
                self.hidden_state_history = None

            if return_time_series:
                return self.output_layer(self.f(hidden_state_history))
            else:
                return self.output_layer(self.f(self.hidden_state))


        else:
            raise Exception("Network_Type must be 'R' or 'Z'.")

    # def GetLocalInput(self, history=False):
    #     if history:
    #         h = self.hidden_state_history
    #     else:
    #         h = self.hidden_state
    #
    #     if self.Network_Type == 'R':
    #         return self.recurrent_layer(h)
    #     else:
    #         return self.recurrent_layer(self.f(h))
    #
    # def GetTotalInput(self, history=False):


# Spiking neural net model
class SpikingModel(nn.Module):

    def __init__(self, recurrent, tausyn, readin=None, NeuronModel='EIF', NeuronParams={}):
        super(SpikingModel, self).__init__()

        if torch.is_tensor(recurrent) and len(recurrent.shape) == 2:
            self.N_recurrent = recurrent.shape[0]
            self.recurrent_layer = nn.Linear(self.N_recurrent, self.N_recurrent, bias=False)
            self.recurrent_layer.weight = nn.Parameter(recurrent)
        else:
            raise Exception('recurrent should be an NxN tensor')


        if torch.is_tensor(readin) and len(readin.shape)==2:
            self.Readin = True
            self.N_input = readin.shape[1]
            self.input_layer = nn.Linear(self.N_input, self.N_recurrent, bias=False)
            self.input_layer.weight.data = readin
        elif (readin is None) or (readin is False):
            self.Readin = False
            self.N_input = None
            self.input_layer = nn.Identity()
        else:
            raise Exception('readin should be a 2-dim tensor, False, or None')

        # Synaptic time constants
        self.tausyn = tausyn

        # Neuron parameters
        if NeuronModel == 'EIF':
            # Get each param from NeuronParams or use default if key isn't in NeuronParams
            self.taum = NeuronParams.get('taum',10)
            self.EL = NeuronParams.get('EL',-72)
            self.Vth = NeuronParams.get('Vth',0)
            self.Vre = NeuronParams.get('Vre',-72)
            self.VT = NeuronParams.get('VT',-55)
            self.DT = NeuronParams.get('DT',1)
            self.Vlb = NeuronParams.get('Vlb',-85)
            self.f = (lambda V,I: ((-(V-self.EL)+self.DT*torch.exp((V-self.VT)/self.DT)+I)/self.taum))

        elif NeuronModel == 'LIF':
            self.taum = NeuronParams.get('taum',10)
            self.EL = NeuronParams.get('EL',-72)
            self.Vth = NeuronParams.get('Vth',-55)
            self.Vre = NeuronParams.get('Vre',-72)
            self.Vlb = NeuronParams.get('Vlb', -85)
            self.f = (lambda V,I: ((-(V - self.EL)+I)/self.taum))
        elif callable(NeuronModel):
            self.Vth = NeuronParams['Vth']
            self.Vre = NeuronParams['Vre']
            self.Vlb = NeuronParams['Vlb']
            self.f = NeuronModel
        else:
            raise Exception("NeuronModel should be 'EIF', 'LIF', or a function of two variables (V,I).")

        # Initialize state, which contains V and zsyn
        self.V = None
        self.Y = None


    # Forward pass.
    # If Nt==None then the second dimension of x is assumed to be time.
    # If Nt is an integer, then x is interpreted to be constant in time and Nt is the number of time steps.
    def forward(self, x0, dt, x=None, T=None, initial_V='random', initial_Y='zero', dtRecord = None, Tburn = 0, VIRecord = []):

        # Get batch size, device, and requires_grad
        batch_size = x0.shape[0]
        this_device = x0.device
        this_req_grad = self.recurrent_layer.weight.requires_grad

        # Make sure x0 is correct shape
        if len(x0.shape)!=2 or x0.shape[1]!=self.N_recurrent:
            raise Exception('x0 should be (batch_size)x(N_recurent).')

        # Check shape and type of x. Set Nt, T values accordingly
        if torch.is_tensor(x) and len(x.shape)==3:
            dynamical_input = True
            Nt = x.shape[1]
            T = Nt*dt
            if x.shape[0]!=x0.shape[0]:
                raise Exception('First dim of x and x0 should be the same (batch_size).')
            if self.Readin:
                if x.shape[2]!=self.N_input:
                    raise Exception('When x is 3-dim and readin is True, last dim of x should be N_input.')
            else:
                if x.shape[2]!=self.N_recurrent:
                    raise Exception('When x is 3-dim and readin is False, last dim of x should be N_recurrent.')
        elif torch.is_tensor(x) and len(x.shape)==2:
            dynamical_input = False
            if T is None:
                raise Exception('If x is not dynamical (2-dim) then T cannot be None.')
            Nt = int(T/dt)
            if x.shape[0]!=x0.shape[0]:
                raise Exception('First dim of x and x0 should be the same (batch_size).')
            if self.Readin:
                if x.shape[1]!=self.N_input:
                    raise Exception('When readin is True, last dim of x should be N_input.')
            else:
                if x.shape[1]!=self.N_recurrent:
                    raise Exception('When readin is False, last dim of x should be N_recurrent.')
        elif x is None:
            dynamical_input = False
            if T is None:
                raise Exception('If x is None then T cannot be None.')
            else:
                Nt = int(T/dt)
            # if self.readin:
            #     x = torch.zeros(batch_size,self.N_input)
            # else:
            #     x = torch.zeros(batch_size,self.N_recurrent)
        else:
            raise Exception('x should be a 3-dim tensor, 2-dim tensor, or None.')

        # If initial_V is 'zero' initialize to Vre (not actually zero)
        # If initial_V is 'rand' initialize to uniform dist from Vre to Vth
        # If initial_state is 'keep' then keep old initial state
        # If initial_state is a tensor, intialize to that state
        if initial_V == 'zero':
            self.V = torch.zeros(batch_size, self.N_recurrent, requires_grad=this_req_grad).to(this_device)+self.Vre
        elif initial_V == 'random':
            if hasattr(self, 'VT'):
                self.V = (self.VT -self.Vre)*torch.rand(batch_size,self.N_recurrent, requires_grad=this_req_grad).to(this_device) + self.Vre
            else:
                self.V = (self.Vth-self.Vre)*torch.rand(batch_size, self.N_recurrent, requires_grad=this_req_grad).to(this_device)+self.Vre
        elif initial_V == 'keep':
            if (not torch.is_tensor(self.V)) or (self.V.shape[0] != batch_size):
                print("initial_V was 'keep' but V was wrong type or shape. Using random init instead")
                self.V = (self.Vth-self.Vre)*torch.rand(batch_size, self.N_recurrent, requires_grad=this_req_grad).to(this_device)+self.Vre
        elif torch.is_tensor(initial_V) and initial_V.shape==(batch_size,self.N_recurrent):
            self.V = initial_V
        else:
            raise Exception("initial_V should be 'zero', 'keep', or an initial tensor of shape (batch_size,N_recurrent)="+str((batch_size,self.N_recurrent)))

        # Same as initial_V except no random option
        if initial_Y == 'zero':
            self.Y = torch.zeros(batch_size, self.N_recurrent).to(this_device)
        elif initial_Y == 'keep':
            if (not torch.is_tensor(self.Y)) or (self.Y.shape[0] != batch_size):
                print("initial_Y was 'keep' but Y was wrong type or shape. Using zero init instead")
                self.Y = torch.zeros(batch_size, self.N_recurrent).to(this_device)
        elif torch.is_tensor(initial_Y) and initial_Y.shape==(batch_size,self.N_recurrent):
            self.Y = initial_Y
        else:
            raise Exception("initial_Y should be 'zero', 'keep', or an initial tensor of shape (batch_size,N_recurrent)="+str((batch_size,self.N_recurrent)))
        self.Y.requires_grad = this_req_grad
        self.Y.to(this_device)

        # Initialize dictionary that will store results of sim
        SimResults = {}
        SimResults['r'] = torch.zeros(batch_size, self.N_recurrent, requires_grad=this_req_grad).to(this_device)
        if dtRecord is None:
            RecordSandY = False
            SimResults['S'] = None
            SimResults['Y'] = None
        else:
            RecordSandY = True
            NdtRecord = int(dtRecord/dt)
            if NdtRecord<=0 or NdtRecord>Nt:
                raise Exception('dtRecord should be between dt and T respectively.')
            NtRecord = int(T/dtRecord)
            SimResults['S'] = torch.zeros(batch_size, NtRecord, self.N_recurrent, requires_grad=this_req_grad).to(this_device)
            SimResults['Y'] = torch.zeros(batch_size, NtRecord, self.N_recurrent, requires_grad=this_req_grad).to(this_device)

        if isinstance(VIRecord,list) and len(VIRecord)>0:
            RecordV = True
            NVRecord = len(VIRecord)
            SimResults['V'] = torch.zeros(batch_size, Nt, NVRecord, requires_grad=this_req_grad).to(this_device)
        elif (VIRecord is None) or (VIRecord == []):
            RecordV = False
            SimResults['V'] = None

        # Now start the acutal forward pass
        S = torch.zeros(batch_size, self.N_recurrent, requires_grad=this_req_grad).to(this_device)

        if (x is not None) and (not dynamical_input):
            JxX = self.input_layer(x)
        for i in range(Nt):
            Z = self.recurrent_layer(self.Y)+x0
            if x is not None:
                if dynamical_input:
                    Z = Z + self.input_layer(x[:,i,:])
                else:
                    Z = Z + JxX
            self.V = torch.clamp(self.V + dt*self.f(self.V, Z), min=self.Vlb)


            mask = (self.V>=self.Vth)
            self.V[mask] = self.Vre
            S = mask/dt

            if i*dt>=Tburn:
                SimResults['r'] += S


            self.Y = self.Y + (dt/self.tausyn)*(-self.Y+S)


            if RecordV:
                SimResults['V'][:,i,:] = self.V[:,VIRecord]+dt*S[:,VIRecord]*(self.Vth-self.V[:,VIRecord])

            if RecordSandY:
                irecord = int(i*dt/dtRecord)
                SimResults['S'][:, irecord, :] += S
                SimResults['Y'][:, irecord, :] += self.Y


        SimResults['r'] *= (dt/(T-Tburn))

        if RecordSandY:
            SimResults['S'] *= (dt/NdtRecord)
            SimResults['Y'] *= (1/NdtRecord)

        return SimResults


# Spiking neural net model with spike-based external input
class SpikingModelrx(nn.Module):

    def __init__(self, recurrent, tausyn, readin=None, taux=None, NeuronModel='EIF', NeuronParams={}):
        super(SpikingModelrx, self).__init__()

        if torch.is_tensor(recurrent) and len(recurrent.shape) == 2:
            self.N_recurrent = recurrent.shape[0]
            self.recurrent_layer = nn.Linear(self.N_recurrent, self.N_recurrent, bias=False)
            self.recurrent_layer.weight = nn.Parameter(recurrent)
        else:
            raise Exception('recurrent should be an NxN tensor')

        if torch.is_tensor(readin) and len(readin.shape)==2:
            self.Readin = True
            self.N_input = readin.shape[1]
            self.input_layer = nn.Linear(self.N_input, self.N_recurrent, bias=False)
            self.input_layer.weight.data = readin
            if taux is None:
                raise Exception('If readin is passed in, then taux should also be passed in.')
            self.taux = taux
        elif (readin is None) or (readin is False):
            self.Readin = False
            self.N_input = None
            self.taux = None
        else:
            raise Exception('readin should be a 2-dim tensor, False, or None')

        # Synaptic time constants
        self.tausyn = tausyn

        # Neuron parameters
        if NeuronModel == 'EIF':
            # Get each param from NeuronParams or use default if key isn't in NeuronParams
            self.taum = NeuronParams.get('taum',10)
            self.EL = NeuronParams.get('EL',-72)
            self.Vth = NeuronParams.get('Vth',0)
            self.Vre = NeuronParams.get('Vre',-72)
            self.VT = NeuronParams.get('VT',-55)
            self.DT = NeuronParams.get('DT',1)
            self.Vlb = NeuronParams.get('Vlb',-85)
            self.f = (lambda V,I: ((-(V-self.EL)+self.DT*torch.exp((V-self.VT)/self.DT)+I)/self.taum))

        elif NeuronModel == 'LIF':
            self.taum = NeuronParams.get('taum',10)
            self.EL = NeuronParams.get('EL',-72)
            self.Vth = NeuronParams.get('Vth',-55)
            self.Vre = NeuronParams.get('Vre',-72)
            self.Vlb = NeuronParams.get('Vlb', -85)
            self.f = (lambda V,I: ((-(V - self.EL)+I)/self.taum))
        elif callable(NeuronModel):
            self.Vth = NeuronParams['Vth']
            self.Vre = NeuronParams['Vre']
            self.Vlb = NeuronParams['Vlb']
            self.f = NeuronModel
        else:
            raise Exception("NeuronModel should be 'EIF', 'LIF', or a function of two variables (V,I).")

        # Initialize state, which contains V and zsyn
        self.V = None
        self.Y = None
        self.Yx = None


    # Forward pass.
    # If Nt==None then the second dimension of x is assumed to be time.
    # If Nt is an integer, then x is interpreted to be constant in time and Nt is the number of time steps.
    def forward(self, x0, dt, T, rx=None, initial_V='random', initial_Y='zero', dtRecord = None, Tburn = 0, VIRecord = []):


        # Get batch size, device, and requires_grad
        batch_size = x0.shape[0]
        this_device = x0.device
        this_req_grad = self.recurrent_layer.weight.requires_grad
        Nt = int(T / dt)

        # Make sure x0 is correct shape
        if len(x0.shape)!=2 or x0.shape[1]!=self.N_recurrent:
            raise Exception('x0 should be (batch_size)x(N_recurent).')

        # Check shape and type of rx.

        if torch.is_tensor(rx) and len(rx.shape)==2:
            batched_rx = True
            #Nx = rx.shape[1]
            if rx.shape[1]!=self.N_input:
                raise Exception('Second dimension of rx should be Nx=N_input='+str(self.N_input))
            if not self.Readin:
                raise Exception('Readin should be True if rx is passed in')
            if rx.shape[0]!=batch_size:
                raise Exception('When rx is batched, first dims of x0 and rx should match.')
        elif torch.is_tensor(rx) and len(rx.shape)==1:
            batched_rx = False
            if rx.shape[0] != self.N_input:
                raise Exception('First dimension of rx should be Nx=N_input=' + str(self.N_input))
            if not self.Readin:
                raise Exception('Readin should be True if rx is passed in')
        elif rx is None:
            if self.Readin:
                print('Readin is True, but no input rates were passed.')
        else:
            raise Exception('rx should be a 2-dim tensor, 1-dim tensor, or None.')

        # If initial_V is 'zero' initialize to Vre (not actually zero)
        # If initial_V is 'rand' initialize to uniform dist from Vre to Vth
        # If initial_state is 'keep' then keep old initial state
        # If initial_state is a tensor, intialize to that state
        if initial_V == 'zero':
            self.V = torch.zeros(batch_size, self.N_recurrent, requires_grad=this_req_grad).to(this_device)+self.Vre
        elif initial_V == 'random':
            if hasattr(self, 'VT'):
                self.V = (self.VT -self.Vre)*torch.rand(batch_size,self.N_recurrent, requires_grad=this_req_grad).to(this_device) + self.Vre
            else:
                self.V = (self.Vth-self.Vre)*torch.rand(batch_size, self.N_recurrent, requires_grad=this_req_grad).to(this_device)+self.Vre
        elif initial_V == 'keep':
            if (not torch.is_tensor(self.V)) or (self.V.shape[0] != batch_size):
                print("initial_V was 'keep' but V was wrong type or shape. Using random init instead")
                self.V = (self.Vth-self.Vre)*torch.rand(batch_size, self.N_recurrent, requires_grad=this_req_grad).to(this_device)+self.Vre
        elif torch.is_tensor(initial_V) and initial_V.shape==(batch_size,self.N_recurrent):
            self.V = initial_V
        else:
            raise Exception("initial_V should be 'zero', 'keep', or an initial tensor of shape (batch_size,N_recurrent)="+str((batch_size,self.N_recurrent)))

        # Same as initial_V except no random option
        if initial_Y == 'zero':
            self.Y = torch.zeros(batch_size, self.N_recurrent).to(this_device)
            if self.Readin:
                self.Yx = torch.zeros(batch_size, self.N_input).to(this_device)
        elif initial_Y == 'keep':
            if (not torch.is_tensor(self.Y)) or (self.Y.shape[0] != batch_size):
                print("initial_Y was 'keep' but Y was wrong type or shape. Using zero init instead")
                self.Y = torch.zeros(batch_size, self.N_recurrent).to(this_device)
            if self.Readin:
                if (not torch.is_tensor(self.Yx)) or (self.Yx.shape[0] != batch_size):
                    print("initial_Y was 'keep' but Yx was wrong type or shape. Using zero init instead")
                    self.Yx = torch.zeros(batch_size, self.N_input).to(this_device)

        elif torch.is_tensor(initial_Y) and initial_Y.shape==(batch_size,self.N_recurrent):
            self.Y = initial_Y
            if self.Readin:
                self.Yx = torch.zeros(batch_size, self.N_input).to(this_device)
        else:
            raise Exception("initial_Y should be 'zero', 'keep', or an initial tensor of shape (batch_size,N_recurrent)="+str((batch_size,self.N_recurrent)))
        self.Y.requires_grad = this_req_grad
        self.Y.to(this_device)
        if self.Readin:
            self.Yx.requires_grad = this_req_grad
            self.Yx.to(this_device)

        # Initialize dictionary that will store results of sim
        SimResults = {}
        SimResults['r'] = torch.zeros(batch_size, self.N_recurrent, requires_grad=this_req_grad).to(this_device)
        if dtRecord is None:
            RecordSandY = False
            SimResults['S'] = None
            SimResults['Y'] = None
        else:
            RecordSandY = True
            NdtRecord = int(dtRecord/dt)
            if NdtRecord<=0 or NdtRecord>Nt:
                raise Exception('dtRecord should be between dt and T respectively.')
            NtRecord = int(T/dtRecord)
            SimResults['S'] = torch.zeros(batch_size, NtRecord, self.N_recurrent, requires_grad=this_req_grad).to(this_device)
            SimResults['Y'] = torch.zeros(batch_size, NtRecord, self.N_recurrent, requires_grad=this_req_grad).to(this_device)

        if isinstance(VIRecord,list) and len(VIRecord)>0:
            RecordV = True
            NVRecord = len(VIRecord)
            SimResults['V'] = torch.zeros(batch_size, Nt, NVRecord, requires_grad=this_req_grad).to(this_device)
        elif (VIRecord is None) or (VIRecord == []):
            RecordV = False
            SimResults['V'] = None

        # Now start the acutal forward pass
        S = torch.zeros(batch_size, self.N_recurrent, requires_grad=this_req_grad).to(this_device)

        for i in range(Nt):
            Z = self.recurrent_layer(self.Y)+x0
            if self.Readin:
                Z = Z + self.input_layer(self.Yx)

            # if x is not None:
            #     if dynamical_input:
            #         Z = Z + self.input_layer(x[:,i,:])
            #     else:
            #         Z = Z + JxX

            self.V = torch.clamp(self.V + dt*self.f(self.V, Z), min=self.Vlb)

            mask = (self.V>=self.Vth)
            self.V[mask] = self.Vre
            S = mask/dt

            self.Y = self.Y + (dt/self.tausyn)*(-self.Y+S)
            if self.Readin:
                Sx = torch.bernoulli(dt*rx.expand(batch_size,self.N_input))/dt
                self.Yx = self.Yx + (dt / self.taux)*(-self.Yx+Sx)

            if i*dt>=Tburn:
                SimResults['r'] += S

            if RecordV:
                SimResults['V'][:,i,:] = self.V[:,VIRecord]+dt*S[:,VIRecord]*(self.Vth-self.V[:,VIRecord])

            if RecordSandY:
                irecord = int(i*dt/dtRecord)
                SimResults['S'][:, irecord, :] += S
                SimResults['Y'][:, irecord, :] += self.Y

        SimResults['r'] *= (dt/(T-Tburn))

        if RecordSandY:
            SimResults['S'] *= (dt/NdtRecord)
            SimResults['Y'] *= (1/NdtRecord)

        return SimResults