import torch
import torch.nn as nn
import numpy as np
import matplotlib.pyplot as plt


import matplotlib


matplotlib.rcParams['figure.figsize'] = [15, 10]


torch.set_default_dtype(torch.float64)


class Mu_Terminal_Layer(nn.Module):
    """Output layer with element-wise positive weights and a sigmoid activation.

    The stored ``weights`` are exponentiated inside ``forward``, so the
    effective weight matrix is strictly positive.

    Args:
        n_in: number of input features.
        n_out: number of output features.
    """
    def __init__(self,n_in,n_out):
        super().__init__()
        self.n_in=n_in
        self.n_out=n_out
        # raw weights ~ U(-5,-4), i.e. effective weights between e^(-5) and e^(-4)
        raw_w=torch.empty((n_out,n_in),dtype=torch.float64)
        self.weights=nn.Parameter(nn.init.uniform_(raw_w,-5,-4))
        # bias ~ U(-lim,lim)
        lim=0.01
        raw_b=torch.empty(n_out,dtype=torch.float64)
        self.bias=nn.Parameter(nn.init.uniform_(raw_b,-lim,lim))

    def forward(self,a_prev):
        """Return sigmoid(a_prev @ exp(W)^T + b) for a 2-D ``a_prev``."""
        positive_w=torch.exp(self.weights)
        pre_activation=torch.mm(a_prev,positive_w.t())+self.bias
        return torch.sigmoid(pre_activation)


class Mu_Generic_Layer(nn.Module):
    """Hidden layer with element-wise positive weights and a cubic activation.

    The stored ``weights`` are exponentiated inside ``forward``, so the
    effective weight matrix is strictly positive.

    Args:
        n_in: number of input features.
        n_out: number of output features.
    """
    def __init__(self,n_in,n_out):
        super().__init__()
        self.n_in,self.n_out=n_in,n_out
        # raw weights ~ U(-5,-4), i.e. effective weights between e^(-5) and e^(-4)
        raw_w=torch.empty((n_out,n_in),dtype=torch.float64)
        self.weights=nn.Parameter(nn.init.uniform_(raw_w,-5,-4))
        # bias ~ U(-lim,lim)
        lim=0.01
        raw_b=torch.empty(n_out,dtype=torch.float64)
        self.bias=nn.Parameter(nn.init.uniform_(raw_b,-lim,lim))

    def forward(self,a_prev):
        """Return (a_prev @ exp(W)^T + b)**3 for a 2-D ``a_prev``."""
        pre_activation=torch.mm(a_prev,torch.exp(self.weights).t())+self.bias
        # cubic activation
        return pre_activation**3


# Inspect the freshly initialised parameters (weights, then bias) of a
# 1-input / 5-output generic layer.
for x in Mu_Generic_Layer(1,5).parameters():
    print(x)

Parameter containing:
tensor([[-4.3745],
        [-4.8901],
        [-4.6499],
        [-4.0437],
        [-4.4297]], requires_grad=True)
Parameter containing:
tensor([-0.0010, -0.0071, -0.0068,  0.0079, -0.0097], requires_grad=True)


class Initial_Law_Model(nn.Module):
    """Product of one-dimensional sub-networks, one per input column.

    Row ``k`` of ``e_sig`` lists the layer widths of the sub-network applied
    to input column ``k``: consecutive widths define ``Mu_Generic_Layer``s and
    a final ``Mu_Terminal_Layer`` maps the last width to a single output.
    The model output is the product of the sub-network outputs.

    Args:
        e_sig: 2-D array-like of layer widths (a numpy array or nested
            lists).  The number of sub-networks is taken from the sum of the
            first column -- this presumably assumes every row starts with
            width 1; confirm before using other layouts.
    """
    def __init__(self,e_sig):
        super(Initial_Law_Model, self).__init__()
        # Always work from the converted array so nested lists are accepted too.
        self.e_sig=np.array(e_sig)
        # Column sums of the width table.
        self.E_sig=[int(np.sum(self.e_sig[:,i])) for i in range(self.e_sig.shape[-1])]
        self.gen_layers=[]
        self.term_layers=[]
        for k in range(0,self.E_sig[0]):
            # Plain Python ints keep the layer sizes independent of numpy scalar types.
            layer_list=[int(width) for width in self.e_sig[k,:]]
            for l in range(1,len(layer_list)):
                self.gen_layers.append(['('+str(k)+','+str(l)+')',
                                        Mu_Generic_Layer(layer_list[l-1],layer_list[l])])
            self.term_layers.append([str(k),Mu_Terminal_Layer(layer_list[-1],1)])
        # ModuleDicts register the layers so their parameters are visible to optimizers.
        self.term_layers_mod=nn.ModuleDict(self.term_layers)
        self.gen_layers_mod=nn.ModuleDict(self.gen_layers)

    def forward(self, x_input):
        """Return the product over columns of the per-column sub-network outputs.

        Args:
            x_input: 2-D tensor; column ``k`` feeds sub-network ``k``.

        Returns:
            Tensor of shape ``(x_input.shape[0], 1)``.
        """
        n_layers=self.e_sig.shape[-1]
        for k in range(0,self.E_sig[0]):
            z=x_input[:,k].view(x_input.shape[0],1)
            for l in range(1,n_layers):
                z=self.gen_layers_mod['('+str(k)+','+str(l)+')'](z)
            z=self.term_layers_mod[str(k)](z)
            if k==0:
                a=z
            else:
                a=torch.multiply(a,z)
        return a


test=Initial_Law_Model(np.array([[1,3,3],
                                 [1,3,3]]))


test.parameters

<bound method Module.parameters of Initial_Law_Model(
  (term_layers_mod): ModuleDict(
    (0): Mu_Terminal_Layer()
    (1): Mu_Terminal_Layer()
  )
  (gen_layers_mod): ModuleDict(
    ((0,1)): Mu_Generic_Layer()
    ((0,2)): Mu_Generic_Layer()
    ((1,1)): Mu_Generic_Layer()
    ((1,2)): Mu_Generic_Layer()
  )
)>


test=Initial_Law_Model(np.array([[1,2,3]]))


test.parameters

<bound method Module.parameters of Initial_Law_Model(
  (term_layers_mod): ModuleDict(
    (0): Mu_Terminal_Layer()
  )
  (gen_layers_mod): ModuleDict(
    ((0,1)): Mu_Generic_Layer()
    ((0,2)): Mu_Generic_Layer()
  )
)>


def get_jacobian(output,x_input, batch_size, input_dim, output_dim):
    """Return the flattened batch jacobian of ``output`` with respect to ``x_input``.

    For every output column ``i`` the gradient of ``output[:, i]`` summed over
    the batch is taken with respect to ``x_input``.  This equals the
    per-sample jacobian only when each output row depends solely on the
    matching input row.

    Args:
        output: tensor of shape ``(batch_size, output_dim)`` computed from ``x_input``.
        x_input: tensor with ``batch_size * input_dim`` elements and ``requires_grad=True``.
        batch_size: number of rows.
        input_dim: number of input features per row.
        output_dim: number of output features per row.

    Returns:
        Tensor of shape ``(batch_size, output_dim * input_dim)`` that stays
        attached to the autograd graph (``create_graph=True``), so it can be
        used inside a loss.
    """
    # Allocate in the dtypes of the tensors involved instead of the global
    # default dtype, so float64 gradients are not silently truncated.
    jacobian=torch.zeros(batch_size,output_dim,input_dim,
                         dtype=x_input.dtype,device=x_input.device)
    for i in range(output_dim):
        # One-hot selector for output column i, broadcast over the batch.
        grad_out=torch.zeros(batch_size,output_dim,
                             dtype=output.dtype,device=output.device)
        grad_out[:,i]=1
        grad_in=torch.autograd.grad(output,x_input,grad_out,create_graph=True)[0]
        jacobian[:,i,:]=grad_in.reshape(batch_size,input_dim)
    return jacobian.view(batch_size,-1)


# Sanity check: the derivative of x**2 is 2*x, so x=1 and x=-3 should give 2 and -6.
x_test=torch.tensor([1.0,-3.0],requires_grad=True,dtype=torch.float64).view(2,1)
get_jacobian(torch.pow(x_test,2),x_test,2,1,1)

tensor([[ 2.],
        [-6.]], grad_fn=<ViewBackward0>)


# Same check with a BatchNorm1d (no affine parameters) in front of the square.
# NOTE(review): a freshly built BatchNorm1d presumably runs in training mode and
# normalises with batch statistics, which couples the rows -- so the result is
# no longer the plain per-sample 2*x.
x_test=torch.tensor([1.0,-3.0],requires_grad=True,dtype=torch.float64).view(2,1)
get_jacobian(torch.pow(nn.BatchNorm1d(1,affine=False)(x_test),2),x_test,2,1,1)

tensor([[ 2.5000e-06],
        [-2.5000e-06]], grad_fn=<ViewBackward0>)


test=Initial_Law_Model(np.array([[1,3,3],
                                 [1,3,3]]))


x_test=torch.tensor([[-1.0,1.0],[-2,1.0],[-30.0,1.0]],requires_grad=True,dtype=torch.float64).view(3,2)


get_jacobian(test(x_test),x_test,3,2,1)

tensor([[8.5977e-14, 1.0145e-13],
        [5.2027e-13, 1.0145e-13],
        [2.9796e-10, 1.0145e-13]], grad_fn=<ViewBackward0>)


torch.prod(get_jacobian(test(x_test),x_test,3,2,1),dim=1).view(x_test.shape[0],1)

tensor([[8.7227e-27],
        [5.2783e-26],
        [3.0229e-23]], grad_fn=<ViewBackward0>)


def custom_loss(outputs,inputs,batch_size,input_dim,output_dim):
    """Negative mean log of the per-row product of jacobian entries.

    Args:
        outputs: model output computed from ``inputs``.
        inputs: input tensor the jacobian is taken with respect to.
        batch_size, input_dim, output_dim: forwarded to ``get_jacobian``.

    Returns:
        Scalar tensor ``-mean(log(prod_j J[:, j] + 1e-10))``.
    """
    ep=1e-10 # small offset that keeps the logarithm finite when the product is 0
    flat_jacobian=get_jacobian(outputs,inputs,batch_size,input_dim,output_dim)
    row_product=flat_jacobian.prod(dim=1).view(batch_size,1)
    return -torch.log(row_product+ep).mean()


test=Initial_Law_Model(np.array([[1,3,3],
                                 [1,3,3]]))


x_test=torch.tensor([[-1.0,1.0],[-2,1.0],[-30.0,1.0]],requires_grad=True,dtype=torch.float64).view(3,2)


custom_loss(test(x_test),x_test,3,2,1)

tensor(23.0259, grad_fn=<NegBackward0>)


def train_network(t_model,t_optimizer,X_train,num_epochs):
    """Run full-batch training on ``custom_loss`` and return the loss history.

    Args:
        t_model: model called as ``t_model(X_train)``.
        t_optimizer: optimizer stepping the model parameters.
        X_train: 2-D input tensor used as the whole batch in every epoch.
        num_epochs: number of optimisation steps.

    Returns:
        List with the loss value recorded before each optimizer step.
    """
    history=[]
    for step in range(1,num_epochs+1):
        prediction=t_model(X_train)
        loss=custom_loss(prediction,X_train,X_train.shape[0],X_train.shape[1],1)
        history.append(loss.item())
        # standard update: clear old gradients, backpropagate, step
        t_optimizer.zero_grad()
        loss.backward()
        t_optimizer.step()
        # report every tenth epoch
        if step%10==0:
            print(f"Epoch {step}/{num_epochs}, Train Loss: {loss.item()}")
    return history


sample_size=100000
samples=np.random.randn(sample_size)


samples

array([ 1.94492206,  1.38750203,  0.42946165, ..., -0.05372974,
        1.53818192,  0.03825953])


x_train=torch.tensor(samples,requires_grad=True,dtype=torch.float64).view(sample_size,1)


x_train

tensor([[ 1.9449],
        [ 1.3875],
        [ 0.4295],
        ...,
        [-0.0537],
        [ 1.5382],
        [ 0.0383]], grad_fn=<ViewBackward0>)


mu=Initial_Law_Model(np.array([[1,25,25,25,5]]))


learning_rate=0.1


optimizer=torch.optim.Adam(mu.parameters(),lr=learning_rate)


custom_loss(mu(x_train),x_train,x_train.shape[0],1,1)

tensor(23.0259, grad_fn=<NegBackward0>)


losses=train_network(mu,optimizer,x_train,num_epochs=100)

Epoch 10/100, Train Loss: 11.202314769542236
Epoch 20/100, Train Loss: 1.8207838086009172
Epoch 30/100, Train Loss: 2.3159801610148074
Epoch 40/100, Train Loss: 1.681825965946245
Epoch 50/100, Train Loss: 1.5801160721452212
Epoch 60/100, Train Loss: 1.4957154036667657
Epoch 70/100, Train Loss: 1.4505578598611697
Epoch 80/100, Train Loss: 1.4323952657759063
Epoch 90/100, Train Loss: 1.4242153984098975
Epoch 100/100, Train Loss: 1.4209325720490114


# Plot the per-epoch loss recorded while training the initial-law model.
plt.plot(losses)
# legend() takes a sequence of labels; a bare string would be iterated
# character by character and the entry would read just "L".
plt.legend(['Losses'])
plt.xlabel('Epochs')
plt.ylabel('Cross Entropy')
plt.title('Training Results')
plt.show()


# Compare the trained model output with the empirical CDF of the samples.
l=1
r=1
mesh_size=10000
# ndarray.min()/max() avoid iterating the sample array element by element in Python.
x_viz=np.linspace(samples.min()-l,samples.max()+r,mesh_size)
# No gradients are needed for plotting, so evaluate the model without building a graph.
with torch.no_grad():
    y_viz=mu(torch.tensor(x_viz,dtype=torch.float64).view(x_viz.shape[0],1)).view(x_viz.shape[0])
y_viz=y_viz.numpy()
y_true,x_true=np.histogram(samples,bins=np.linspace(samples.min()-l,samples.max()+r,mesh_size+1))
y_true=y_true/y_true.sum()
# Exclusive cumulative sum: y_tot[t] is the mass of all bins before bin t
# (the same values as summing y_true[0:t] for every t, in linear time).
y_tot=np.concatenate(([0.0],np.cumsum(y_true[:-1])))
plt.plot(x_viz,y_viz,x_viz,y_tot)
plt.legend(['Model CDF','Sample CDF'])
plt.show()


# Compare the derivative of the trained model with a histogram density of the samples.
l=1
r=1
mesh_size=1000
x_viz=np.linspace(samples.min()-l,samples.max()+r,mesh_size)
x_tmp=torch.tensor(x_viz,requires_grad=True,dtype=torch.float64).view(x_viz.shape[0],1)
y_viz=mu(x_tmp)
# The model density is the derivative of the model output with respect to its input.
y_viz=get_jacobian(y_viz,
                   x_tmp,
                   x_viz.shape[0],1,1).view(x_viz.shape[0]).detach().numpy()
# density=True normalises by the actual bin width (the spacing of the mesh_size+1
# edges), which differs slightly from the spacing of the mesh_size points in x_viz.
y_true,x_true=np.histogram(samples,
                           bins=np.linspace(samples.min()-l,samples.max()+r,mesh_size+1),
                           density=True)
# Draw the histogram density at the bin centres it belongs to.
plt.plot(x_viz,y_viz,0.5*(x_true[:-1]+x_true[1:]),y_true)
plt.legend(['Model PDF','Sample PDF'])

<matplotlib.legend.Legend at 0x7efe6411ec40>


class G_Generic_Layer(nn.Module):
    """Hidden kernel layer: positive weights on the first ``e_in`` input columns,
    unconstrained weights on the remaining columns, cubic activation.

    Args:
        n_in: total number of input features.
        e_in: number of leading input columns that receive exponentiated
            (positive) weights; assumed to satisfy ``0 <= e_in <= n_in``.
        n_out: total number of output features.
        e_out: stored on the instance; not used by this layer's computation.
    """
    def __init__(self,n_in,e_in,n_out,e_out):
        super().__init__()
        self.n_in,self.n_out=n_in,n_out #total size of matrix
        self.e_in=e_in #dimension of t component input
        self.e_out=e_out #dimension of t component output
        self.t_weights=nn.Parameter(torch.zeros((n_out,n_in),dtype=torch.float64))
        self.x_weights=nn.Parameter(torch.zeros((n_out,n_in),dtype=torch.float64))
        self.bias=nn.Parameter(torch.zeros(n_out,dtype=torch.float64))
        lim=0.01
        nn.init.uniform_(self.t_weights,-5,-4) #raw t weights in [-5,-4], i.e. exp(.) in [e^(-5), e^(-4)]
        nn.init.uniform_(self.bias,-lim,lim) #init bias between -lim and lim
        nn.init.uniform_(self.x_weights,-lim,lim) #init x component weights between -lim and lim

        #mask selecting the first e_in input columns (all output rows)
        mask_pp=torch.zeros((n_out,n_in),dtype=torch.float64)
        mask_pp[:,:e_in]=1
        #mask selecting the remaining input columns (all output rows)
        mask_x=torch.zeros((n_out,n_in),dtype=torch.float64)
        mask_x[:,e_in:]=1
        # Buffers follow the module through .to()/.double()/.cuda(); they are
        # non-persistent so the state_dict keys stay exactly the three parameters.
        self.register_buffer('mask_pp',mask_pp,persistent=False)
        self.register_buffer('mask_x',mask_x,persistent=False)

    def forward(self,a_prev):
        """Return ``(a_prev @ W + bias)**3`` for a 2-D ``a_prev``.

        NOTE: the exponential is applied after masking, so in the columns where
        ``mask_pp`` is 0 it evaluates to exp(0)=1; the effective weight there
        is ``1 + x_weights`` rather than ``x_weights`` alone.
        """
        z=a_prev
        W=(self.mask_pp*self.t_weights).exp().t()+(self.mask_x*self.x_weights).t()
        z=torch.mm(z,W)
        z=torch.add(z,self.bias)
        a=z**3
        return a


k_test=G_Generic_Layer(3,2,4,3)


for x in k_test.parameters():
    print(x)

Parameter containing:
tensor([[-4.0859, -4.3800, -4.3141],
        [-4.9817, -4.4116, -4.0314],
        [-4.1528, -4.6637, -4.6550],
        [-4.7219, -4.0361, -4.8158]], requires_grad=True)
Parameter containing:
tensor([[ 0.0007,  0.0034,  0.0059],
        [ 0.0076, -0.0026,  0.0019],
        [-0.0078, -0.0043, -0.0099],
        [-0.0030,  0.0032, -0.0062]], requires_grad=True)
Parameter containing:
tensor([ 0.0017, -0.0097, -0.0037, -0.0009], requires_grad=True)


class G_Terminal_Layer(nn.Module):
    """Output kernel layer: positive weights on the first ``e_in`` input columns,
    unconstrained weights on the remaining columns, sigmoid activation.

    Args:
        n_in: total number of input features.
        e_in: number of leading input columns that receive exponentiated
            (positive) weights; assumed to satisfy ``0 <= e_in <= n_in``.
        n_out: total number of output features.
        e_out: stored on the instance; not used by this layer's computation.
    """
    def __init__(self,n_in,e_in,n_out,e_out):
        super().__init__()
        self.n_in,self.n_out=n_in,n_out #total size of matrix
        self.e_in=e_in #dimension of t component input
        self.e_out=e_out #dimension of t component output
        self.t_weights=nn.Parameter(torch.zeros((n_out,n_in),dtype=torch.float64))
        self.x_weights=nn.Parameter(torch.zeros((n_out,n_in),dtype=torch.float64))
        self.bias=nn.Parameter(torch.zeros(n_out,dtype=torch.float64))
        lim=0.01
        nn.init.uniform_(self.t_weights,-5,-4) #raw t weights in [-5,-4], i.e. exp(.) in [e^(-5), e^(-4)]
        nn.init.uniform_(self.bias,-lim,lim) #init bias between -lim and lim
        nn.init.uniform_(self.x_weights,-lim,lim) #init x component weights between -lim and lim

        #mask selecting the first e_in input columns (all output rows)
        mask_pp=torch.zeros((n_out,n_in),dtype=torch.float64)
        mask_pp[:,:e_in]=1
        #mask selecting the remaining input columns (all output rows)
        mask_x=torch.zeros((n_out,n_in),dtype=torch.float64)
        mask_x[:,e_in:]=1
        # Buffers follow the module through .to()/.double()/.cuda(); they are
        # non-persistent so the state_dict keys stay exactly the three parameters.
        self.register_buffer('mask_pp',mask_pp,persistent=False)
        self.register_buffer('mask_x',mask_x,persistent=False)

    def forward(self,a_prev):
        """Return ``sigmoid(a_prev @ W + bias)`` for a 2-D ``a_prev``.

        NOTE: the exponential is applied after masking, so in the columns where
        ``mask_pp`` is 0 it evaluates to exp(0)=1; the effective weight there
        is ``1 + x_weights`` rather than ``x_weights`` alone.
        """
        z=a_prev
        W=(self.mask_pp*self.t_weights).exp().t()+(self.mask_x*self.x_weights).t()
        z=torch.mm(z,W)
        z=torch.add(z,self.bias)
        a=torch.sigmoid(z) #a=h(z)
        return a


k_test=G_Terminal_Layer(2,1,1,1)


for x in k_test.parameters():
    print(x)

Parameter containing:
tensor([[-4.9080, -4.8684]], requires_grad=True)
Parameter containing:
tensor([[-0.0042,  0.0067]], requires_grad=True)
Parameter containing:
tensor([0.0069], requires_grad=True)


class G_Model(nn.Module):
    """Product of per-column kernel sub-networks built from ``G_Generic_Layer``
    and ``G_Terminal_Layer``.

    Row ``k`` of ``e_sig`` lists the layer widths for sub-network ``k``.  Each
    sub-network receives input column ``k`` concatenated with the trailing
    input columns starting at index ``E_sig[0]``; the model output is the
    product of the sub-network outputs.

    Args:
        e_sig: 2-D array-like of layer widths (a numpy array or nested
            lists).  The number of sub-networks is taken from the sum of the
            first column -- this presumably assumes every row starts with
            width 1; confirm before using other layouts.
    """
    def __init__(self,e_sig):
        super(G_Model, self).__init__()
        # Always work from the converted array so nested lists are accepted too.
        self.e_sig=np.array(e_sig)
        # Column sums of the width table.
        E_sig=[int(np.sum(self.e_sig[:,i])) for i in range(self.e_sig.shape[-1])]
        self.gen_layers=[]
        self.term_layers=[]
        self.E_sig=E_sig
        for k in range(0,E_sig[0]):
            # Plain Python ints keep the layer sizes independent of numpy scalar types.
            layer_list=[int(width) for width in self.e_sig[k,:]]
            for l in range(1,len(layer_list)):
                # Every layer, including the first, uses the same sizing rule:
                # (column sum + own width) features, of which the first
                # "own width" columns get positive weights.
                self.gen_layers.append(['('+str(k)+','+str(l)+')',
                                        G_Generic_Layer(E_sig[l-1]+layer_list[l-1],
                                                        layer_list[l-1],
                                                        E_sig[l]+layer_list[l],
                                                        layer_list[l])])
            self.term_layers.append([str(k),G_Terminal_Layer(E_sig[-1]+layer_list[-1],
                                                             layer_list[-1],
                                                             1,
                                                             1)])
        # ModuleDicts register the layers so their parameters are visible to optimizers.
        self.term_layers_mod=nn.ModuleDict(self.term_layers)
        self.gen_layers_mod=nn.ModuleDict(self.gen_layers)

    def forward(self, x_input):
        """Return the product over ``k`` of the sub-network outputs.

        Args:
            x_input: 2-D tensor with ``2 * E_sig[0]`` columns (the ``view``
                below requires exactly ``E_sig[0]`` trailing columns).

        Returns:
            Tensor of shape ``(x_input.shape[0], 1)``.
        """
        n_rows=x_input.shape[0]
        n_layers=self.e_sig.shape[-1]
        for k in range(0,self.E_sig[0]):
            # Column k followed by the trailing block of columns.
            z=torch.cat([x_input[:,k].view(n_rows,1),
                         x_input[:,self.E_sig[0]:].view(n_rows,self.E_sig[0])],dim=1)
            for l in range(1,n_layers):
                z=self.gen_layers_mod['('+str(k)+','+str(l)+')'](z)
            z=self.term_layers_mod[str(k)](z)
            if k==0:
                a=z
            else:
                a=torch.multiply(a,z)
        return a


e=np.array([[1,2,2,2],
           [1,2,3,2],
           [1,3,3,2]])


k_test=G_Model(e)


k_test.parameters

<bound method Module.parameters of G_Model(
  (term_layers_mod): ModuleDict(
    (0): G_Terminal_Layer()
    (1): G_Terminal_Layer()
    (2): G_Terminal_Layer()
  )
  (gen_layers_mod): ModuleDict(
    ((0,1)): G_Generic_Layer()
    ((0,2)): G_Generic_Layer()
    ((0,3)): G_Generic_Layer()
    ((1,1)): G_Generic_Layer()
    ((1,2)): G_Generic_Layer()
    ((1,3)): G_Generic_Layer()
    ((2,1)): G_Generic_Layer()
    ((2,2)): G_Generic_Layer()
    ((2,3)): G_Generic_Layer()
  )
)>


x_test=torch.tensor(0.01*np.random.randn(3,6),requires_grad=True,dtype=torch.float64).view(3,6)


k_test(x_test)

tensor([[0.1253],
        [0.1253],
        [0.1253]], grad_fn=<MulBackward0>)


get_jacobian(k_test(x_test),x_test,3,6,1)

tensor([[2.0477e-12, 9.2511e-13, 1.5907e-12, 3.7162e-10, 3.7161e-10, 3.7260e-10],
        [3.8413e-13, 2.4806e-13, 3.8043e-13, 9.3067e-11, 9.3212e-11, 9.3195e-11],
        [3.4923e-13, 1.4858e-13, 2.7568e-13, 6.6208e-11, 6.6268e-11, 6.6391e-11]],
       grad_fn=<ViewBackward0>)


torch.prod(get_jacobian(k_test(x_test),x_test,3,6,1)[:,0:e[:,0].sum()],axis=1).view(3,1)

tensor([[3.0134e-36],
        [3.6250e-38],
        [1.4304e-38]], grad_fn=<ViewBackward0>)


def k_custom_loss(outputs,inputs,batch_size,input_dim,output_dim,e_sig,mu_model):
    """Negative mean log of (kernel jacobian product) * (``mu_model`` jacobian product).

    Args:
        outputs: kernel model output computed from ``inputs``.
        inputs: 2-D input tensor; the first ``e_sig[:,0].sum()`` columns are
            the ones the kernel jacobian is kept for, the remaining columns
            are fed to ``mu_model``.
        batch_size, input_dim, output_dim: forwarded to ``get_jacobian``.
        e_sig: 2-D numpy array of layer widths.
        mu_model: model evaluated on the trailing input columns.

    Returns:
        Scalar tensor ``-mean(log(mu_term * kernel_term + 1e-10))``.
    """
    ep=1e-10 # small offset that keeps the logarithm finite when the product is 0
    n_leading=e_sig[:,0].sum()
    kernel_jac=get_jacobian(outputs,inputs,batch_size,input_dim,output_dim)[:,:n_leading]
    kernel_term=kernel_jac.prod(dim=1).view(batch_size,1)
    trailing=inputs[:,n_leading:]
    law_jac=get_jacobian(mu_model(trailing),trailing,batch_size,trailing.shape[1],output_dim)
    law_term=law_jac.prod(dim=1).view(batch_size,1)
    return -torch.log(law_term*kernel_term+ep).mean()


mu_test=Initial_Law_Model(e)


k_custom_loss(k_test(x_test),x_test,3,6,1,e,mu_test)

tensor(23.0259, grad_fn=<NegBackward0>)


def k_train_network(t_model,t_optimizer,X_train,num_epochs,e_sig,mu_model):
    """Run full-batch training on ``k_custom_loss`` and return the loss history.

    Args:
        t_model: kernel model called as ``t_model(X_train)``.
        t_optimizer: optimizer stepping the kernel model parameters.
        X_train: 2-D input tensor used as the whole batch in every epoch.
        num_epochs: number of optimisation steps.
        e_sig: layer-width table forwarded to ``k_custom_loss``.
        mu_model: model forwarded to ``k_custom_loss``.

    Returns:
        List with the loss value recorded before each optimizer step.
    """
    history=[]
    for step in range(1,num_epochs+1):
        prediction=t_model(X_train)
        loss=k_custom_loss(prediction,X_train,X_train.shape[0],X_train.shape[1],1,e_sig,mu_model)
        history.append(loss.item())
        # standard update: clear old gradients, backpropagate, step
        t_optimizer.zero_grad()
        loss.backward()
        t_optimizer.step()
        # report every tenth epoch
        if step%10==0:
            print(f"Epoch {step}/{num_epochs}, Train Loss: {loss.item()}")
    return history


e=np.array([[1,25,25,25,5]])


k_samples=np.random.randn(sample_size)+samples


k_samples.reshape(sample_size,1)

array([[ 2.72989493],
       [ 2.37269062],
       [ 1.52150286],
       ...,
       [ 2.28236553],
       [ 0.87083153],
       [-0.41948233]])


sample_pairs=np.concatenate([k_samples.reshape(k_samples.shape[0],1),samples.reshape(samples.shape[0],1)],axis=1)


sample_pairs.shape

(100000, 2)


x_train=torch.tensor(sample_pairs,requires_grad=True,dtype=torch.float64)


k_test=G_Model(e)


k_custom_loss(k_test(x_train),x_train,sample_size,2,1,e,mu)

tensor(22.3114, grad_fn=<NegBackward0>)


k_test(x_train).mean()

tensor(0.5008, grad_fn=<MeanBackward0>)


learning_rate=0.1


k_optimizer=torch.optim.Adam(k_test.parameters(),lr=learning_rate)


k_losses=k_train_network(k_test,k_optimizer,x_train,70,e,mu)

Epoch 10/70, Train Loss: 7.141359272492365
Epoch 20/70, Train Loss: 3.1783132339242184
Epoch 30/70, Train Loss: 3.0156816150553984
Epoch 40/70, Train Loss: 2.893138558198135
Epoch 50/70, Train Loss: nan
Epoch 60/70, Train Loss: 2.8472711566783513
Epoch 70/70, Train Loss: 2.8434874279532267


# Plot the per-epoch loss recorded while training the kernel model.
plt.plot(k_losses)
# legend() takes a sequence of labels; a bare string would be iterated
# character by character and the entry would read just "L".
plt.legend(['Losses'])
plt.xlabel('Epochs')
plt.ylabel('Cross Entropy')
plt.title('Training Results')
plt.show()


# Plot the kernel density along its first input column for three fixed values
# of the second input column.
l=1
r=1
mesh_size=1000
# grid for the first input column, as a column vector
y_viz=np.linspace(min(samples)-l,max(samples)+r,mesh_size).reshape(mesh_size,1)
# three fixed values for the second input column
x_viz=np.linspace(-1.5,1.5,3)
z_viz=[]
for x in x_viz:
    # pair every grid point with the constant value x
    tmp_in=np.concatenate([y_viz,x*np.ones((y_viz.shape[0],1))], axis=1)
    tmp_in=torch.tensor(tmp_in,requires_grad=True,dtype=torch.float64).view(y_viz.shape[0],2)
    tmp_z=k_test(tmp_in)
    z_tmp=get_jacobian(tmp_z,
                   tmp_in,
                   tmp_in.shape[0],2,1)
    # keep only the derivative with respect to the leading column(s)
    z_tmp=torch.prod(z_tmp[:,0:e[:,0].sum()],axis=1).detach().numpy()
    z_viz.append(z_tmp)
plt.plot(y_viz,z_viz[0],y_viz,z_viz[1],y_viz,z_viz[2])
plt.legend(['x='+str(x_viz[0]),'x='+str(x_viz[1]),'x='+str(x_viz[2])])

<matplotlib.legend.Legend at 0x7efe640e3c10>


# Surface plot of the learned kernel density over a 2-D grid.
l=1
r=1
mesh_size=100
x_viz=np.linspace(-2.5,2.5,mesh_size)
y_viz=np.linspace(-2.5,2.8,mesh_size)
X_viz,Y_viz=np.meshgrid(x_viz,y_viz)
# Column 0 (X_viz) is the variable the density is taken in, column 1 (Y_viz)
# is the value it is conditioned on -- the same column order as the training pairs.
tx_input=torch.tensor(np.concatenate([X_viz.reshape(mesh_size**2,1),Y_viz.reshape(mesh_size**2,1)],axis=1),
                      requires_grad=True,
                      dtype=torch.float64)
zs=torch.prod(get_jacobian(k_test(tx_input),tx_input,mesh_size**2,2,1)[:,0:e[:,0].sum()],axis=1)
Z_viz=zs.reshape(X_viz.shape).detach().numpy()
fig = plt.figure()
ax = fig.add_subplot(111, projection='3d')
ax.plot_surface(Y_viz, X_viz, Z_viz)

# The first plot axis carries Y_viz (the conditioning value x_0) and the second
# carries X_viz (x_1), so the labels follow that order.
ax.set_xlabel('x_0')
ax.set_ylabel('x_1')
ax.set_zlabel('k(x_1 | x_0)')

ax.view_init(30, 20)

plt.show()


x_0=np.random.randn(1,1)
x_1=np.random.randn(1,1)+x_0
x_2=np.random.randn(1,1)+x_1
x_3=np.random.randn(1,1)+x_2


(x_0,x_1,x_2,x_3)

(array([[-2.24303546]]),
 array([[-2.17420876]]),
 array([[-1.91315694]]),
 array([[-3.06965352]]))


1.0-k_test(torch.tensor(np.array([[x_3,x_3]]),dtype=torch.float64)).item()

0.48967168349676227


# Numerically integrate t * k(t | x_3) over [a, b]: the mean of the learned
# conditional density given x_3.
N=100000
a=-100
b=100
t_mesh=np.linspace(a,b,N).reshape(N,1)
x_mesh=x_3*np.ones((N,1))
input_mesh=torch.tensor(np.concatenate([t_mesh,x_mesh],axis=1),dtype=torch.float64,requires_grad=True)
zs=torch.prod(get_jacobian(k_test(input_mesh),input_mesh,N,2,1)[:,0:e[:,0].sum()],axis=1)
zs=zs.detach().numpy()
# Right-endpoint Riemann sum, vectorised instead of a 100k-iteration Python loop:
# sum_i (t_i - t_{i-1}) * density(t_i) * t_i for i = 1..N-1.
integral=np.sum(np.diff(t_mesh[:,0])*zs[1:]*t_mesh[1:,0])
print(integral)

-3.1069884781405674

x_3

array([[-3.06965352]])

Markov Kernel Learning

Terminal Layer

Generic Layer

Training a Kernel Function

Kernel Terminal Layer

Kernel Generic Layer

Kernel Loss Function

Application