Got most of the neural network stuff working. Some parameter updates to manage in NeuralNetworkSpecifications
parent
7b51044057
commit
d8fff40288
@ -0,0 +1,109 @@
|
||||
import torch
|
||||
import combined as c
|
||||
|
||||
"""
|
||||
This module holds the neural networks I am going to use to estimate
|
||||
the functions of interest.
|
||||
"""
|
||||
|
||||
class LaunchFnEstimand(torch.nn.Module):
    """
    Estimates the launch function.

    A small feed-forward network mapping a state tensor with
    ``state_tensor_size`` features to one launch value per constellation
    (``number_constellations`` outputs). The output passes through a final
    ReLU because launches are always non-negative.
    """

    def __init__(self, state_tensor_size, layers_size, number_constellations):
        """
        :param state_tensor_size: number of input state features
        :param layers_size: width of the hidden layers
        :param number_constellations: number of outputs (one launch per constellation)
        """
        super().__init__()
        self.number_constellations = number_constellations
        self.layers_size = layers_size
        self.state_tensor_size = state_tensor_size

        # Layers (attribute names kept stable so existing state_dicts still load;
        # ReLU has no parameters, so inserting it below changes nothing here)
        self.linear_1 = torch.nn.Linear(in_features=state_tensor_size, out_features=layers_size)
        self.relu = torch.nn.ReLU()
        self.linear_3 = torch.nn.Linear(in_features=layers_size, out_features=layers_size)
        self.linear_5 = torch.nn.Linear(in_features=layers_size, out_features=number_constellations)

    def forward(self, input_values):
        """
        :param input_values: state tensor of shape (..., state_tensor_size)
        :returns: non-negative launch estimates of shape (..., number_constellations)
        """
        intermediate_values = self.relu(input_values)  # states should be positive anyway.
        intermediate_values = self.linear_1(intermediate_values)
        # BUGFIX: consecutive Linear layers with no activation between them
        # collapse into a single affine map, so the extra depth added no
        # expressive power. Interleave ReLU between the hidden layers.
        intermediate_values = self.relu(intermediate_values)
        intermediate_values = self.linear_3(intermediate_values)
        intermediate_values = self.relu(intermediate_values)
        intermediate_values = self.linear_5(intermediate_values)
        intermediate_values = self.relu(intermediate_values)  # launches are always positive

        return intermediate_values
|
||||
|
||||
class PartialDerivativesEstimand(torch.nn.Module):
    """
    Estimates the partial derivatives of the value functions.

    Maps a batch of state vectors to a (batch, constellation, state) tensor
    of partial-derivative estimates: each constellation receives a copy of
    the state vector, which is then pushed through a small feed-forward
    stack and projected back to ``number_states`` features.
    """

    def __init__(self, batch_size, number_constellations, number_states, layer_size=12):
        """
        :param batch_size: retained for backward compatibility; the forward
            pass now infers the batch dimension, so any batch size works.
        :param number_constellations: constellation axis size of the output
        :param number_states: number of state variables (input feature size)
        :param layer_size: width of the intermediate hidden layers
        """
        super().__init__()
        self.batch_size = batch_size
        self.number_constellations = number_constellations
        self.number_states = number_states
        self.layer_size = layer_size

        # preprocess (single linear layer in case there is anything that needs to happen to all states)
        self.preprocess = torch.nn.Sequential(
            torch.nn.ReLU()  # cleanup as states must be positive
            ,torch.nn.Linear(in_features=self.number_states, out_features=self.number_states)
        )

        # Upscale from (batch, State) to (batch, constellation, state).
        # BUGFIX: the previous Upsample(...).view(...) approach (a) hard-coded
        # self.batch_size in the view, so any other batch size raised a shape
        # error, and (b) nearest-neighbour upsampling repeats each *element*
        # in place, so the reshape interleaved states across rows instead of
        # giving every constellation a copy of the full state vector (as the
        # comment above intends). reshape+expand replicates the state vector
        # per constellation without copying and works for any batch size.
        self.upsample = lambda x: x.reshape(-1, 1, self.number_states).expand(
            -1, self.number_constellations, -1
        )

        # sequential steps
        # BUGFIX: interleave ReLU — stacked Linear layers with no activation
        # in between are equivalent to a single affine map. ReLU carries no
        # parameters, so saved state_dicts remain loadable.
        self.sequential = torch.nn.Sequential(
            torch.nn.Linear(in_features=number_states, out_features=layer_size)
            #who knows if a convolution might help here.
            ,torch.nn.ReLU()
            ,torch.nn.Linear(in_features=layer_size, out_features=layer_size)
            ,torch.nn.ReLU()
            ,torch.nn.Linear(in_features=layer_size, out_features=layer_size)
        )

        # reduce the feature axis to match expected results
        self.feature_reduction = torch.nn.Linear(in_features=layer_size, out_features=number_states)

    def forward(self, input_values):
        """
        :param input_values: the state variables — any tensor whose trailing
            dimension is ``number_states`` (leading dimensions are flattened
            into the batch axis)
        :returns: tensor of shape (batch, number_constellations, number_states)
        """
        # preprocess
        intermediate = self.preprocess(input_values)

        # replicate the state vector once per constellation
        intermediate = self.upsample(intermediate)

        # intermediate processing
        intermediate = self.sequential(intermediate)

        # reduce feature axis to match the expected number of partials
        intermediate = self.feature_reduction(intermediate)

        return intermediate
|
||||
|
||||
class EstimandNN(torch.nn.Module):
    """
    This neural network takes the current states as input values and returns both
    the partial derivatives of the value function and the launch function.
    """

    def __init__(self, state_tensor_size, layers_size, number_constellations):
        """
        :param state_tensor_size: number of input state features
        :param layers_size: hidden-layer width forwarded to the sub-estimators
        :param number_constellations: number of constellations being modelled
        """
        super().__init__()

        # Two independent sub-networks sharing the same state input:
        # one single linear section per estimand.
        # TODO: verify these are correct.
        # NOTE(review): PartialDerivativesEstimand's signature is
        # (batch_size, number_constellations, number_states, layer_size=...),
        # so the positional arguments below look misordered — confirm intent.
        self.partials_estimator = PartialDerivativesEstimand(state_tensor_size, layers_size, number_constellations)
        self.launch_estimator = LaunchFnEstimand(state_tensor_size, layers_size, number_constellations)

    def forward(self, input_values):
        """
        :param input_values: current state tensor fed to both estimators
        :returns: c.EstimandInterface bundling (partials, launch)
        """
        # Removed dead `pass` statements that preceded the real bodies of
        # both __init__ and forward in the original.
        partials = self.partials_estimator(input_values)
        launch = self.launch_estimator(input_values)

        return c.EstimandInterface(partials, launch)
|
||||
@ -0,0 +1,203 @@
|
||||
{
|
||||
"cells": [
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 1,
|
||||
"id": "least-cooling",
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"import torch"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "markdown",
|
||||
"id": "statistical-temperature",
|
||||
"metadata": {},
|
||||
"source": [
|
||||
"The purpose of this notebook is to allow me to investigate proper shaping of inputs.\n",
|
||||
"\n",
|
||||
"Typically pytorch chooses a tensor specification\n",
|
||||
"$$\n",
|
||||
"(N, .*)\n",
|
||||
"$$\n",
|
||||
"where $N$ is the batch size.\n",
|
||||
"For example a Convolutional NN layer expects\n",
|
||||
"$$\n",
|
||||
" NCHW\n",
|
||||
"$$\n",
|
||||
"for BatchSize,ChannelSize,Height,Width.\n",
|
||||
"On the other hand, Linear expects\n",
|
||||
"$$\n",
|
||||
" N.*H\n",
|
||||
"$$\n",
|
||||
"for BatchSize,any number of other dimensions, in_features\n",
|
||||
"\n"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 15,
|
||||
"id": "japanese-poultry",
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"class PartialDerivativesEstimand(torch.nn.Module):\n",
|
||||
" def __init__(self,batch_size, number_constellations, number_states,scale_factor=4, layer_size=12):\n",
|
||||
" \"\"\"\n",
|
||||
" \n",
|
||||
" \"\"\"\n",
|
||||
" super().__init__()\n",
|
||||
" self.batch_size = batch_size\n",
|
||||
" self.number_constellations = number_constellations\n",
|
||||
" self.number_states = number_states\n",
|
||||
" self.scale_factor = scale_factor\n",
|
||||
" self.layer_size = layer_size\n",
|
||||
" \n",
|
||||
" \n",
|
||||
" #preprocess (single linear layer in case there is anything that needs to happen to all states)\n",
|
||||
" self.preprocess = torch.nn.Sequential(\n",
|
||||
" torch.nn.ReLU() #cleanup as states must be positive\n",
|
||||
" ,torch.nn.Linear(in_features = self.number_states, out_features=self.number_states)\n",
|
||||
" )\n",
|
||||
" #upscale to get the basic dimensionality correct. From (batch,State) to (batch, constellation, state). Includes a reshape\n",
|
||||
" self.upsample = lambda x: torch.nn.Upsample(scale_factor=self.number_constellations)(x).view(self.batch_size\n",
|
||||
" ,self.number_constellations\n",
|
||||
" ,self.number_states)\n",
|
||||
" \n",
|
||||
" #sequential steps\n",
|
||||
" self.sequential = torch.nn.Sequential(\n",
|
||||
" torch.nn.Linear(in_features=number_states, out_features=layer_size)\n",
|
||||
" #who knows if a convolution might help here.\n",
|
||||
" ,torch.nn.Linear(in_features=layer_size, out_features=layer_size)\n",
|
||||
" ,torch.nn.Linear(in_features=layer_size, out_features=layer_size)\n",
|
||||
" )\n",
|
||||
"\n",
|
||||
" #reduce axis to match expectation\n",
|
||||
" self.feature_reduction = torch.nn.Linear(in_features=layer_size, out_features=number_states)\n",
|
||||
" \n",
|
||||
" def forward(self, input_values):\n",
|
||||
" #Note that the input values are just going to be the state variables\n",
|
||||
" #TODO:check that input values match the prepared dimension?\n",
|
||||
" \n",
|
||||
" #preprocess\n",
|
||||
" intermediate = self.preprocess(input_values)\n",
|
||||
" \n",
|
||||
" #upscale the input values\n",
|
||||
" intermediate = self.upsample(intermediate)\n",
|
||||
" \n",
|
||||
" #intermediate processing\n",
|
||||
" intermediate = self.sequential(intermediate)\n",
|
||||
" \n",
|
||||
" #reduce feature axis to match the expected number of partials\n",
|
||||
" intermediate = self.feature_reduction(intermediate)\n",
|
||||
" \n",
|
||||
" \n",
|
||||
" return intermediate"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 19,
|
||||
"id": "communist-teach",
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"batch_size = 2\n",
|
||||
"constellations = 2\n",
|
||||
"number_states = constellations+1\n",
|
||||
"\n",
|
||||
"#initialize the NN\n",
|
||||
"a = PartialDerivativesEstimand(batch_size,constellations,number_states,scale_factor=2)\n",
|
||||
"\n",
|
||||
"#example state\n",
|
||||
"s = torch.rand(size=(batch_size,1,number_states))"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 22,
|
||||
"id": "chemical-revolution",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"data": {
|
||||
"text/plain": [
|
||||
"tensor([[[0.9283, 0.9414, 0.3426]],\n",
|
||||
"\n",
|
||||
" [[0.1902, 0.0369, 0.4699]]])"
|
||||
]
|
||||
},
|
||||
"execution_count": 22,
|
||||
"metadata": {},
|
||||
"output_type": "execute_result"
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"s"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 23,
|
||||
"id": "directed-lobby",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"data": {
|
||||
"text/plain": [
|
||||
"tensor([[[-0.1991, 0.1335, 0.2821],\n",
|
||||
" [-0.3549, 0.0213, 0.2322]],\n",
|
||||
"\n",
|
||||
" [[-0.1701, 0.1557, 0.2954],\n",
|
||||
" [-0.3017, 0.0690, 0.2419]]], grad_fn=<AddBackward0>)"
|
||||
]
|
||||
},
|
||||
"execution_count": 23,
|
||||
"metadata": {},
|
||||
"output_type": "execute_result"
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"a(s)"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": null,
|
||||
"id": "placed-coating",
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": []
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": null,
|
||||
"id": "advised-execution",
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": []
|
||||
}
|
||||
],
|
||||
"metadata": {
|
||||
"kernelspec": {
|
||||
"display_name": "Python 3",
|
||||
"language": "python",
|
||||
"name": "python3"
|
||||
},
|
||||
"language_info": {
|
||||
"codemirror_mode": {
|
||||
"name": "ipython",
|
||||
"version": 3
|
||||
},
|
||||
"file_extension": ".py",
|
||||
"mimetype": "text/x-python",
|
||||
"name": "python",
|
||||
"nbconvert_exporter": "python",
|
||||
"pygments_lexer": "ipython3",
|
||||
"version": "3.8.8"
|
||||
}
|
||||
},
|
||||
"nbformat": 4,
|
||||
"nbformat_minor": 5
|
||||
}
|
||||
Loading…
Reference in New Issue