began writing computational approach
parent
3ca5312fab
commit
226f344f02
@ -0,0 +1,242 @@
|
||||
{
|
||||
"cells": [
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 1,
|
||||
"id": "departmental-hardware",
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"import torch\n",
|
||||
"from torch.autograd.functional import jacobian"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 11,
|
||||
"id": "differential-shock",
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"a = torch.tensor([1,2,3,4.2],requires_grad=False)\n",
|
||||
"b = torch.tensor([2,2,2,2.0],requires_grad=True)"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 16,
|
||||
"id": "separated-pursuit",
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"def test(x,y):\n",
|
||||
" return (x@y)**2"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 17,
|
||||
"id": "french-trunk",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"data": {
|
||||
"text/plain": [
|
||||
"tensor(416.1600, grad_fn=<PowBackward0>)"
|
||||
]
|
||||
},
|
||||
"execution_count": 17,
|
||||
"metadata": {},
|
||||
"output_type": "execute_result"
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"test(a,b)"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 57,
|
||||
"id": "adverse-ceremony",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"data": {
|
||||
"text/plain": [
|
||||
"((tensor([81.6000, 81.6000, 81.6000, 81.6000]),\n",
|
||||
" tensor([ 40.8000, 81.6000, 122.4000, 171.3600])),\n",
|
||||
" tensor([2., 2., 2., 2.], requires_grad=True),\n",
|
||||
" tensor(416.1600, grad_fn=<PowBackward0>))"
|
||||
]
|
||||
},
|
||||
"execution_count": 57,
|
||||
"metadata": {},
|
||||
"output_type": "execute_result"
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"j = jacobian(test,(a,b))\n",
|
||||
"j,b,test(a,b)"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 58,
|
||||
"id": "lovely-apple",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"data": {
|
||||
"text/plain": [
|
||||
"((tensor([-12.8304, -3.9878, 4.8547, 15.4658]),\n",
|
||||
" tensor([-10.8365, -21.6729, -32.5094, -45.5132])),\n",
|
||||
" tensor([ 1.1840, 0.3680, -0.4480, -1.4272], grad_fn=<SubBackward0>),\n",
|
||||
" tensor(29.3573, grad_fn=<PowBackward0>))"
|
||||
]
|
||||
},
|
||||
"execution_count": 58,
|
||||
"metadata": {},
|
||||
"output_type": "execute_result"
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"b2 = b - j[1]*b*0.01\n",
|
||||
"j2 = jacobian(test,(a,b2))\n",
|
||||
"j2,b2,test(a,b2)"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 63,
|
||||
"id": "stretch-selection",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"data": {
|
||||
"text/plain": [
|
||||
"((tensor([-13.6581, -4.2906, 5.2787, 17.0284]),\n",
|
||||
" tensor([-11.4119, -22.8239, -34.2358, -47.9301])),\n",
|
||||
" tensor([ 1.1968, 0.3760, -0.4626, -1.4922], grad_fn=<SubBackward0>),\n",
|
||||
" tensor(32.5580, grad_fn=<PowBackward0>))"
|
||||
]
|
||||
},
|
||||
"execution_count": 63,
|
||||
"metadata": {},
|
||||
"output_type": "execute_result"
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"b3 = b2 - j2[1]*b2*0.001\n",
|
||||
"j3 = jacobian(test,(a,b3))\n",
|
||||
"j3,b3,test(a,b3)"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 64,
|
||||
"id": "colored-visit",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"data": {
|
||||
"text/plain": [
|
||||
"((tensor([-14.5816, -4.6324, 5.7628, 18.8361]),\n",
|
||||
" tensor([-12.0461, -24.0921, -36.1382, -50.5935])),\n",
|
||||
" tensor([ 1.2105, 0.3846, -0.4784, -1.5637], grad_fn=<SubBackward0>),\n",
|
||||
" tensor(36.2769, grad_fn=<PowBackward0>))"
|
||||
]
|
||||
},
|
||||
"execution_count": 64,
|
||||
"metadata": {},
|
||||
"output_type": "execute_result"
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"b4 = b3 - j3[1]*b3*0.001\n",
|
||||
"j4 = jacobian(test,(a,b4))\n",
|
||||
"j4,b4,test(a,b4)"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 65,
|
||||
"id": "familiar-pizza",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"data": {
|
||||
"text/plain": [
|
||||
"((tensor([-15.6173, -5.0205, 6.3191, 20.9424]),\n",
|
||||
" tensor([-12.7481, -25.4962, -38.2443, -53.5421])),\n",
|
||||
" tensor([ 1.2251, 0.3938, -0.4957, -1.6428], grad_fn=<SubBackward0>),\n",
|
||||
" tensor(40.6286, grad_fn=<PowBackward0>))"
|
||||
]
|
||||
},
|
||||
"execution_count": 65,
|
||||
"metadata": {},
|
||||
"output_type": "execute_result"
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"b5 = b4 - j4[1]*b4*0.001\n",
|
||||
"j5 = jacobian(test,(a,b5))\n",
|
||||
"j5,b5,test(a,b5)"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 66,
|
||||
"id": "brilliant-squad",
|
||||
"metadata": {},
|
||||
"outputs": [
|
||||
{
|
||||
"data": {
|
||||
"text/plain": [
|
||||
"((tensor([-15.6173, -5.0205, 6.3191, 20.9424]),\n",
|
||||
" tensor([-12.7481, -25.4962, -38.2443, -53.5421])),\n",
|
||||
" tensor([ 1.2407, 0.4039, -0.5146, -1.7307], grad_fn=<SubBackward0>),\n",
|
||||
" tensor(45.7605, grad_fn=<PowBackward0>))"
|
||||
]
|
||||
},
|
||||
"execution_count": 66,
|
||||
"metadata": {},
|
||||
"output_type": "execute_result"
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"b6 = b5 - j5[1]*b5*0.001\n",
|
||||
"j6 = jacobian(test,(a,b5))\n",
|
||||
"j6,b6,test(a,b6)"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": null,
|
||||
"id": "discrete-engineer",
|
||||
"metadata": {},
|
||||
"outputs": [],
|
||||
"source": []
|
||||
}
|
||||
],
|
||||
"metadata": {
|
||||
"kernelspec": {
|
||||
"display_name": "Python 3",
|
||||
"language": "python",
|
||||
"name": "python3"
|
||||
},
|
||||
"language_info": {
|
||||
"codemirror_mode": {
|
||||
"name": "ipython",
|
||||
"version": 3
|
||||
},
|
||||
"file_extension": ".py",
|
||||
"mimetype": "text/x-python",
|
||||
"name": "python",
|
||||
"nbconvert_exporter": "python",
|
||||
"pygments_lexer": "ipython3",
|
||||
"version": "3.8.8"
|
||||
}
|
||||
},
|
||||
"nbformat": 4,
|
||||
"nbformat_minor": 5
|
||||
}
|
||||
@ -0,0 +1,104 @@
|
||||
\documentclass[../Main.tex]{subfiles}
|
||||
\graphicspath{{\subfix{Assets/img/}}}
|
||||
|
||||
\begin{document}
|
||||
\subsection{Introduction to the Computational Approach}
|
||||
The computational approach I have decided to take is an application of
|
||||
\cite{MALIAR2018}, where the policy function is approximated using a
|
||||
neural network.
|
||||
|
||||
The approach uses the fact that the Euler equation implicitly defines the
|
||||
optimal policy function, for example:
|
||||
$0 = f(x(\theta),\theta)$.
|
||||
This can easily be turned into a mean square loss function by squaring both
|
||||
sides,
|
||||
$0 = f^2(x(\theta),\theta)$,
|
||||
allowing one to find $x(\cdot)$ as the solution to a minimization problem.
|
||||
|
||||
By choosing a neural network as the functional approximation, we are able to
|
||||
take advantage of the significant computational and practical improvements
|
||||
currently revolutionizing Machine Learning.
|
||||
In particular, we can now use common frameworks, such as python, PyTorch,
|
||||
and various online accelerators (e.g., Google Colab),
|
||||
which have been optimized for relatively high performance and
|
||||
straightforward development.
|
||||
|
||||
\subsection{Computational Plan}
|
||||
I have decided to use python and the PyTorch Neural Network library for this project.
|
||||
|
||||
The most difficult step is creating the Euler equations.
|
||||
When working with high dimensioned problems involving differentiation,
|
||||
three general computational approaches exist:
|
||||
\begin{itemize}
|
||||
\item Using a symbolic library (sympy) or language (mathematica) to create the
|
||||
Euler equations.
|
||||
This has the disadvantage of being (very) slow, but the advantage that
|
||||
for a single problem specification it only needs to be completed once.
|
||||
It requires taking a matrix inverse, which can easily complicate formulas,
|
||||
and is computationally expensive.
|
||||
\item Using numerical differentiation (ND).
|
||||
The primary issue with ND is that errors can grow quite quickly when
|
||||
performing algebra on numerical derivatives.
|
||||
This requires tracking how errors can grow and compound within your
|
||||
specific formulation of the problem.
|
||||
\item Using automatic differentiation (AD) to differentiate the computer code
|
||||
directly.
|
||||
This approach has a few major benefits.
|
||||
\begin{itemize}
|
||||
\item Precision is high, because you are calculating symbolic
|
||||
derivatives of your computer functions.
|
||||
\item ML is heavily dependent on AD, thus the tools are plentiful
|
||||
and tested.
|
||||
\item The coupling of AD and ML leads to a tight integration with
|
||||
the neural network libraries, simplifying the calibration procedure.
|
||||
\end{itemize}
|
||||
\end{itemize}
|
||||
I have chosen to use AD to generate an Euler equation function, which will
|
||||
then be the basis of our loss function.
|
||||
|
||||
|
||||
The first step is to construct the intertemporal transition functions
|
||||
(e.g \ref{put_refs_here}).
|
||||
%Not sure how much detail to use.
|
||||
%I'm debating on describing how it is done.
|
||||
These take derivatives of the value function at time $t$ as an input, and output
|
||||
derivatives of the value function at time $t+1$.
|
||||
Once this function has been finished, it can be combined with the laws of motion
|
||||
in an iterated manner to transition between times $t$ and times $t+k$.
|
||||
I did so by coding a function that iteratively composes the transition
|
||||
and laws of motion functions, returning a $k$-period transition function.
|
||||
|
||||
The second step is to generate functions that represent the optimality conditions.
|
||||
By taking the appropriate derivatives with respect to the laws of motion and
|
||||
utility functions, this can be constructed explicitly.
|
||||
|
||||
Once these two functions are completed, they can be combined to create
|
||||
the Euler equations, as described in appendix \ref{appx??}.
|
||||
|
||||
\subsection{Training}
|
||||
|
||||
With the Euler equation and resulting loss function in place,
|
||||
standard training approaches can be used to fit the function.
|
||||
I plan on using some variation on stochastic gradient descent.
|
||||
|
||||
Normally, neural networks are trained on real world data.
|
||||
As this is a synthetic model, I am planning on training it on random selections
|
||||
from the state space.
|
||||
If I can find data on how satellites are and have been distributed, I plan on
|
||||
selecting from that distribution.
|
||||
|
||||
\subsection{Extensions}
|
||||
One key question is how to handle the case of heterogeneous agents.
|
||||
I believe I can address this in the constellation operator's case
|
||||
by solving for the policy functions of each class of operator
|
||||
simultaneously.
|
||||
I still have some questions about this approach and have not dived into
|
||||
some of the mathematics that deeply.
|
||||
|
||||
|
||||
|
||||
\subsection{Existence concerns}
|
||||
%check matrix inverses etc.
|
||||
%
|
||||
|
||||
\end{document}
|
||||
Loading…
Reference in New Issue