DiffEqML
diff --git a/‎tutorials/model predictive control/02c_mpc_constraints_final.ipynb
Lines changed: 313 additions & 0 deletions b/‎tutorials/model predictive control/02c_mpc_constraints_final.ipynb
Lines changed: 313 additions & 0 deletions
@@ -0,0 +1,313 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import os\n",
+    "import sys\n",
+    "from warnings import warn\n",
+    "\n",
+    "import matplotlib.pyplot as plt\n",
+    "import torch\n",
+    "import torch.nn as nn\n",
+    "from torch.distributions import MultivariateNormal, Uniform\n",
+    "from torchdiffeq import odeint\n",
+    "\n",
+    "# `src` lives two directories above this notebook, so extend the path before importing it\n",
+    "sys.path.append(2*'../')\n",
+    "from src import *\n",
+    "\n",
+    "# device = torch.device('cuda:0')\n",
+    "device=torch.device('cpu')"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 1. CSTR model"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Input scaling:\n",
+      " tensor([1.0000, 1.0000, 0.0100, 0.0100])\n",
+      "Output scaling:\n",
+      " tensor([[ 5.0000e+00,  1.0000e+02],\n",
+      "        [-8.5000e+03,  0.0000e+00]])\n",
+      "Lower bounds:\n",
+      " [0.1, 0.1, 50.0, 50.0] \n",
+      "Upper bounds:\n",
+      " [2.0, 2.0, None, 140.0]\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Plant class used for both the nominal and the simulated system\n",
+    "# (ControlledCSTR is provided by the star-import of `src`)\n",
+    "System = ControlledCSTR\n",
+    "\n",
+    "##### Scaling since the parameters have very different values\n",
+    "scaling_T_R = 1/100\n",
+    "scaling_T_K = 1/100\n",
+    "scaling_Q_dot = 1/2000  # defined for reference; not used in this cell\n",
+    "scaling_F = 1/100  # defined for reference; not used in this cell\n",
+    "\n",
+    "# Scale the inputs appropriately for the controller:\n",
+    "# only entries 2 and 3 (the two temperatures) are rescaled\n",
+    "in_scal = torch.ones(4).to(device)\n",
+    "in_scal[2] = scaling_T_R\n",
+    "in_scal[3] = scaling_T_K\n",
+    "print('Input scaling:\\n', in_scal)\n",
+    "\n",
+    "# Output scaling handed to the controller\n",
+    "# NOTE(review): exact meaning of the 2x2 layout is defined by BoxConstrainedController -- confirm there\n",
+    "out_scal = torch.tensor([[5.,  100.],\n",
+    "                        [-8500, 0.]]).to(device)\n",
+    "print('Output scaling:\\n', out_scal)\n",
+    "\n",
+    "# State constraints, one entry per state\n",
+    "# (`None` presumably means that side is unconstrained -- confirm in TorchMPC)\n",
+    "lower_bounds = [0.1, 0.1, 50., 50.]\n",
+    "upper_bounds = [2., 2., None, 140.]\n",
+    "# Per-state penalty weights, kept on the same device as the scaling tensors;\n",
+    "# the last state is weighted far more heavily than the others\n",
+    "penalties = .01*torch.ones(4).to(device)\n",
+    "penalties[3] = 100\n",
+    "# Alternative from the original notebook: penalties = torch.zeros(4)\n",
+    "# (presumably switches the constraint penalties off)\n",
+    "print('Lower bounds:\\n', lower_bounds, '\\nUpper bounds:\\n', upper_bounds)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 2. Parameters for MPC simulation"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Seed the global RNG so the sampled initial conditions are reproducible\n",
+    "SEED = 0\n",
+    "torch.manual_seed(SEED)\n",
+    "\n",
+    "# Time constraints\n",
+    "Δt = 0.005\n",
+    "t0, tf = 0, 0.5\n",
+    "# round() rather than int(): a quotient such as 99.999... must not be truncated to 99\n",
+    "n_intervals = round((tf - t0)/Δt)\n",
+    "t_span = torch.linspace(t0, tf, n_intervals + 1).to(device) # define the t span\n",
+    "\n",
+    "# MPC simulation variables\n",
+    "steps_nom = 10 # Nominal steps to do between each MPC step\n",
+    "max_iters = 50 # upper bound on inner-loop optimizer iterations per MPC step\n",
+    "eps_accept = 1e-3 # tight acceptance threshold: in practice the inner loop always runs for max_iters iterations\n",
+    "lookahead_steps = 10\n",
+    "bs = 512 # number of initial conditions sampled below (batch size)\n",
+    "\n",
+    "# Desired final condition\n",
+    "C_b_star = 0.6\n",
+    "\n",
+    "# Initial Conditions\n",
+    "ε = .01 # initial states are sampled uniformly within ±1% of the nominal values\n",
+    "C_a_0 = 0.8 # This is the initial concentration inside the tank [mol/l]\n",
+    "C_b_0 = 0.5 # This is the controlled variable [mol/l]\n",
+    "T_R_0 = 134.14 #[C]\n",
+    "T_K_0 = 130.0 #[C]\n",
+    "init = torch.Tensor([C_a_0, C_b_0, T_R_0, T_K_0])\n",
+    "init_dist = Uniform((1-ε)*init, (1+ε)*init)\n",
+    "x0 = init_dist.sample((bs,)).to(device)\n",
+    "\n",
+    "# Controllers and systems\n",
+    "lr = .5e-3\n",
+    "# The learned controller is moved to `device` like its scaling tensors and like const_u;\n",
+    "# this happens before the optimizer is built so Adam tracks the on-device parameters\n",
+    "u = BoxConstrainedController(4, 2, input_scaling=in_scal, output_scaling=out_scal, constrained=True).to(device)\n",
+    "const_u = RandConstController([1, 1], -1, 1).to(device) # dummy constant controller for simulation\n",
+    "opt = torch.optim.Adam(u.parameters(), lr=lr) # optimizer\n",
+    "# Nominal model (fixed-step midpoint) used inside the MPC, and the simulated plant (dopri5)\n",
+    "system = System(u, solver='midpoint', retain_u=True)\n",
+    "real_system = System(const_u, solver='dopri5')"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 2b. Define cost function"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "loss = nn.MSELoss()\n",
+    "class PositioningCost(nn.Module):\n",
+    "    '''Terminal positioning cost on state component 1.\n",
+    "\n",
+    "    The cost is `Q` times the norm (square root of the sum of squares over\n",
+    "    all entries) of `traj[-1, ..., 1] - target`. The control input is not\n",
+    "    penalized: `R` and `P` are stored but not used by `forward`.\n",
+    "\n",
+    "    Args:\n",
+    "        target: torch.tensor (or scalar), target value for state component 1\n",
+    "        Q: float, state weight\n",
+    "        R: float, controller weight (stored, currently unused)\n",
+    "        P: float, terminal cost weight (stored, currently unused)\n",
+    "    '''\n",
+    "    def __init__(self, target, Q=1, R=0, P=0):\n",
+    "        super().__init__()\n",
+    "        # Registered as a buffer so that .to(device) on this module (or on a\n",
+    "        # parent module holding it) moves the target together with the model\n",
+    "        self.register_buffer('target', torch.as_tensor(target))\n",
+    "        self.Q, self.R, self.P = Q, R, P\n",
+    "\n",
+    "    def forward(self, traj, u=None, mesh_p=None):\n",
+    "        \"\"\"Return the weighted distance of the final state from the target.\n",
+    "\n",
+    "        traj: trajectory tensor; only its last entry along dim 0 and index 1\n",
+    "            along the last dim are read\n",
+    "        u: accepted for interface compatibility, not used\n",
+    "        mesh_p: accepted for interface compatibility, not used\n",
+    "        \"\"\"\n",
+    "        final_state = traj[-1, ..., 1]\n",
+    "        # torch.norm reduces over every element, so the result is already a scalar\n",
+    "        return self.Q*torch.norm(final_state - self.target)\n",
+    "    \n",
+    "cost_function = PositioningCost(torch.Tensor([C_b_star]))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Starting simulation... Time: 0.0000 s\n",
+      "Inner-loop did not converge, last cost: 0.762 | Time: 0.0050 s\n",
+      "Inner-loop did not converge, last cost: 0.362 | Time: 0.0100 s\n",
+      "Inner-loop did not converge, last cost: 0.372 | Time: 0.0150 s\n",
+      "Inner-loop did not converge, last cost: 0.380 | Time: 0.0200 s\n",
+      "Inner-loop did not converge, last cost: 0.385 | Time: 0.0250 s\n",
+      "Inner-loop did not converge, last cost: 0.387 | Time: 0.0300 s\n",
+      "Inner-loop did not converge, last cost: 0.386 | Time: 0.0350 s\n",
+      "Inner-loop did not converge, last cost: 0.384 | Time: 0.0400 s\n",
+      "Inner-loop did not converge, last cost: 0.381 | Time: 0.0450 s\n",
+      "Inner-loop did not converge, last cost: 0.377 | Time: 0.0500 s\n",
+      "Inner-loop did not converge, last cost: 0.371 | Time: 0.0550 s\n",
+      "Inner-loop did not converge, last cost: 0.366 | Time: 0.0600 s\n",
+      "Inner-loop did not converge, last cost: 0.360 | Time: 0.0650 s\n",
+      "Inner-loop did not converge, last cost: 0.354 | Time: 0.0700 s\n",
+      "Inner-loop did not converge, last cost: 0.347 | Time: 0.0750 s\n",
+      "Inner-loop did not converge, last cost: 0.341 | Time: 0.0800 s\n",
+      "Inner-loop did not converge, last cost: 0.334 | Time: 0.0850 s\n",
+      "Inner-loop did not converge, last cost: 0.327 | Time: 0.0900 s\n",
+      "Inner-loop did not converge, last cost: 0.321 | Time: 0.0950 s\n",
+      "Inner-loop did not converge, last cost: 0.314 | Time: 0.1000 s\n",
+      "Inner-loop did not converge, last cost: 0.308 | Time: 0.1050 s\n",
+      "Inner-loop did not converge, last cost: 0.302 | Time: 0.1100 s\n",
+      "Inner-loop did not converge, last cost: 0.295 | Time: 0.1150 s\n",
+      "Inner-loop did not converge, last cost: 0.289 | Time: 0.1200 s\n",
+      "Inner-loop did not converge, last cost: 0.284 | Time: 0.1250 s\n",
+      "Inner-loop did not converge, last cost: 0.278 | Time: 0.1300 s\n",
+      "Inner-loop did not converge, last cost: 0.273 | Time: 0.1350 s\n",
+      "Inner-loop did not converge, last cost: 0.267 | Time: 0.1400 s\n",
+      "Inner-loop did not converge, last cost: 0.262 | Time: 0.1450 s\n",
+      "Inner-loop did not converge, last cost: 0.257 | Time: 0.1500 s\n",
+      "Inner-loop did not converge, last cost: 0.253 | Time: 0.1550 s\n",
+      "Inner-loop did not converge, last cost: 0.247 | Time: 0.1600 s\n",
+      "Inner-loop did not converge, last cost: 0.243 | Time: 0.1650 s\n",
+      "Inner-loop did not converge, last cost: 0.239 | Time: 0.1700 s\n",
+      "Inner-loop did not converge, last cost: 0.236 | Time: 0.1750 s\n",
+      "Inner-loop did not converge, last cost: 0.233 | Time: 0.1800 s\n",
+      "Inner-loop did not converge, last cost: 0.229 | Time: 0.1850 s\n",
+      "Inner-loop did not converge, last cost: 0.227 | Time: 0.1900 s\n",
+      "Inner-loop did not converge, last cost: 0.223 | Time: 0.1950 s\n",
+      "Inner-loop did not converge, last cost: 0.221 | Time: 0.2000 s\n",
+      "Inner-loop did not converge, last cost: 0.221 | Time: 0.2050 s\n",
+      "Inner-loop did not converge, last cost: 0.217 | Time: 0.2100 s\n",
+      "Inner-loop did not converge, last cost: 0.214 | Time: 0.2150 s\n",
+      "Inner-loop did not converge, last cost: 0.212 | Time: 0.2200 s\n",
+      "Inner-loop did not converge, last cost: 0.211 | Time: 0.2250 s\n",
+      "Inner-loop did not converge, last cost: 0.209 | Time: 0.2300 s\n",
+      "Inner-loop did not converge, last cost: 0.207 | Time: 0.2350 s\n",
+      "Inner-loop did not converge, last cost: 0.205 | Time: 0.2400 s\n",
+      "Inner-loop did not converge, last cost: 0.204 | Time: 0.2450 s\n",
+      "Inner-loop did not converge, last cost: 0.203 | Time: 0.2500 s\n",
+      "Inner-loop did not converge, last cost: 0.201 | Time: 0.2550 s\n",
+      "Inner-loop did not converge, last cost: 0.200 | Time: 0.2600 s\n",
+      "Inner-loop did not converge, last cost: 0.198 | Time: 0.2650 s\n",
+      "Inner-loop did not converge, last cost: 0.197 | Time: 0.2700 s\n",
+      "Inner-loop did not converge, last cost: 0.196 | Time: 0.2750 s\n",
+      "Inner-loop did not converge, last cost: 0.195 | Time: 0.2800 s\n",
+      "Inner-loop did not converge, last cost: 0.194 | Time: 0.2850 s\n",
+      "Inner-loop did not converge, last cost: 0.193 | Time: 0.2900 s\n",
+      "Inner-loop did not converge, last cost: 0.192 | Time: 0.2950 s\n",
+      "Inner-loop did not converge, last cost: 0.191 | Time: 0.3000 s\n",
+      "Inner-loop did not converge, last cost: 0.191 | Time: 0.3050 s\n",
+      "Inner-loop did not converge, last cost: 0.190 | Time: 0.3100 s\n",
+      "Inner-loop did not converge, last cost: 0.189 | Time: 0.3150 s\n",
+      "Inner-loop did not converge, last cost: 0.188 | Time: 0.3200 s\n",
+      "Inner-loop did not converge, last cost: 0.188 | Time: 0.3250 s\n",
+      "Inner-loop did not converge, last cost: 0.187 | Time: 0.3300 s\n",
+      "Inner-loop did not converge, last cost: 0.186 | Time: 0.3350 s\n",
+      "Inner-loop did not converge, last cost: 0.186 | Time: 0.3400 s\n",
+      "Inner-loop did not converge, last cost: 0.185 | Time: 0.3450 s\n",
+      "Inner-loop did not converge, last cost: 0.185 | Time: 0.3500 s\n",
+      "Inner-loop did not converge, last cost: 0.184 | Time: 0.3550 s\n",
+      "Inner-loop did not converge, last cost: 0.184 | Time: 0.3600 s\n",
+      "Inner-loop did not converge, last cost: 0.183 | Time: 0.3650 s\n",
+      "Inner-loop did not converge, last cost: 0.183 | Time: 0.3700 s\n",
+      "Inner-loop did not converge, last cost: 0.182 | Time: 0.3750 s\n",
+      "Inner-loop did not converge, last cost: 0.182 | Time: 0.3800 s\n",
+      "Inner-loop did not converge, last cost: 0.182 | Time: 0.3850 s\n",
+      "Inner-loop did not converge, last cost: 0.181 | Time: 0.3900 s\n",
+      "Inner-loop did not converge, last cost: 0.181 | Time: 0.3950 s\n",
+      "Inner-loop did not converge, last cost: 0.181 | Time: 0.4000 s\n",
+      "Inner-loop did not converge, last cost: 0.180 | Time: 0.4050 s\n",
+      "Inner-loop did not converge, last cost: 0.180 | Time: 0.4100 s\n",
+      "Inner-loop did not converge, last cost: 0.180 | Time: 0.4150 s\n",
+      "Inner-loop did not converge, last cost: 0.179 | Time: 0.4200 s\n",
+      "Inner-loop did not converge, last cost: 0.179 | Time: 0.4250 s\n",
+      "Inner-loop did not converge, last cost: 0.179 | Time: 0.4300 s\n",
+      "Inner-loop did not converge, last cost: 0.179 | Time: 0.4350 s\n",
+      "Inner-loop did not converge, last cost: 0.178 | Time: 0.4400 s\n",
+      "Inner-loop did not converge, last cost: 0.178 | Time: 0.4450 s\n",
+      "Inner-loop did not converge, last cost: 0.178 | Time: 0.4500 s\n",
+      "Inner-loop did not converge, last cost: 0.178 | Time: 0.4550 s\n",
+      "Inner-loop did not converge, last cost: 0.178 | Time: 0.4600 s\n",
+      "Inner-loop did not converge, last cost: 0.177 | Time: 0.4650 s\n",
+      "Inner-loop did not converge, last cost: 0.177 | Time: 0.4700 s\n",
+      "Inner-loop did not converge, last cost: 0.177 | Time: 0.4750 s\n",
+      "Inner-loop did not converge, last cost: 0.177 | Time: 0.4800 s\n",
+      "Inner-loop did not converge, last cost: 0.177 | Time: 0.4850 s\n",
+      "Inner-loop did not converge, last cost: 0.176 | Time: 0.4900 s\n",
+      "Inner-loop did not converge, last cost: 0.176 | Time: 0.4950 s\n",
+      "Inner-loop did not converge, last cost: 0.176 | Time: 0.5000 s\n",
+      "The simulation has ended!\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Build the MPC around the nominal system, the cost and the state constraints\n",
+    "mpc = TorchMPC(system, cost_function, t_span, opt, eps_accept=eps_accept, max_g_iters=max_iters,\n",
+    "                lookahead_steps=lookahead_steps, lower_bounds=lower_bounds,\n",
+    "                upper_bounds=upper_bounds, penalties=penalties).to(device)\n",
+    "\n",
+    "# Closed-loop run against the simulated plant, starting from the sampled batch x0\n",
+    "mpc.forward_simulation(real_system, x0, t_span)\n",
+    "\n",
+    "# Create the output folder first: torch.save does not create missing directories,\n",
+    "# and failing here would throw away the whole simulation\n",
+    "os.makedirs('data', exist_ok=True)\n",
+    "\n",
+    "# Save the learned controller and nominal trajectory\n",
+    "with torch.no_grad():\n",
+    "    torch.save(mpc.control_inputs, 'data/control_inputs.pt')\n",
+    "    torch.save(mpc.trajectory_nominal, 'data/trajectory.pt')"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3 (ipykernel)",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.9.5"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 4
+}