{ "cells": [ { "cell_type": "markdown", "metadata": { "colab_type": "text", "id": "x83dMPapQBN6" }, "source": [ "# Gyroscope DDPG/TD3/SAC training (spinup library)" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": {}, "colab_type": "code", "id": "8inmkEG5QHqx" }, "outputs": [], "source": [ "from google.colab import drive\n", "drive.mount('/content/drive')" ] }, { "cell_type": "code", "execution_count": null, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 35 }, "colab_type": "code", "executionInfo": { "elapsed": 655, "status": "ok", "timestamp": 1584030129316, "user": { "displayName": "Matthieu Le Cauchois", "photoUrl": "https://lh3.googleusercontent.com/a-/AOh14GgY9gRlHHK-FHlINeRnTJw_wewJsr639GH8MAWl=s64", "userId": "10992927378504656501" }, "user_tz": -60 }, "id": "DnnJGcnsQvZC", "outputId": "9d6d1408-da29-44ed-af74-4ebdc2bd865a" }, "outputs": [], "source": [ "cd drive/My\\ Drive/Colab Notebooks/DDPG_uda_v0/" ] }, { "cell_type": "code", "execution_count": 1, "metadata": { "colab": {}, "colab_type": "code", "id": "fuJhdd479TpP" }, "outputs": [ { "data": { "text/html": [ "
" ], "text/plain": [ "" ] }, "metadata": {}, "output_type": "display_data" }, { "data": { "application/javascript": [ "if (typeof Jupyter !== \"undefined\") { window.__context = { glowscript_container: $(\"#glowscript\").removeAttr(\"id\")};}else{ element.textContent = ' ';}" ], "text/plain": [ "" ] }, "metadata": {}, "output_type": "display_data" }, { "ename": "ModuleNotFoundError", "evalue": "No module named 'spinup'", "output_type": "error", "traceback": [ "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", "\u001b[0;31mModuleNotFoundError\u001b[0m Traceback (most recent call last)", "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m\u001b[0m\n\u001b[1;32m 12\u001b[0m \u001b[0;32mfrom\u001b[0m \u001b[0mvpython\u001b[0m \u001b[0;32mimport\u001b[0m \u001b[0;34m*\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 13\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m---> 14\u001b[0;31m \u001b[0;32mimport\u001b[0m \u001b[0mspinup\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m", "\u001b[0;31mModuleNotFoundError\u001b[0m: No module named 'spinup'" ] } ], "source": [ "import gym\n", "from gym import spaces\n", "from gym.utils import seeding\n", "from os import path\n", "from scipy.integrate import solve_ivp\n", "import random\n", "import torch\n", "import numpy as np\n", "from collections import deque\n", "import matplotlib.pyplot as plt\n", "%matplotlib inline\n", "from vpython import *\n", "\n", "import spinup" ] }, { "cell_type": "markdown", "metadata": { "colab_type": "text", "id": "O0O0t5ZR9Tp6" }, "source": [ "## Environment Class and Modules" ] }, { "cell_type": "code", "execution_count": 2, "metadata": { "colab": {}, "colab_type": "code", "id": "Al_k1rtvQBOM" }, "outputs": [], "source": [ "class GyroscopeEnv(gym.Env):\n", " \n", " \n", " \"\"\"\n", " GyroscopeEnv is a double gimbal control moment gyroscope (DGCMG) with 2 input voltage u1 and u2 \n", " on the two 
gimbals, and disk speed assumed constant (parameter w). Simulation is based on the \n", " Quanser 3-DOF gyroscope setup.\n", " \n", " \n", " **STATE:**\n", " The state consists of the angle and angular speed of the outer red gimbal (theta = x1, thetadot = x2),\n", " the angle and angular speed of the inner blue gimbal (phi = x3, phidot = x4), the difference to the reference\n", " for tracking on theta and phi (tracking error theta = diff_x1, tracking error phi = diff_x3), and the \n", " disk speed (disk speed = w):\n", " \n", " state = [x1, x2, x3, x4, diff_x1, diff_x3, w]\n", " \n", " **ACTIONS:**\n", " The actions are the input voltage to create the red and blue gimbal torque (red voltage = u1, blue voltage = u2),\n", " and are continuous in a range of -10 and 10V:\n", " \n", " action = [u1,u2]\n", " \n", " \"\"\"\n", " \n", " \n", " metadata = {\n", " 'render.modes' : ['human', 'rgb_array'],\n", " 'video.frames_per_second' : 30\n", " }\n", "\n", " def __init__(self):\n", " \n", " # Inertias in Kg*m2\n", " self.Jbx1 = 0.0019\n", " self.Jbx2 = 0.0008\n", " self.Jbx3 = 0.0012\n", " self.Jrx1 = 0.0179\n", " self.Jdx1 = 0.0028\n", " self.Jdx3 = 0.0056\n", " \n", " # Combined inertias\n", " self.J1 = self.Jbx1 - self.Jbx3 + self.Jdx1 - self.Jdx3\n", " self.J2 = self.Jbx1 + self.Jdx1 + self.Jrx1\n", " self.J3 = self.Jbx2 + self.Jdx1\n", "\n", " # Motor constants\n", " self.Kamp = 0.5 # A/V\n", " self.Ktorque = 0.0704 # Nm/A\n", " self.eff = 0.86\n", " self.nRed = 1.5\n", " self.nBlue = 1\n", " self.KtotRed = self.Kamp*self.Ktorque*self.eff*self.nRed \n", " self.KtotBlue = self.Kamp*self.Ktorque*self.eff*self.nBlue \n", " \n", " # Time step in s\n", " self.dt = 0.05\n", " \n", " # Error\n", " self.int_diff_x1 = 0\n", " self.int_diff_x3 = 0\n", " \n", " # Action space\n", " self.maxVoltage = 10 # V\n", " self.highAct = np.array([self.maxVoltage,self.maxVoltage])\n", " self.action_space = spaces.Box(low = -self.highAct, high = self.highAct, dtype=np.float32) \n", " \n", " 
# Observation space (here it is equal to state space)\n", " self.maxSpeed = 100 * 2 * np.pi / 60\n", " self.maxAngle = np.pi\n", " self.maxdiskSpeed = 300 * 2 * np.pi / 60\n", " self.highObs = np.array([self.maxAngle,self.maxSpeed,self.maxAngle,self.maxSpeed,self.maxAngle,self.maxAngle,self.maxdiskSpeed])\n", " self.observation_space = spaces.Box(low = -self.highObs, high = self.highObs, dtype=np.float32)\n", "\n", " # Seed for random number generation\n", " self.seed()\n", " \n", " self.viewer = None\n", "\n", " def seed(self, seed=None):\n", " self.np_random, seed = seeding.np_random(seed)\n", " return [seed]\n", " \n", " \n", "\n", " def step(self,u):\n", " x1, x2, x3, x4, x1_ref, x3_ref, w= self.state \n", " u1,u2 = u\n", " \n", " # Angle error\n", " diff_x1 = angle_normalize(x1 - x1_ref)\n", " diff_x3 = angle_normalize(x3 - x3_ref)\n", " \n", " # Integral of error\n", " self.int_diff_x1 = self.int_diff_x1 + diff_x1\n", " self.int_diff_x3 = self.int_diff_x3 + diff_x3\n", " \n", " # Reward 1: differentiable reward (LQR obj function)\n", " reward = -((3*diff_x1)**2 + (3*diff_x3)**2 + (.2*x2)**2 + (.2*x4)**2 + (.1*u1)**2 + (.1*u2)**2)\\\n", " #-(0.01*abs(self.int_diff_x1) + 0.01*abs(self.int_diff_x3))\n", "\n", " \"\"\"# Count time spent in goal:\n", " if abs(diff_x1)<0.05 and abs(diff_x3)<0.05:\n", " self.countGoal +=1\n", " else:\n", " self.countGoal = 0\n", " \n", " # Reward 2: sparse reward for staying in goal range for a long time \n", " if self.countGoal >= (self.timeGoal)/self.dt: #max expected reward over length becomes 0 + (totaltime-goaltime)\n", " reward += 1\"\"\"\n", "\n", "\n", " results = solve_ivp(fun = dxdt, t_span = (0, self.dt), y0 = [x1,x2,x3,x4], method='RK45', args=(u1,u2,self))\n", " \n", " x1 = angle_normalize(results.y[0][-1])\n", " x2 = np.clip(results.y[1][-1],-self.maxSpeed,self.maxSpeed)\n", " x3 = angle_normalize(results.y[2][-1])\n", " x4 = np.clip(results.y[3][-1],-self.maxSpeed,self.maxSpeed)\n", " \n", " self.state = 
np.asarray([x1,x2,x3,x4,x1_ref, x3_ref,w])\n", "\n", " return (self.state, reward, False, {})\n", "\n", " def reset(self, state = None):\n", " \n", " \n", " # Generate random state (for training) or use given state (for simulation)\n", " if state is None:\n", " self.state = self.np_random.uniform(low=-self.highObs, high=self.highObs)\n", " else:\n", " self.state = state\n", "\n", " \n", " return self.state\n", "\n", "\n", " def render(self, mode='human'):\n", " return None\n", " \n", " def close(self):\n", " if self.viewer:\n", " self.viewer.close()\n", " self.viewer = None\n", " \n", "def dxdt(t, x, u1, u2, gyro):\n", " \n", " # Rewrite constants shorter\n", " J1 = gyro.J1\n", " J2 = gyro.J2\n", " J3 = gyro.J3\n", " Jdx3 = gyro.Jdx3\n", " KtotRed = gyro.KtotRed\n", " KtotBlue = gyro.KtotBlue\n", " w = x[-1]\n", "\n", " # Convert input voltage to input torque\n", " u1,u2 = KtotRed*u1, KtotBlue*u2\n", " \n", " # Equations of motion \n", " dx_dt = [0, 0, 0, 0]\n", " dx_dt[0] = x[1]\n", " dx_dt[1] = (u1+J1*np.sin(2*x[2])*x[1]*x[3]-Jdx3*np.cos(x[2])*x[3]*w)/(J2 + J1*np.power(np.sin(x[2]),2))\n", " dx_dt[2] = x[3]\n", " dx_dt[3] = (u2 - J1*np.cos(x[2])*np.sin(x[2])*np.power(x[1],2)+Jdx3*np.cos(x[2])*x[1]*w)/J3\n", " return dx_dt\n", " \n", "def angle_normalize(x):\n", " return (((x+np.pi) % (2*np.pi)) - np.pi) # To keep the angles between -pi and pi\n" ] }, { "cell_type": "markdown", "metadata": { "colab_type": "text", "id": "be0wYIeBQBOc" }, "source": [ "## Training" ] }, { "cell_type": "code", "execution_count": 3, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 533 }, "colab_type": "code", "executionInfo": { "elapsed": 654004, "status": "error", "timestamp": 1584037207187, "user": { "displayName": "Matthieu Le Cauchois", "photoUrl": "https://lh3.googleusercontent.com/a-/AOh14GgY9gRlHHK-FHlINeRnTJw_wewJsr639GH8MAWl=s64", "userId": "10992927378504656501" }, "user_tz": -60 }, "id": "fLyFHs0yQBOd", "outputId": 
"260489ff-5e40-416a-e529-5a0cfcaefceb" }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Warning: Log dir model already exists! Storing info there anyway.\n", "\u001b[32;1mLogging data to model/progress.txt\u001b[0m\n", "\u001b[36;1mSaving config:\n", "\u001b[0m\n", "{\n", " \"ac_kwargs\":\t{},\n", " \"act_noise\":\t0.1,\n", " \"actor_critic\":\t\"MLPActorCritic\",\n", " \"batch_size\":\t100,\n", " \"env_fn\":\t\"GyroscopeEnv\",\n", " \"epochs\":\t120,\n", " \"exp_name\":\t\"v0\",\n", " \"gamma\":\t0.95,\n", " \"logger\":\t{\n", " \"\":\t{\n", " \"epoch_dict\":\t{},\n", " \"exp_name\":\t\"v0\",\n", " \"first_row\":\ttrue,\n", " \"log_current_row\":\t{},\n", " \"log_headers\":\t[],\n", " \"output_dir\":\t\"model\",\n", " \"output_file\":\t{\n", " \"<_io.TextIOWrapper name='model/progress.txt' mode='w' encoding='UTF-8'>\":\t{\n", " \"mode\":\t\"w\"\n", " }\n", " }\n", " }\n", " },\n", " \"logger_kwargs\":\t{\n", " \"exp_name\":\t\"v0\",\n", " \"output_dir\":\t\"model\"\n", " },\n", " \"max_ep_len\":\t110,\n", " \"noise_clip\":\t0.5,\n", " \"num_test_episodes\":\t10,\n", " \"pi_lr\":\t0.001,\n", " \"policy_delay\":\t2,\n", " \"polyak\":\t0.995,\n", " \"q_lr\":\t0.001,\n", " \"replay_size\":\t1000000,\n", " \"save_freq\":\t1,\n", " \"seed\":\t0,\n", " \"start_steps\":\t20000,\n", " \"steps_per_epoch\":\t2200,\n", " \"target_noise\":\t0.2,\n", " \"update_after\":\t800,\n", " \"update_every\":\t50\n", "}\n", "\u001b[32;1m\n", "Number of parameters: \t pi: 68354, \t q1: 68609, \t q2: 68609\n", "\u001b[0m\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "/home/matthieulc/Documents/MA2/PS1/ps1venv/lib/python3.6/site-packages/gym/logger.py:30: UserWarning: \u001b[33mWARN: Box bound precision lowered by casting to float32\u001b[0m\n", " warnings.warn(colorize('%s: %s'%('WARN', msg % args), 'yellow'))\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "---------------------------------------\n", "| Epoch | 1 |\n", "| AverageEpRet 
| -6.44e+03 |\n", "| StdEpRet | 1.49e+03 |\n", "| MaxEpRet | -4.55e+03 |\n", "| MinEpRet | -9.52e+03 |\n", "| AverageTestEpRet | -7.13e+03 |\n", "| StdTestEpRet | 1.25e+03 |\n", "| MaxTestEpRet | -4.01e+03 |\n", "| MinTestEpRet | -8.49e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.2e+03 |\n", "| AverageQ1Vals | -123 |\n", "| StdQ1Vals | 54.5 |\n", "| MaxQ1Vals | 0.0809 |\n", "| MinQ1Vals | -364 |\n", "| AverageQ2Vals | -123 |\n", "| StdQ2Vals | 54.6 |\n", "| MaxQ2Vals | 1.77 |\n", "| MinQ2Vals | -373 |\n", "| LossPi | 112 |\n", "| LossQ | 1.95e+03 |\n", "| Time | 15.8 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 2 |\n", "| AverageEpRet | -6.72e+03 |\n", "| StdEpRet | 1.81e+03 |\n", "| MaxEpRet | -4.58e+03 |\n", "| MinEpRet | -1.07e+04 |\n", "| AverageTestEpRet | -8.21e+03 |\n", "| StdTestEpRet | 1.1e+03 |\n", "| MaxTestEpRet | -6.46e+03 |\n", "| MinTestEpRet | -1.01e+04 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 4.4e+03 |\n", "| AverageQ1Vals | -276 |\n", "| StdQ1Vals | 98.9 |\n", "| MaxQ1Vals | -54.4 |\n", "| MinQ1Vals | -672 |\n", "| AverageQ2Vals | -276 |\n", "| StdQ2Vals | 99.2 |\n", "| MaxQ2Vals | -51.6 |\n", "| MinQ2Vals | -686 |\n", "| LossPi | 256 |\n", "| LossQ | 2.12e+03 |\n", "| Time | 42.1 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 3 |\n", "| AverageEpRet | -7.08e+03 |\n", "| StdEpRet | 1.22e+03 |\n", "| MaxEpRet | -4.94e+03 |\n", "| MinEpRet | -9.27e+03 |\n", "| AverageTestEpRet | -5.91e+03 |\n", "| StdTestEpRet | 1.83e+03 |\n", "| MaxTestEpRet | -3.79e+03 |\n", "| MinTestEpRet | -9.63e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 6.6e+03 |\n", "| AverageQ1Vals | -414 |\n", "| StdQ1Vals | 128 |\n", "| MaxQ1Vals | -36.3 |\n", "| MinQ1Vals | -952 |\n", "| AverageQ2Vals | -414 |\n", "| StdQ2Vals | 128 |\n", "| MaxQ2Vals | -26.8 |\n", 
"| MinQ2Vals | -950 |\n", "| LossPi | 382 |\n", "| LossQ | 2.76e+03 |\n", "| Time | 67.9 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 4 |\n", "| AverageEpRet | -7.06e+03 |\n", "| StdEpRet | 1.53e+03 |\n", "| MaxEpRet | -4.98e+03 |\n", "| MinEpRet | -1.09e+04 |\n", "| AverageTestEpRet | -5.01e+03 |\n", "| StdTestEpRet | 1.18e+03 |\n", "| MaxTestEpRet | -3.34e+03 |\n", "| MinTestEpRet | -6.44e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 8.8e+03 |\n", "| AverageQ1Vals | -501 |\n", "| StdQ1Vals | 154 |\n", "| MaxQ1Vals | 11.2 |\n", "| MinQ1Vals | -1.07e+03 |\n", "| AverageQ2Vals | -501 |\n", "| StdQ2Vals | 154 |\n", "| MaxQ2Vals | 16.9 |\n", "| MinQ2Vals | -1.11e+03 |\n", "| LossPi | 459 |\n", "| LossQ | 3.94e+03 |\n", "| Time | 92 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 5 |\n", "| AverageEpRet | -6.3e+03 |\n", "| StdEpRet | 1.14e+03 |\n", "| MaxEpRet | -3.87e+03 |\n", "| MinEpRet | -8.1e+03 |\n", "| AverageTestEpRet | -4.27e+03 |\n", "| StdTestEpRet | 1.52e+03 |\n", "| MaxTestEpRet | -1.82e+03 |\n", "| MinTestEpRet | -6.62e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.1e+04 |\n", "| AverageQ1Vals | -552 |\n", "| StdQ1Vals | 173 |\n", "| MaxQ1Vals | -15.7 |\n", "| MinQ1Vals | -1.15e+03 |\n", "| AverageQ2Vals | -552 |\n", "| StdQ2Vals | 172 |\n", "| MaxQ2Vals | 17.8 |\n", "| MinQ2Vals | -1.17e+03 |\n", "| LossPi | 508 |\n", "| LossQ | 4.63e+03 |\n", "| Time | 116 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 6 |\n", "| AverageEpRet | -6.76e+03 |\n", "| StdEpRet | 1.35e+03 |\n", "| MaxEpRet | -4.61e+03 |\n", "| MinEpRet | -1.13e+04 |\n", "| AverageTestEpRet | -3.67e+03 |\n", "| StdTestEpRet | 994 |\n", "| MaxTestEpRet | -2.24e+03 |\n", "| MinTestEpRet | -5.28e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| 
TotalEnvInteracts | 1.32e+04 |\n", "| AverageQ1Vals | -574 |\n", "| StdQ1Vals | 186 |\n", "| MaxQ1Vals | -39.4 |\n", "| MinQ1Vals | -1.41e+03 |\n", "| AverageQ2Vals | -574 |\n", "| StdQ2Vals | 185 |\n", "| MaxQ2Vals | -27.9 |\n", "| MinQ2Vals | -1.29e+03 |\n", "| LossPi | 527 |\n", "| LossQ | 5.18e+03 |\n", "| Time | 139 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 7 |\n", "| AverageEpRet | -7.02e+03 |\n", "| StdEpRet | 1.79e+03 |\n", "| MaxEpRet | -3.34e+03 |\n", "| MinEpRet | -9.5e+03 |\n", "| AverageTestEpRet | -3.05e+03 |\n", "| StdTestEpRet | 1.56e+03 |\n", "| MaxTestEpRet | -1.34e+03 |\n", "| MinTestEpRet | -6.7e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.54e+04 |\n", "| AverageQ1Vals | -582 |\n", "| StdQ1Vals | 196 |\n", "| MaxQ1Vals | -68.9 |\n", "| MinQ1Vals | -1.38e+03 |\n", "| AverageQ2Vals | -582 |\n", "| StdQ2Vals | 195 |\n", "| MaxQ2Vals | -43.9 |\n", "| MinQ2Vals | -1.31e+03 |\n", "| LossPi | 534 |\n", "| LossQ | 5.26e+03 |\n", "| Time | 163 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 8 |\n", "| AverageEpRet | -6.62e+03 |\n", "| StdEpRet | 1.42e+03 |\n", "| MaxEpRet | -4.04e+03 |\n", "| MinEpRet | -9.02e+03 |\n", "| AverageTestEpRet | -1.54e+03 |\n", "| StdTestEpRet | 771 |\n", "| MaxTestEpRet | -595 |\n", "| MinTestEpRet | -3e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.76e+04 |\n", "| AverageQ1Vals | -573 |\n", "| StdQ1Vals | 209 |\n", "| MaxQ1Vals | -4.68 |\n", "| MinQ1Vals | -1.34e+03 |\n", "| AverageQ2Vals | -573 |\n", "| StdQ2Vals | 209 |\n", "| MaxQ2Vals | 22.9 |\n", "| MinQ2Vals | -1.35e+03 |\n", "| LossPi | 522 |\n", "| LossQ | 5.51e+03 |\n", "| Time | 187 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 9 |\n", "| AverageEpRet | -6.7e+03 |\n", "| StdEpRet | 1.58e+03 |\n", "| MaxEpRet | 
-4.21e+03 |\n", "| MinEpRet | -9.46e+03 |\n", "| AverageTestEpRet | -842 |\n", "| StdTestEpRet | 304 |\n", "| MaxTestEpRet | -411 |\n", "| MinTestEpRet | -1.52e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.98e+04 |\n", "| AverageQ1Vals | -546 |\n", "| StdQ1Vals | 223 |\n", "| MaxQ1Vals | 71.2 |\n", "| MinQ1Vals | -1.4e+03 |\n", "| AverageQ2Vals | -546 |\n", "| StdQ2Vals | 222 |\n", "| MaxQ2Vals | 60.5 |\n", "| MinQ2Vals | -1.41e+03 |\n", "| LossPi | 490 |\n", "| LossQ | 5.83e+03 |\n", "| Time | 211 |\n", "---------------------------------------\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "---------------------------------------\n", "| Epoch | 10 |\n", "| AverageEpRet | -1.66e+03 |\n", "| StdEpRet | 1.99e+03 |\n", "| MaxEpRet | -153 |\n", "| MinEpRet | -8.64e+03 |\n", "| AverageTestEpRet | -872 |\n", "| StdTestEpRet | 378 |\n", "| MaxTestEpRet | -487 |\n", "| MinTestEpRet | -1.53e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.2e+04 |\n", "| AverageQ1Vals | -488 |\n", "| StdQ1Vals | 243 |\n", "| MaxQ1Vals | 151 |\n", "| MinQ1Vals | -1.43e+03 |\n", "| AverageQ2Vals | -488 |\n", "| StdQ2Vals | 243 |\n", "| MaxQ2Vals | 127 |\n", "| MinQ2Vals | -1.4e+03 |\n", "| LossPi | 432 |\n", "| LossQ | 5.85e+03 |\n", "| Time | 239 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 11 |\n", "| AverageEpRet | -947 |\n", "| StdEpRet | 493 |\n", "| MaxEpRet | -232 |\n", "| MinEpRet | -1.89e+03 |\n", "| AverageTestEpRet | -1.09e+03 |\n", "| StdTestEpRet | 661 |\n", "| MaxTestEpRet | -271 |\n", "| MinTestEpRet | -2.78e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.42e+04 |\n", "| AverageQ1Vals | -425 |\n", "| StdQ1Vals | 258 |\n", "| MaxQ1Vals | 141 |\n", "| MinQ1Vals | -1.4e+03 |\n", "| AverageQ2Vals | -425 |\n", "| StdQ2Vals | 258 |\n", "| MaxQ2Vals | 137 |\n", "| MinQ2Vals | -1.39e+03 |\n", "| LossPi | 376 
|\n", "| LossQ | 4.71e+03 |\n", "| Time | 263 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 12 |\n", "| AverageEpRet | -888 |\n", "| StdEpRet | 472 |\n", "| MaxEpRet | -325 |\n", "| MinEpRet | -2.33e+03 |\n", "| AverageTestEpRet | -602 |\n", "| StdTestEpRet | 199 |\n", "| MaxTestEpRet | -286 |\n", "| MinTestEpRet | -910 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.64e+04 |\n", "| AverageQ1Vals | -384 |\n", "| StdQ1Vals | 264 |\n", "| MaxQ1Vals | 161 |\n", "| MinQ1Vals | -1.41e+03 |\n", "| AverageQ2Vals | -384 |\n", "| StdQ2Vals | 264 |\n", "| MaxQ2Vals | 142 |\n", "| MinQ2Vals | -1.39e+03 |\n", "| LossPi | 341 |\n", "| LossQ | 3.72e+03 |\n", "| Time | 288 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 13 |\n", "| AverageEpRet | -797 |\n", "| StdEpRet | 536 |\n", "| MaxEpRet | -48.6 |\n", "| MinEpRet | -2.46e+03 |\n", "| AverageTestEpRet | -857 |\n", "| StdTestEpRet | 354 |\n", "| MaxTestEpRet | -467 |\n", "| MinTestEpRet | -1.77e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.86e+04 |\n", "| AverageQ1Vals | -354 |\n", "| StdQ1Vals | 270 |\n", "| MaxQ1Vals | 169 |\n", "| MinQ1Vals | -1.36e+03 |\n", "| AverageQ2Vals | -354 |\n", "| StdQ2Vals | 270 |\n", "| MaxQ2Vals | 166 |\n", "| MinQ2Vals | -1.35e+03 |\n", "| LossPi | 314 |\n", "| LossQ | 3.07e+03 |\n", "| Time | 312 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 14 |\n", "| AverageEpRet | -926 |\n", "| StdEpRet | 418 |\n", "| MaxEpRet | -333 |\n", "| MinEpRet | -1.67e+03 |\n", "| AverageTestEpRet | -902 |\n", "| StdTestEpRet | 481 |\n", "| MaxTestEpRet | -146 |\n", "| MinTestEpRet | -2.01e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 3.08e+04 |\n", "| AverageQ1Vals | -326 |\n", "| StdQ1Vals | 274 |\n", "| MaxQ1Vals | 192 |\n", "| MinQ1Vals 
| -1.34e+03 |\n", "| AverageQ2Vals | -326 |\n", "| StdQ2Vals | 274 |\n", "| MaxQ2Vals | 191 |\n", "| MinQ2Vals | -1.34e+03 |\n", "| LossPi | 288 |\n", "| LossQ | 2.66e+03 |\n", "| Time | 337 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 15 |\n", "| AverageEpRet | -738 |\n", "| StdEpRet | 339 |\n", "| MaxEpRet | -267 |\n", "| MinEpRet | -1.46e+03 |\n", "| AverageTestEpRet | -1.45e+03 |\n", "| StdTestEpRet | 1.42e+03 |\n", "| MaxTestEpRet | -185 |\n", "| MinTestEpRet | -4.34e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 3.3e+04 |\n", "| AverageQ1Vals | -297 |\n", "| StdQ1Vals | 279 |\n", "| MaxQ1Vals | 220 |\n", "| MinQ1Vals | -1.31e+03 |\n", "| AverageQ2Vals | -297 |\n", "| StdQ2Vals | 279 |\n", "| MaxQ2Vals | 221 |\n", "| MinQ2Vals | -1.31e+03 |\n", "| LossPi | 261 |\n", "| LossQ | 2.37e+03 |\n", "| Time | 362 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 16 |\n", "| AverageEpRet | -1.37e+03 |\n", "| StdEpRet | 1.85e+03 |\n", "| MaxEpRet | -223 |\n", "| MinEpRet | -8.63e+03 |\n", "| AverageTestEpRet | -595 |\n", "| StdTestEpRet | 159 |\n", "| MaxTestEpRet | -339 |\n", "| MinTestEpRet | -913 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 3.52e+04 |\n", "| AverageQ1Vals | -267 |\n", "| StdQ1Vals | 277 |\n", "| MaxQ1Vals | 279 |\n", "| MinQ1Vals | -1.3e+03 |\n", "| AverageQ2Vals | -267 |\n", "| StdQ2Vals | 277 |\n", "| MaxQ2Vals | 269 |\n", "| MinQ2Vals | -1.27e+03 |\n", "| LossPi | 231 |\n", "| LossQ | 2.21e+03 |\n", "| Time | 386 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 17 |\n", "| AverageEpRet | -754 |\n", "| StdEpRet | 595 |\n", "| MaxEpRet | -202 |\n", "| MinEpRet | -2.5e+03 |\n", "| AverageTestEpRet | -636 |\n", "| StdTestEpRet | 389 |\n", "| MaxTestEpRet | -147 |\n", "| MinTestEpRet | -1.49e+03 |\n", "| EpLen | 110 
|\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 3.74e+04 |\n", "| AverageQ1Vals | -245 |\n", "| StdQ1Vals | 273 |\n", "| MaxQ1Vals | 278 |\n", "| MinQ1Vals | -1.25e+03 |\n", "| AverageQ2Vals | -245 |\n", "| StdQ2Vals | 273 |\n", "| MaxQ2Vals | 268 |\n", "| MinQ2Vals | -1.24e+03 |\n", "| LossPi | 211 |\n", "| LossQ | 2.03e+03 |\n", "| Time | 411 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 18 |\n", "| AverageEpRet | -616 |\n", "| StdEpRet | 339 |\n", "| MaxEpRet | -241 |\n", "| MinEpRet | -1.4e+03 |\n", "| AverageTestEpRet | -713 |\n", "| StdTestEpRet | 304 |\n", "| MaxTestEpRet | -419 |\n", "| MinTestEpRet | -1.53e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 3.96e+04 |\n", "| AverageQ1Vals | -226 |\n", "| StdQ1Vals | 268 |\n", "| MaxQ1Vals | 275 |\n", "| MinQ1Vals | -1.19e+03 |\n", "| AverageQ2Vals | -226 |\n", "| StdQ2Vals | 268 |\n", "| MaxQ2Vals | 265 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 194 |\n", "| LossQ | 1.83e+03 |\n", "| Time | 434 |\n", "---------------------------------------\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "---------------------------------------\n", "| Epoch | 19 |\n", "| AverageEpRet | -745 |\n", "| StdEpRet | 537 |\n", "| MaxEpRet | -109 |\n", "| MinEpRet | -2.14e+03 |\n", "| AverageTestEpRet | -963 |\n", "| StdTestEpRet | 641 |\n", "| MaxTestEpRet | -159 |\n", "| MinTestEpRet | -2.65e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 4.18e+04 |\n", "| AverageQ1Vals | -214 |\n", "| StdQ1Vals | 263 |\n", "| MaxQ1Vals | 273 |\n", "| MinQ1Vals | -1.18e+03 |\n", "| AverageQ2Vals | -214 |\n", "| StdQ2Vals | 263 |\n", "| MaxQ2Vals | 266 |\n", "| MinQ2Vals | -1.18e+03 |\n", "| LossPi | 183 |\n", "| LossQ | 1.67e+03 |\n", "| Time | 458 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 20 |\n", "| AverageEpRet | -711 |\n", "| StdEpRet 
| 511 |\n", "| MaxEpRet | -18.3 |\n", "| MinEpRet | -1.83e+03 |\n", "| AverageTestEpRet | -803 |\n", "| StdTestEpRet | 372 |\n", "| MaxTestEpRet | -126 |\n", "| MinTestEpRet | -1.53e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 4.4e+04 |\n", "| AverageQ1Vals | -198 |\n", "| StdQ1Vals | 260 |\n", "| MaxQ1Vals | 276 |\n", "| MinQ1Vals | -1.19e+03 |\n", "| AverageQ2Vals | -198 |\n", "| StdQ2Vals | 260 |\n", "| MaxQ2Vals | 268 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 169 |\n", "| LossQ | 1.57e+03 |\n", "| Time | 483 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 21 |\n", "| AverageEpRet | -664 |\n", "| StdEpRet | 403 |\n", "| MaxEpRet | -176 |\n", "| MinEpRet | -1.87e+03 |\n", "| AverageTestEpRet | -577 |\n", "| StdTestEpRet | 343 |\n", "| MaxTestEpRet | -133 |\n", "| MinTestEpRet | -1.16e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 4.62e+04 |\n", "| AverageQ1Vals | -187 |\n", "| StdQ1Vals | 254 |\n", "| MaxQ1Vals | 269 |\n", "| MinQ1Vals | -1.15e+03 |\n", "| AverageQ2Vals | -187 |\n", "| StdQ2Vals | 254 |\n", "| MaxQ2Vals | 262 |\n", "| MinQ2Vals | -1.13e+03 |\n", "| LossPi | 159 |\n", "| LossQ | 1.48e+03 |\n", "| Time | 507 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 22 |\n", "| AverageEpRet | -662 |\n", "| StdEpRet | 341 |\n", "| MaxEpRet | -261 |\n", "| MinEpRet | -1.64e+03 |\n", "| AverageTestEpRet | -780 |\n", "| StdTestEpRet | 458 |\n", "| MaxTestEpRet | -39.9 |\n", "| MinTestEpRet | -1.77e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 4.84e+04 |\n", "| AverageQ1Vals | -178 |\n", "| StdQ1Vals | 249 |\n", "| MaxQ1Vals | 260 |\n", "| MinQ1Vals | -1.15e+03 |\n", "| AverageQ2Vals | -178 |\n", "| StdQ2Vals | 249 |\n", "| MaxQ2Vals | 258 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 151 |\n", "| LossQ | 1.35e+03 |\n", "| Time | 531 |\n", 
"---------------------------------------\n", "---------------------------------------\n", "| Epoch | 23 |\n", "| AverageEpRet | -524 |\n", "| StdEpRet | 312 |\n", "| MaxEpRet | -85.9 |\n", "| MinEpRet | -1.22e+03 |\n", "| AverageTestEpRet | -768 |\n", "| StdTestEpRet | 268 |\n", "| MaxTestEpRet | -329 |\n", "| MinTestEpRet | -1.3e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 5.06e+04 |\n", "| AverageQ1Vals | -171 |\n", "| StdQ1Vals | 243 |\n", "| MaxQ1Vals | 239 |\n", "| MinQ1Vals | -1.15e+03 |\n", "| AverageQ2Vals | -170 |\n", "| StdQ2Vals | 243 |\n", "| MaxQ2Vals | 246 |\n", "| MinQ2Vals | -1.13e+03 |\n", "| LossPi | 145 |\n", "| LossQ | 1.29e+03 |\n", "| Time | 555 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 24 |\n", "| AverageEpRet | -714 |\n", "| StdEpRet | 351 |\n", "| MaxEpRet | -181 |\n", "| MinEpRet | -1.29e+03 |\n", "| AverageTestEpRet | -433 |\n", "| StdTestEpRet | 184 |\n", "| MaxTestEpRet | -178 |\n", "| MinTestEpRet | -786 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 5.28e+04 |\n", "| AverageQ1Vals | -164 |\n", "| StdQ1Vals | 238 |\n", "| MaxQ1Vals | 227 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -164 |\n", "| StdQ2Vals | 238 |\n", "| MaxQ2Vals | 229 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 139 |\n", "| LossQ | 1.22e+03 |\n", "| Time | 579 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 25 |\n", "| AverageEpRet | -709 |\n", "| StdEpRet | 425 |\n", "| MaxEpRet | -88.8 |\n", "| MinEpRet | -1.59e+03 |\n", "| AverageTestEpRet | -808 |\n", "| StdTestEpRet | 476 |\n", "| MaxTestEpRet | -198 |\n", "| MinTestEpRet | -1.81e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 5.5e+04 |\n", "| AverageQ1Vals | -159 |\n", "| StdQ1Vals | 233 |\n", "| MaxQ1Vals | 209 |\n", "| MinQ1Vals | -1.14e+03 |\n", "| AverageQ2Vals | -159 |\n", "| 
StdQ2Vals | 233 |\n", "| MaxQ2Vals | 209 |\n", "| MinQ2Vals | -1.13e+03 |\n", "| LossPi | 136 |\n", "| LossQ | 1.15e+03 |\n", "| Time | 603 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 26 |\n", "| AverageEpRet | -813 |\n", "| StdEpRet | 433 |\n", "| MaxEpRet | -247 |\n", "| MinEpRet | -1.81e+03 |\n", "| AverageTestEpRet | -702 |\n", "| StdTestEpRet | 308 |\n", "| MaxTestEpRet | -197 |\n", "| MinTestEpRet | -1.43e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 5.72e+04 |\n", "| AverageQ1Vals | -158 |\n", "| StdQ1Vals | 231 |\n", "| MaxQ1Vals | 194 |\n", "| MinQ1Vals | -1.2e+03 |\n", "| AverageQ2Vals | -158 |\n", "| StdQ2Vals | 231 |\n", "| MaxQ2Vals | 198 |\n", "| MinQ2Vals | -1.17e+03 |\n", "| LossPi | 136 |\n", "| LossQ | 1.14e+03 |\n", "| Time | 628 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 27 |\n", "| AverageEpRet | -690 |\n", "| StdEpRet | 282 |\n", "| MaxEpRet | -336 |\n", "| MinEpRet | -1.07e+03 |\n", "| AverageTestEpRet | -934 |\n", "| StdTestEpRet | 626 |\n", "| MaxTestEpRet | -317 |\n", "| MinTestEpRet | -2.24e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 5.94e+04 |\n", "| AverageQ1Vals | -157 |\n", "| StdQ1Vals | 229 |\n", "| MaxQ1Vals | 190 |\n", "| MinQ1Vals | -1.15e+03 |\n", "| AverageQ2Vals | -157 |\n", "| StdQ2Vals | 229 |\n", "| MaxQ2Vals | 192 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 135 |\n", "| LossQ | 1.03e+03 |\n", "| Time | 653 |\n", "---------------------------------------\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "---------------------------------------\n", "| Epoch | 28 |\n", "| AverageEpRet | -965 |\n", "| StdEpRet | 522 |\n", "| MaxEpRet | -172 |\n", "| MinEpRet | -2.3e+03 |\n", "| AverageTestEpRet | -599 |\n", "| StdTestEpRet | 398 |\n", "| MaxTestEpRet | -163 |\n", "| MinTestEpRet | -1.32e+03 |\n", "| EpLen | 110 |\n", 
"| TestEpLen | 110 |\n", "| TotalEnvInteracts | 6.16e+04 |\n", "| AverageQ1Vals | -154 |\n", "| StdQ1Vals | 226 |\n", "| MaxQ1Vals | 176 |\n", "| MinQ1Vals | -1.12e+03 |\n", "| AverageQ2Vals | -154 |\n", "| StdQ2Vals | 226 |\n", "| MaxQ2Vals | 188 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 133 |\n", "| LossQ | 973 |\n", "| Time | 677 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 29 |\n", "| AverageEpRet | -766 |\n", "| StdEpRet | 367 |\n", "| MaxEpRet | -114 |\n", "| MinEpRet | -1.69e+03 |\n", "| AverageTestEpRet | -659 |\n", "| StdTestEpRet | 229 |\n", "| MaxTestEpRet | -303 |\n", "| MinTestEpRet | -1.1e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 6.38e+04 |\n", "| AverageQ1Vals | -153 |\n", "| StdQ1Vals | 225 |\n", "| MaxQ1Vals | 173 |\n", "| MinQ1Vals | -1.14e+03 |\n", "| AverageQ2Vals | -153 |\n", "| StdQ2Vals | 225 |\n", "| MaxQ2Vals | 176 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 133 |\n", "| LossQ | 961 |\n", "| Time | 702 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 30 |\n", "| AverageEpRet | -682 |\n", "| StdEpRet | 254 |\n", "| MaxEpRet | -388 |\n", "| MinEpRet | -1.46e+03 |\n", "| AverageTestEpRet | -686 |\n", "| StdTestEpRet | 188 |\n", "| MaxTestEpRet | -312 |\n", "| MinTestEpRet | -977 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 6.6e+04 |\n", "| AverageQ1Vals | -151 |\n", "| StdQ1Vals | 222 |\n", "| MaxQ1Vals | 162 |\n", "| MinQ1Vals | -1.2e+03 |\n", "| AverageQ2Vals | -151 |\n", "| StdQ2Vals | 222 |\n", "| MaxQ2Vals | 159 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 131 |\n", "| LossQ | 913 |\n", "| Time | 727 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 31 |\n", "| AverageEpRet | -676 |\n", "| StdEpRet | 442 |\n", "| MaxEpRet | -163 |\n", "| MinEpRet | -1.84e+03 |\n", "| AverageTestEpRet 
| -678 |\n", "| StdTestEpRet | 371 |\n", "| MaxTestEpRet | -156 |\n", "| MinTestEpRet | -1.41e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 6.82e+04 |\n", "| AverageQ1Vals | -149 |\n", "| StdQ1Vals | 219 |\n", "| MaxQ1Vals | 149 |\n", "| MinQ1Vals | -1.14e+03 |\n", "| AverageQ2Vals | -149 |\n", "| StdQ2Vals | 219 |\n", "| MaxQ2Vals | 153 |\n", "| MinQ2Vals | -1.09e+03 |\n", "| LossPi | 130 |\n", "| LossQ | 855 |\n", "| Time | 753 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 32 |\n", "| AverageEpRet | -760 |\n", "| StdEpRet | 313 |\n", "| MaxEpRet | -216 |\n", "| MinEpRet | -1.49e+03 |\n", "| AverageTestEpRet | -759 |\n", "| StdTestEpRet | 430 |\n", "| MaxTestEpRet | -256 |\n", "| MinTestEpRet | -1.64e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 7.04e+04 |\n", "| AverageQ1Vals | -150 |\n", "| StdQ1Vals | 217 |\n", "| MaxQ1Vals | 146 |\n", "| MinQ1Vals | -1.1e+03 |\n", "| AverageQ2Vals | -150 |\n", "| StdQ2Vals | 217 |\n", "| MaxQ2Vals | 145 |\n", "| MinQ2Vals | -1.11e+03 |\n", "| LossPi | 130 |\n", "| LossQ | 835 |\n", "| Time | 775 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 33 |\n", "| AverageEpRet | -527 |\n", "| StdEpRet | 395 |\n", "| MaxEpRet | -57.1 |\n", "| MinEpRet | -1.4e+03 |\n", "| AverageTestEpRet | -583 |\n", "| StdTestEpRet | 368 |\n", "| MaxTestEpRet | -120 |\n", "| MinTestEpRet | -1.52e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 7.26e+04 |\n", "| AverageQ1Vals | -147 |\n", "| StdQ1Vals | 213 |\n", "| MaxQ1Vals | 130 |\n", "| MinQ1Vals | -1.11e+03 |\n", "| AverageQ2Vals | -147 |\n", "| StdQ2Vals | 213 |\n", "| MaxQ2Vals | 125 |\n", "| MinQ2Vals | -1.11e+03 |\n", "| LossPi | 129 |\n", "| LossQ | 800 |\n", "| Time | 796 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 34 
|\n", "| AverageEpRet | -732 |\n", "| StdEpRet | 361 |\n", "| MaxEpRet | -114 |\n", "| MinEpRet | -1.6e+03 |\n", "| AverageTestEpRet | -737 |\n", "| StdTestEpRet | 290 |\n", "| MaxTestEpRet | -278 |\n", "| MinTestEpRet | -1.25e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 7.48e+04 |\n", "| AverageQ1Vals | -144 |\n", "| StdQ1Vals | 211 |\n", "| MaxQ1Vals | 133 |\n", "| MinQ1Vals | -1.09e+03 |\n", "| AverageQ2Vals | -144 |\n", "| StdQ2Vals | 211 |\n", "| MaxQ2Vals | 121 |\n", "| MinQ2Vals | -1.1e+03 |\n", "| LossPi | 126 |\n", "| LossQ | 784 |\n", "| Time | 820 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 35 |\n", "| AverageEpRet | -682 |\n", "| StdEpRet | 348 |\n", "| MaxEpRet | -159 |\n", "| MinEpRet | -1.58e+03 |\n", "| AverageTestEpRet | -766 |\n", "| StdTestEpRet | 358 |\n", "| MaxTestEpRet | -85.9 |\n", "| MinTestEpRet | -1.35e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 7.7e+04 |\n", "| AverageQ1Vals | -143 |\n", "| StdQ1Vals | 209 |\n", "| MaxQ1Vals | 123 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -143 |\n", "| StdQ2Vals | 209 |\n", "| MaxQ2Vals | 107 |\n", "| MinQ2Vals | -1.17e+03 |\n", "| LossPi | 125 |\n", "| LossQ | 730 |\n", "| Time | 846 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 36 |\n", "| AverageEpRet | -848 |\n", "| StdEpRet | 733 |\n", "| MaxEpRet | -216 |\n", "| MinEpRet | -3.32e+03 |\n", "| AverageTestEpRet | -765 |\n", "| StdTestEpRet | 340 |\n", "| MaxTestEpRet | -191 |\n", "| MinTestEpRet | -1.48e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 7.92e+04 |\n", "| AverageQ1Vals | -141 |\n", "| StdQ1Vals | 207 |\n", "| MaxQ1Vals | 115 |\n", "| MinQ1Vals | -1.1e+03 |\n", "| AverageQ2Vals | -141 |\n", "| StdQ2Vals | 207 |\n", "| MaxQ2Vals | 108 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 125 |\n", "| LossQ | 703 
|\n", "| Time | 873 |\n", "---------------------------------------\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "---------------------------------------\n", "| Epoch | 37 |\n", "| AverageEpRet | -625 |\n", "| StdEpRet | 379 |\n", "| MaxEpRet | -11.3 |\n", "| MinEpRet | -1.43e+03 |\n", "| AverageTestEpRet | -646 |\n", "| StdTestEpRet | 399 |\n", "| MaxTestEpRet | -102 |\n", "| MinTestEpRet | -1.15e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 8.14e+04 |\n", "| AverageQ1Vals | -140 |\n", "| StdQ1Vals | 204 |\n", "| MaxQ1Vals | 103 |\n", "| MinQ1Vals | -1.15e+03 |\n", "| AverageQ2Vals | -140 |\n", "| StdQ2Vals | 204 |\n", "| MaxQ2Vals | 96.8 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 124 |\n", "| LossQ | 667 |\n", "| Time | 900 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 38 |\n", "| AverageEpRet | -634 |\n", "| StdEpRet | 304 |\n", "| MaxEpRet | -44.1 |\n", "| MinEpRet | -1.19e+03 |\n", "| AverageTestEpRet | -716 |\n", "| StdTestEpRet | 356 |\n", "| MaxTestEpRet | -263 |\n", "| MinTestEpRet | -1.49e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 8.36e+04 |\n", "| AverageQ1Vals | -140 |\n", "| StdQ1Vals | 203 |\n", "| MaxQ1Vals | 91.8 |\n", "| MinQ1Vals | -1.14e+03 |\n", "| AverageQ2Vals | -140 |\n", "| StdQ2Vals | 203 |\n", "| MaxQ2Vals | 86 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 124 |\n", "| LossQ | 664 |\n", "| Time | 929 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 39 |\n", "| AverageEpRet | -630 |\n", "| StdEpRet | 375 |\n", "| MaxEpRet | -127 |\n", "| MinEpRet | -1.59e+03 |\n", "| AverageTestEpRet | -591 |\n", "| StdTestEpRet | 239 |\n", "| MaxTestEpRet | -204 |\n", "| MinTestEpRet | -946 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 8.58e+04 |\n", "| AverageQ1Vals | -139 |\n", "| StdQ1Vals | 201 |\n", "| MaxQ1Vals 
| 86.8 |\n", "| MinQ1Vals | -1.14e+03 |\n", "| AverageQ2Vals | -139 |\n", "| StdQ2Vals | 201 |\n", "| MaxQ2Vals | 77.3 |\n", "| MinQ2Vals | -1.11e+03 |\n", "| LossPi | 124 |\n", "| LossQ | 649 |\n", "| Time | 960 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 40 |\n", "| AverageEpRet | -506 |\n", "| StdEpRet | 280 |\n", "| MaxEpRet | -67.2 |\n", "| MinEpRet | -1.18e+03 |\n", "| AverageTestEpRet | -621 |\n", "| StdTestEpRet | 351 |\n", "| MaxTestEpRet | -171 |\n", "| MinTestEpRet | -1.07e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 8.8e+04 |\n", "| AverageQ1Vals | -137 |\n", "| StdQ1Vals | 199 |\n", "| MaxQ1Vals | 77.5 |\n", "| MinQ1Vals | -1.21e+03 |\n", "| AverageQ2Vals | -137 |\n", "| StdQ2Vals | 199 |\n", "| MaxQ2Vals | 66.2 |\n", "| MinQ2Vals | -1.21e+03 |\n", "| LossPi | 122 |\n", "| LossQ | 629 |\n", "| Time | 991 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 41 |\n", "| AverageEpRet | -676 |\n", "| StdEpRet | 301 |\n", "| MaxEpRet | -182 |\n", "| MinEpRet | -1.31e+03 |\n", "| AverageTestEpRet | -784 |\n", "| StdTestEpRet | 309 |\n", "| MaxTestEpRet | -408 |\n", "| MinTestEpRet | -1.4e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 9.02e+04 |\n", "| AverageQ1Vals | -136 |\n", "| StdQ1Vals | 197 |\n", "| MaxQ1Vals | 74.4 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -136 |\n", "| StdQ2Vals | 197 |\n", "| MaxQ2Vals | 74.3 |\n", "| MinQ2Vals | -1.12e+03 |\n", "| LossPi | 121 |\n", "| LossQ | 587 |\n", "| Time | 1.02e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 42 |\n", "| AverageEpRet | -623 |\n", "| StdEpRet | 295 |\n", "| MaxEpRet | -69.3 |\n", "| MinEpRet | -1.19e+03 |\n", "| AverageTestEpRet | -806 |\n", "| StdTestEpRet | 386 |\n", "| MaxTestEpRet | -285 |\n", "| MinTestEpRet | -1.63e+03 |\n", "| 
EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 9.24e+04 |\n", "| AverageQ1Vals | -134 |\n", "| StdQ1Vals | 196 |\n", "| MaxQ1Vals | 59.5 |\n", "| MinQ1Vals | -1.13e+03 |\n", "| AverageQ2Vals | -134 |\n", "| StdQ2Vals | 196 |\n", "| MaxQ2Vals | 67.8 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 120 |\n", "| LossQ | 584 |\n", "| Time | 1.05e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 43 |\n", "| AverageEpRet | -565 |\n", "| StdEpRet | 255 |\n", "| MaxEpRet | -79.6 |\n", "| MinEpRet | -1.08e+03 |\n", "| AverageTestEpRet | -620 |\n", "| StdTestEpRet | 300 |\n", "| MaxTestEpRet | -160 |\n", "| MinTestEpRet | -971 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 9.46e+04 |\n", "| AverageQ1Vals | -133 |\n", "| StdQ1Vals | 194 |\n", "| MaxQ1Vals | 63.5 |\n", "| MinQ1Vals | -1.17e+03 |\n", "| AverageQ2Vals | -133 |\n", "| StdQ2Vals | 194 |\n", "| MaxQ2Vals | 68.2 |\n", "| MinQ2Vals | -1.12e+03 |\n", "| LossPi | 118 |\n", "| LossQ | 561 |\n", "| Time | 1.08e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 44 |\n", "| AverageEpRet | -583 |\n", "| StdEpRet | 247 |\n", "| MaxEpRet | -63.3 |\n", "| MinEpRet | -1.08e+03 |\n", "| AverageTestEpRet | -507 |\n", "| StdTestEpRet | 296 |\n", "| MaxTestEpRet | -107 |\n", "| MinTestEpRet | -996 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 9.68e+04 |\n", "| AverageQ1Vals | -132 |\n", "| StdQ1Vals | 191 |\n", "| MaxQ1Vals | 49.2 |\n", "| MinQ1Vals | -1.18e+03 |\n", "| AverageQ2Vals | -132 |\n", "| StdQ2Vals | 191 |\n", "| MaxQ2Vals | 49.2 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 118 |\n", "| LossQ | 532 |\n", "| Time | 1.11e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 45 |\n", "| AverageEpRet | -608 |\n", "| StdEpRet | 309 |\n", "| MaxEpRet | -147 |\n", "| 
MinEpRet | -1.23e+03 |\n", "| AverageTestEpRet | -727 |\n", "| StdTestEpRet | 348 |\n", "| MaxTestEpRet | -203 |\n", "| MinTestEpRet | -1.43e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 9.9e+04 |\n", "| AverageQ1Vals | -129 |\n", "| StdQ1Vals | 187 |\n", "| MaxQ1Vals | 50.6 |\n", "| MinQ1Vals | -1.14e+03 |\n", "| AverageQ2Vals | -129 |\n", "| StdQ2Vals | 187 |\n", "| MaxQ2Vals | 47.9 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 116 |\n", "| LossQ | 517 |\n", "| Time | 1.14e+03 |\n", "---------------------------------------\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "---------------------------------------\n", "| Epoch | 46 |\n", "| AverageEpRet | -649 |\n", "| StdEpRet | 325 |\n", "| MaxEpRet | -151 |\n", "| MinEpRet | -1.5e+03 |\n", "| AverageTestEpRet | -647 |\n", "| StdTestEpRet | 317 |\n", "| MaxTestEpRet | -219 |\n", "| MinTestEpRet | -1.25e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.01e+05 |\n", "| AverageQ1Vals | -129 |\n", "| StdQ1Vals | 187 |\n", "| MaxQ1Vals | 49.8 |\n", "| MinQ1Vals | -1.1e+03 |\n", "| AverageQ2Vals | -129 |\n", "| StdQ2Vals | 187 |\n", "| MaxQ2Vals | 90.9 |\n", "| MinQ2Vals | -1.11e+03 |\n", "| LossPi | 115 |\n", "| LossQ | 514 |\n", "| Time | 1.18e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 47 |\n", "| AverageEpRet | -444 |\n", "| StdEpRet | 183 |\n", "| MaxEpRet | -183 |\n", "| MinEpRet | -968 |\n", "| AverageTestEpRet | -669 |\n", "| StdTestEpRet | 245 |\n", "| MaxTestEpRet | -261 |\n", "| MinTestEpRet | -1.12e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.03e+05 |\n", "| AverageQ1Vals | -127 |\n", "| StdQ1Vals | 185 |\n", "| MaxQ1Vals | 58.8 |\n", "| MinQ1Vals | -1.15e+03 |\n", "| AverageQ2Vals | -127 |\n", "| StdQ2Vals | 185 |\n", "| MaxQ2Vals | 55.1 |\n", "| MinQ2Vals | -1.15e+03 |\n", "| LossPi | 113 |\n", "| LossQ | 489 |\n", "| Time | 
1.21e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 48 |\n", "| AverageEpRet | -673 |\n", "| StdEpRet | 332 |\n", "| MaxEpRet | -125 |\n", "| MinEpRet | -1.41e+03 |\n", "| AverageTestEpRet | -534 |\n", "| StdTestEpRet | 252 |\n", "| MaxTestEpRet | -167 |\n", "| MinTestEpRet | -1.04e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.06e+05 |\n", "| AverageQ1Vals | -125 |\n", "| StdQ1Vals | 182 |\n", "| MaxQ1Vals | 96.2 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -125 |\n", "| StdQ2Vals | 182 |\n", "| MaxQ2Vals | 93.5 |\n", "| MinQ2Vals | -1.18e+03 |\n", "| LossPi | 112 |\n", "| LossQ | 473 |\n", "| Time | 1.24e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 49 |\n", "| AverageEpRet | -475 |\n", "| StdEpRet | 243 |\n", "| MaxEpRet | -125 |\n", "| MinEpRet | -1.11e+03 |\n", "| AverageTestEpRet | -572 |\n", "| StdTestEpRet | 339 |\n", "| MaxTestEpRet | -155 |\n", "| MinTestEpRet | -1.25e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.08e+05 |\n", "| AverageQ1Vals | -124 |\n", "| StdQ1Vals | 181 |\n", "| MaxQ1Vals | 66.2 |\n", "| MinQ1Vals | -1.14e+03 |\n", "| AverageQ2Vals | -124 |\n", "| StdQ2Vals | 181 |\n", "| MaxQ2Vals | 60.6 |\n", "| MinQ2Vals | -1.11e+03 |\n", "| LossPi | 112 |\n", "| LossQ | 466 |\n", "| Time | 1.27e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 50 |\n", "| AverageEpRet | -581 |\n", "| StdEpRet | 358 |\n", "| MaxEpRet | -121 |\n", "| MinEpRet | -1.34e+03 |\n", "| AverageTestEpRet | -687 |\n", "| StdTestEpRet | 246 |\n", "| MaxTestEpRet | -246 |\n", "| MinTestEpRet | -1.07e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.1e+05 |\n", "| AverageQ1Vals | -122 |\n", "| StdQ1Vals | 179 |\n", "| MaxQ1Vals | 40.6 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| 
AverageQ2Vals | -122 |\n", "| StdQ2Vals | 179 |\n", "| MaxQ2Vals | 50.9 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 109 |\n", "| LossQ | 439 |\n", "| Time | 1.31e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 51 |\n", "| AverageEpRet | -599 |\n", "| StdEpRet | 287 |\n", "| MaxEpRet | -232 |\n", "| MinEpRet | -1.44e+03 |\n", "| AverageTestEpRet | -561 |\n", "| StdTestEpRet | 204 |\n", "| MaxTestEpRet | -216 |\n", "| MinTestEpRet | -856 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.12e+05 |\n", "| AverageQ1Vals | -122 |\n", "| StdQ1Vals | 179 |\n", "| MaxQ1Vals | 78.3 |\n", "| MinQ1Vals | -1.12e+03 |\n", "| AverageQ2Vals | -122 |\n", "| StdQ2Vals | 179 |\n", "| MaxQ2Vals | 76.5 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 110 |\n", "| LossQ | 437 |\n", "| Time | 1.34e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 52 |\n", "| AverageEpRet | -636 |\n", "| StdEpRet | 283 |\n", "| MaxEpRet | -220 |\n", "| MinEpRet | -1.12e+03 |\n", "| AverageTestEpRet | -712 |\n", "| StdTestEpRet | 185 |\n", "| MaxTestEpRet | -457 |\n", "| MinTestEpRet | -1.09e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.14e+05 |\n", "| AverageQ1Vals | -121 |\n", "| StdQ1Vals | 178 |\n", "| MaxQ1Vals | 58.8 |\n", "| MinQ1Vals | -1.17e+03 |\n", "| AverageQ2Vals | -121 |\n", "| StdQ2Vals | 178 |\n", "| MaxQ2Vals | 54.7 |\n", "| MinQ2Vals | -1.17e+03 |\n", "| LossPi | 109 |\n", "| LossQ | 431 |\n", "| Time | 1.37e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 53 |\n", "| AverageEpRet | -591 |\n", "| StdEpRet | 351 |\n", "| MaxEpRet | -132 |\n", "| MinEpRet | -1.43e+03 |\n", "| AverageTestEpRet | -551 |\n", "| StdTestEpRet | 206 |\n", "| MaxTestEpRet | -333 |\n", "| MinTestEpRet | -975 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| 
TotalEnvInteracts | 1.17e+05 |\n", "| AverageQ1Vals | -119 |\n", "| StdQ1Vals | 176 |\n", "| MaxQ1Vals | 54.4 |\n", "| MinQ1Vals | -1.14e+03 |\n", "| AverageQ2Vals | -119 |\n", "| StdQ2Vals | 176 |\n", "| MaxQ2Vals | 89.1 |\n", "| MinQ2Vals | -1.18e+03 |\n", "| LossPi | 108 |\n", "| LossQ | 418 |\n", "| Time | 1.4e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 54 |\n", "| AverageEpRet | -426 |\n", "| StdEpRet | 230 |\n", "| MaxEpRet | -90.2 |\n", "| MinEpRet | -906 |\n", "| AverageTestEpRet | -447 |\n", "| StdTestEpRet | 197 |\n", "| MaxTestEpRet | -124 |\n", "| MinTestEpRet | -708 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.19e+05 |\n", "| AverageQ1Vals | -118 |\n", "| StdQ1Vals | 175 |\n", "| MaxQ1Vals | 47.2 |\n", "| MinQ1Vals | -1.14e+03 |\n", "| AverageQ2Vals | -118 |\n", "| StdQ2Vals | 175 |\n", "| MaxQ2Vals | 80 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 106 |\n", "| LossQ | 401 |\n", "| Time | 1.43e+03 |\n", "---------------------------------------\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "---------------------------------------\n", "| Epoch | 55 |\n", "| AverageEpRet | -503 |\n", "| StdEpRet | 235 |\n", "| MaxEpRet | -110 |\n", "| MinEpRet | -939 |\n", "| AverageTestEpRet | -615 |\n", "| StdTestEpRet | 194 |\n", "| MaxTestEpRet | -400 |\n", "| MinTestEpRet | -952 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.21e+05 |\n", "| AverageQ1Vals | -118 |\n", "| StdQ1Vals | 174 |\n", "| MaxQ1Vals | 54.2 |\n", "| MinQ1Vals | -1.19e+03 |\n", "| AverageQ2Vals | -118 |\n", "| StdQ2Vals | 174 |\n", "| MaxQ2Vals | 68.6 |\n", "| MinQ2Vals | -1.15e+03 |\n", "| LossPi | 106 |\n", "| LossQ | 392 |\n", "| Time | 1.47e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 56 |\n", "| AverageEpRet | -552 |\n", "| StdEpRet | 234 |\n", "| MaxEpRet | -228 |\n", "| MinEpRet 
| -969 |\n", "| AverageTestEpRet | -400 |\n", "| StdTestEpRet | 293 |\n", "| MaxTestEpRet | -66.3 |\n", "| MinTestEpRet | -1.1e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.23e+05 |\n", "| AverageQ1Vals | -117 |\n", "| StdQ1Vals | 173 |\n", "| MaxQ1Vals | 66.1 |\n", "| MinQ1Vals | -1.14e+03 |\n", "| AverageQ2Vals | -117 |\n", "| StdQ2Vals | 173 |\n", "| MaxQ2Vals | 69.5 |\n", "| MinQ2Vals | -1.13e+03 |\n", "| LossPi | 105 |\n", "| LossQ | 400 |\n", "| Time | 1.5e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 57 |\n", "| AverageEpRet | -476 |\n", "| StdEpRet | 318 |\n", "| MaxEpRet | -33.7 |\n", "| MinEpRet | -1.13e+03 |\n", "| AverageTestEpRet | -480 |\n", "| StdTestEpRet | 210 |\n", "| MaxTestEpRet | -197 |\n", "| MinTestEpRet | -802 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.25e+05 |\n", "| AverageQ1Vals | -114 |\n", "| StdQ1Vals | 171 |\n", "| MaxQ1Vals | 68.5 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -114 |\n", "| StdQ2Vals | 171 |\n", "| MaxQ2Vals | 68.8 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 103 |\n", "| LossQ | 380 |\n", "| Time | 1.53e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 58 |\n", "| AverageEpRet | -590 |\n", "| StdEpRet | 261 |\n", "| MaxEpRet | -113 |\n", "| MinEpRet | -1.32e+03 |\n", "| AverageTestEpRet | -519 |\n", "| StdTestEpRet | 234 |\n", "| MaxTestEpRet | -206 |\n", "| MinTestEpRet | -935 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.28e+05 |\n", "| AverageQ1Vals | -113 |\n", "| StdQ1Vals | 170 |\n", "| MaxQ1Vals | 72.9 |\n", "| MinQ1Vals | -1.12e+03 |\n", "| AverageQ2Vals | -113 |\n", "| StdQ2Vals | 170 |\n", "| MaxQ2Vals | 51.6 |\n", "| MinQ2Vals | -1.09e+03 |\n", "| LossPi | 102 |\n", "| LossQ | 368 |\n", "| Time | 1.56e+03 |\n", "---------------------------------------\n", 
"---------------------------------------\n", "| Epoch | 59 |\n", "| AverageEpRet | -588 |\n", "| StdEpRet | 220 |\n", "| MaxEpRet | -170 |\n", "| MinEpRet | -1.05e+03 |\n", "| AverageTestEpRet | -467 |\n", "| StdTestEpRet | 182 |\n", "| MaxTestEpRet | -212 |\n", "| MinTestEpRet | -763 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.3e+05 |\n", "| AverageQ1Vals | -112 |\n", "| StdQ1Vals | 169 |\n", "| MaxQ1Vals | 64.5 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -112 |\n", "| StdQ2Vals | 169 |\n", "| MaxQ2Vals | 93.3 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 102 |\n", "| LossQ | 367 |\n", "| Time | 1.6e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 60 |\n", "| AverageEpRet | -495 |\n", "| StdEpRet | 358 |\n", "| MaxEpRet | -44.8 |\n", "| MinEpRet | -1.71e+03 |\n", "| AverageTestEpRet | -654 |\n", "| StdTestEpRet | 261 |\n", "| MaxTestEpRet | -227 |\n", "| MinTestEpRet | -1.05e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.32e+05 |\n", "| AverageQ1Vals | -112 |\n", "| StdQ1Vals | 168 |\n", "| MaxQ1Vals | 68.9 |\n", "| MinQ1Vals | -1.18e+03 |\n", "| AverageQ2Vals | -112 |\n", "| StdQ2Vals | 168 |\n", "| MaxQ2Vals | 73.7 |\n", "| MinQ2Vals | -1.15e+03 |\n", "| LossPi | 101 |\n", "| LossQ | 363 |\n", "| Time | 1.63e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 61 |\n", "| AverageEpRet | -690 |\n", "| StdEpRet | 376 |\n", "| MaxEpRet | -74.9 |\n", "| MinEpRet | -1.45e+03 |\n", "| AverageTestEpRet | -574 |\n", "| StdTestEpRet | 410 |\n", "| MaxTestEpRet | -144 |\n", "| MinTestEpRet | -1.57e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.34e+05 |\n", "| AverageQ1Vals | -110 |\n", "| StdQ1Vals | 166 |\n", "| MaxQ1Vals | 49.8 |\n", "| MinQ1Vals | -1.18e+03 |\n", "| AverageQ2Vals | -110 |\n", "| StdQ2Vals | 166 |\n", "| MaxQ2Vals | 52.8 
|\n", "| MinQ2Vals | -1.17e+03 |\n", "| LossPi | 100 |\n", "| LossQ | 349 |\n", "| Time | 1.66e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 62 |\n", "| AverageEpRet | -487 |\n", "| StdEpRet | 280 |\n", "| MaxEpRet | -116 |\n", "| MinEpRet | -1.24e+03 |\n", "| AverageTestEpRet | -485 |\n", "| StdTestEpRet | 247 |\n", "| MaxTestEpRet | -146 |\n", "| MinTestEpRet | -886 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.36e+05 |\n", "| AverageQ1Vals | -109 |\n", "| StdQ1Vals | 165 |\n", "| MaxQ1Vals | 67.9 |\n", "| MinQ1Vals | -1.17e+03 |\n", "| AverageQ2Vals | -109 |\n", "| StdQ2Vals | 165 |\n", "| MaxQ2Vals | 44.4 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 98.7 |\n", "| LossQ | 358 |\n", "| Time | 1.7e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 63 |\n", "| AverageEpRet | -448 |\n", "| StdEpRet | 251 |\n", "| MaxEpRet | -56.4 |\n", "| MinEpRet | -1.16e+03 |\n", "| AverageTestEpRet | -341 |\n", "| StdTestEpRet | 181 |\n", "| MaxTestEpRet | -63.6 |\n", "| MinTestEpRet | -608 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.39e+05 |\n", "| AverageQ1Vals | -108 |\n", "| StdQ1Vals | 165 |\n", "| MaxQ1Vals | 55.3 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -108 |\n", "| StdQ2Vals | 165 |\n", "| MaxQ2Vals | 52.7 |\n", "| MinQ2Vals | -1.13e+03 |\n", "| LossPi | 97.8 |\n", "| LossQ | 344 |\n", "| Time | 1.73e+03 |\n", "---------------------------------------\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "---------------------------------------\n", "| Epoch | 64 |\n", "| AverageEpRet | -525 |\n", "| StdEpRet | 226 |\n", "| MaxEpRet | -189 |\n", "| MinEpRet | -1.16e+03 |\n", "| AverageTestEpRet | -532 |\n", "| StdTestEpRet | 182 |\n", "| MaxTestEpRet | -302 |\n", "| MinTestEpRet | -824 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 
1.41e+05 |\n", "| AverageQ1Vals | -106 |\n", "| StdQ1Vals | 164 |\n", "| MaxQ1Vals | 50.1 |\n", "| MinQ1Vals | -1.13e+03 |\n", "| AverageQ2Vals | -106 |\n", "| StdQ2Vals | 164 |\n", "| MaxQ2Vals | 37.7 |\n", "| MinQ2Vals | -1.13e+03 |\n", "| LossPi | 95.7 |\n", "| LossQ | 340 |\n", "| Time | 1.76e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 65 |\n", "| AverageEpRet | -470 |\n", "| StdEpRet | 277 |\n", "| MaxEpRet | -31.2 |\n", "| MinEpRet | -1.01e+03 |\n", "| AverageTestEpRet | -520 |\n", "| StdTestEpRet | 359 |\n", "| MaxTestEpRet | -127 |\n", "| MinTestEpRet | -1.51e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.43e+05 |\n", "| AverageQ1Vals | -105 |\n", "| StdQ1Vals | 162 |\n", "| MaxQ1Vals | 58.3 |\n", "| MinQ1Vals | -1.22e+03 |\n", "| AverageQ2Vals | -105 |\n", "| StdQ2Vals | 162 |\n", "| MaxQ2Vals | 51.6 |\n", "| MinQ2Vals | -1.2e+03 |\n", "| LossPi | 95.2 |\n", "| LossQ | 329 |\n", "| Time | 1.79e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 66 |\n", "| AverageEpRet | -622 |\n", "| StdEpRet | 284 |\n", "| MaxEpRet | -126 |\n", "| MinEpRet | -1.33e+03 |\n", "| AverageTestEpRet | -525 |\n", "| StdTestEpRet | 239 |\n", "| MaxTestEpRet | -224 |\n", "| MinTestEpRet | -1.01e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.45e+05 |\n", "| AverageQ1Vals | -104 |\n", "| StdQ1Vals | 163 |\n", "| MaxQ1Vals | 46.5 |\n", "| MinQ1Vals | -1.17e+03 |\n", "| AverageQ2Vals | -104 |\n", "| StdQ2Vals | 163 |\n", "| MaxQ2Vals | 73.2 |\n", "| MinQ2Vals | -1.19e+03 |\n", "| LossPi | 94.4 |\n", "| LossQ | 329 |\n", "| Time | 1.83e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 67 |\n", "| AverageEpRet | -483 |\n", "| StdEpRet | 204 |\n", "| MaxEpRet | -118 |\n", "| MinEpRet | -836 |\n", "| AverageTestEpRet | -530 |\n", "| 
StdTestEpRet | 231 |\n", "| MaxTestEpRet | -156 |\n", "| MinTestEpRet | -994 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.47e+05 |\n", "| AverageQ1Vals | -103 |\n", "| StdQ1Vals | 161 |\n", "| MaxQ1Vals | 56 |\n", "| MinQ1Vals | -1.22e+03 |\n", "| AverageQ2Vals | -103 |\n", "| StdQ2Vals | 161 |\n", "| MaxQ2Vals | 80 |\n", "| MinQ2Vals | -1.24e+03 |\n", "| LossPi | 93.2 |\n", "| LossQ | 325 |\n", "| Time | 1.86e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 68 |\n", "| AverageEpRet | -443 |\n", "| StdEpRet | 266 |\n", "| MaxEpRet | -17.7 |\n", "| MinEpRet | -926 |\n", "| AverageTestEpRet | -498 |\n", "| StdTestEpRet | 213 |\n", "| MaxTestEpRet | -224 |\n", "| MinTestEpRet | -779 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.5e+05 |\n", "| AverageQ1Vals | -101 |\n", "| StdQ1Vals | 160 |\n", "| MaxQ1Vals | 71.7 |\n", "| MinQ1Vals | -1.13e+03 |\n", "| AverageQ2Vals | -101 |\n", "| StdQ2Vals | 160 |\n", "| MaxQ2Vals | 76.3 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 91.3 |\n", "| LossQ | 311 |\n", "| Time | 1.89e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 69 |\n", "| AverageEpRet | -542 |\n", "| StdEpRet | 422 |\n", "| MaxEpRet | -74.6 |\n", "| MinEpRet | -1.84e+03 |\n", "| AverageTestEpRet | -466 |\n", "| StdTestEpRet | 205 |\n", "| MaxTestEpRet | -134 |\n", "| MinTestEpRet | -905 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.52e+05 |\n", "| AverageQ1Vals | -101 |\n", "| StdQ1Vals | 160 |\n", "| MaxQ1Vals | 57.9 |\n", "| MinQ1Vals | -1.19e+03 |\n", "| AverageQ2Vals | -101 |\n", "| StdQ2Vals | 160 |\n", "| MaxQ2Vals | 106 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 91.1 |\n", "| LossQ | 315 |\n", "| Time | 1.92e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 70 |\n", "| 
AverageEpRet | -556 |\n", "| StdEpRet | 188 |\n", "| MaxEpRet | -166 |\n", "| MinEpRet | -827 |\n", "| AverageTestEpRet | -466 |\n", "| StdTestEpRet | 163 |\n", "| MaxTestEpRet | -247 |\n", "| MinTestEpRet | -782 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.54e+05 |\n", "| AverageQ1Vals | -98.9 |\n", "| StdQ1Vals | 158 |\n", "| MaxQ1Vals | 55.3 |\n", "| MinQ1Vals | -1.2e+03 |\n", "| AverageQ2Vals | -98.9 |\n", "| StdQ2Vals | 158 |\n", "| MaxQ2Vals | 104 |\n", "| MinQ2Vals | -1.19e+03 |\n", "| LossPi | 89.6 |\n", "| LossQ | 298 |\n", "| Time | 1.96e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 71 |\n", "| AverageEpRet | -508 |\n", "| StdEpRet | 360 |\n", "| MaxEpRet | -116 |\n", "| MinEpRet | -1.65e+03 |\n", "| AverageTestEpRet | -503 |\n", "| StdTestEpRet | 290 |\n", "| MaxTestEpRet | -98.4 |\n", "| MinTestEpRet | -933 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.56e+05 |\n", "| AverageQ1Vals | -98.9 |\n", "| StdQ1Vals | 158 |\n", "| MaxQ1Vals | 68.3 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -98.9 |\n", "| StdQ2Vals | 158 |\n", "| MaxQ2Vals | 62.4 |\n", "| MinQ2Vals | -1.17e+03 |\n", "| LossPi | 89.9 |\n", "| LossQ | 310 |\n", "| Time | 1.98e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 72 |\n", "| AverageEpRet | -565 |\n", "| StdEpRet | 254 |\n", "| MaxEpRet | -154 |\n", "| MinEpRet | -1.08e+03 |\n", "| AverageTestEpRet | -595 |\n", "| StdTestEpRet | 299 |\n", "| MaxTestEpRet | -224 |\n", "| MinTestEpRet | -1.16e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.58e+05 |\n", "| AverageQ1Vals | -98.4 |\n", "| StdQ1Vals | 157 |\n", "| MaxQ1Vals | 40.1 |\n", "| MinQ1Vals | -1.14e+03 |\n", "| AverageQ2Vals | -98.4 |\n", "| StdQ2Vals | 157 |\n", "| MaxQ2Vals | 65.8 |\n", "| MinQ2Vals | -1.17e+03 |\n", "| LossPi | 89.2 |\n", "| LossQ | 
307 |\n", "| Time | 2.01e+03 |\n", "---------------------------------------\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "---------------------------------------\n", "| Epoch | 73 |\n", "| AverageEpRet | -531 |\n", "| StdEpRet | 253 |\n", "| MaxEpRet | -152 |\n", "| MinEpRet | -1.18e+03 |\n", "| AverageTestEpRet | -403 |\n", "| StdTestEpRet | 239 |\n", "| MaxTestEpRet | -66.2 |\n", "| MinTestEpRet | -865 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.61e+05 |\n", "| AverageQ1Vals | -98 |\n", "| StdQ1Vals | 156 |\n", "| MaxQ1Vals | 123 |\n", "| MinQ1Vals | -1.18e+03 |\n", "| AverageQ2Vals | -98 |\n", "| StdQ2Vals | 156 |\n", "| MaxQ2Vals | 61.2 |\n", "| MinQ2Vals | -1.17e+03 |\n", "| LossPi | 89.2 |\n", "| LossQ | 290 |\n", "| Time | 2.05e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 74 |\n", "| AverageEpRet | -608 |\n", "| StdEpRet | 225 |\n", "| MaxEpRet | -242 |\n", "| MinEpRet | -1.07e+03 |\n", "| AverageTestEpRet | -421 |\n", "| StdTestEpRet | 224 |\n", "| MaxTestEpRet | -127 |\n", "| MinTestEpRet | -972 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.63e+05 |\n", "| AverageQ1Vals | -96.8 |\n", "| StdQ1Vals | 154 |\n", "| MaxQ1Vals | 84.5 |\n", "| MinQ1Vals | -1.11e+03 |\n", "| AverageQ2Vals | -96.8 |\n", "| StdQ2Vals | 154 |\n", "| MaxQ2Vals | 44 |\n", "| MinQ2Vals | -1.13e+03 |\n", "| LossPi | 87.6 |\n", "| LossQ | 280 |\n", "| Time | 2.08e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 75 |\n", "| AverageEpRet | -438 |\n", "| StdEpRet | 207 |\n", "| MaxEpRet | -103 |\n", "| MinEpRet | -930 |\n", "| AverageTestEpRet | -416 |\n", "| StdTestEpRet | 241 |\n", "| MaxTestEpRet | -135 |\n", "| MinTestEpRet | -887 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.65e+05 |\n", "| AverageQ1Vals | -96.7 |\n", "| StdQ1Vals | 155 |\n", "| 
MaxQ1Vals | 72.5 |\n", "| MinQ1Vals | -1.13e+03 |\n", "| AverageQ2Vals | -96.7 |\n", "| StdQ2Vals | 155 |\n", "| MaxQ2Vals | 75.7 |\n", "| MinQ2Vals | -1.2e+03 |\n", "| LossPi | 88.1 |\n", "| LossQ | 285 |\n", "| Time | 2.11e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 76 |\n", "| AverageEpRet | -639 |\n", "| StdEpRet | 315 |\n", "| MaxEpRet | -214 |\n", "| MinEpRet | -1.51e+03 |\n", "| AverageTestEpRet | -437 |\n", "| StdTestEpRet | 268 |\n", "| MaxTestEpRet | -19.2 |\n", "| MinTestEpRet | -1.04e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.67e+05 |\n", "| AverageQ1Vals | -95.7 |\n", "| StdQ1Vals | 153 |\n", "| MaxQ1Vals | 48.5 |\n", "| MinQ1Vals | -1.18e+03 |\n", "| AverageQ2Vals | -95.7 |\n", "| StdQ2Vals | 153 |\n", "| MaxQ2Vals | 46.2 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 86.8 |\n", "| LossQ | 285 |\n", "| Time | 2.14e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 77 |\n", "| AverageEpRet | -468 |\n", "| StdEpRet | 228 |\n", "| MaxEpRet | -125 |\n", "| MinEpRet | -901 |\n", "| AverageTestEpRet | -556 |\n", "| StdTestEpRet | 262 |\n", "| MaxTestEpRet | -148 |\n", "| MinTestEpRet | -812 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.69e+05 |\n", "| AverageQ1Vals | -95.7 |\n", "| StdQ1Vals | 153 |\n", "| MaxQ1Vals | 37.2 |\n", "| MinQ1Vals | -1.17e+03 |\n", "| AverageQ2Vals | -95.7 |\n", "| StdQ2Vals | 153 |\n", "| MaxQ2Vals | 49.4 |\n", "| MinQ2Vals | -1.13e+03 |\n", "| LossPi | 86.9 |\n", "| LossQ | 283 |\n", "| Time | 2.18e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 78 |\n", "| AverageEpRet | -568 |\n", "| StdEpRet | 284 |\n", "| MaxEpRet | -123 |\n", "| MinEpRet | -1.27e+03 |\n", "| AverageTestEpRet | -550 |\n", "| StdTestEpRet | 360 |\n", "| MaxTestEpRet | -164 |\n", "| MinTestEpRet | 
-1.26e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.72e+05 |\n", "| AverageQ1Vals | -94.5 |\n", "| StdQ1Vals | 151 |\n", "| MaxQ1Vals | 47.8 |\n", "| MinQ1Vals | -1.2e+03 |\n", "| AverageQ2Vals | -94.5 |\n", "| StdQ2Vals | 151 |\n", "| MaxQ2Vals | 92 |\n", "| MinQ2Vals | -1.18e+03 |\n", "| LossPi | 85.9 |\n", "| LossQ | 265 |\n", "| Time | 2.21e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 79 |\n", "| AverageEpRet | -566 |\n", "| StdEpRet | 337 |\n", "| MaxEpRet | -96.5 |\n", "| MinEpRet | -1.45e+03 |\n", "| AverageTestEpRet | -543 |\n", "| StdTestEpRet | 365 |\n", "| MaxTestEpRet | -134 |\n", "| MinTestEpRet | -1.41e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.74e+05 |\n", "| AverageQ1Vals | -94.8 |\n", "| StdQ1Vals | 151 |\n", "| MaxQ1Vals | 69.7 |\n", "| MinQ1Vals | -1.21e+03 |\n", "| AverageQ2Vals | -94.8 |\n", "| StdQ2Vals | 151 |\n", "| MaxQ2Vals | 75.6 |\n", "| MinQ2Vals | -1.21e+03 |\n", "| LossPi | 86.4 |\n", "| LossQ | 278 |\n", "| Time | 2.24e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 80 |\n", "| AverageEpRet | -616 |\n", "| StdEpRet | 290 |\n", "| MaxEpRet | -114 |\n", "| MinEpRet | -1.16e+03 |\n", "| AverageTestEpRet | -447 |\n", "| StdTestEpRet | 196 |\n", "| MaxTestEpRet | -182 |\n", "| MinTestEpRet | -783 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.76e+05 |\n", "| AverageQ1Vals | -94.6 |\n", "| StdQ1Vals | 151 |\n", "| MaxQ1Vals | 59.6 |\n", "| MinQ1Vals | -1.13e+03 |\n", "| AverageQ2Vals | -94.6 |\n", "| StdQ2Vals | 151 |\n", "| MaxQ2Vals | 74.6 |\n", "| MinQ2Vals | -1.13e+03 |\n", "| LossPi | 86.4 |\n", "| LossQ | 271 |\n", "| Time | 2.28e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 81 |\n", "| AverageEpRet | -535 |\n", "| StdEpRet | 217 |\n", "| 
MaxEpRet | -131 |\n", "| MinEpRet | -999 |\n", "| AverageTestEpRet | -422 |\n", "| StdTestEpRet | 270 |\n", "| MaxTestEpRet | -67.3 |\n", "| MinTestEpRet | -1.09e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.78e+05 |\n", "| AverageQ1Vals | -94.2 |\n", "| StdQ1Vals | 150 |\n", "| MaxQ1Vals | 47.4 |\n", "| MinQ1Vals | -1.15e+03 |\n", "| AverageQ2Vals | -94.2 |\n", "| StdQ2Vals | 150 |\n", "| MaxQ2Vals | 71 |\n", "| MinQ2Vals | -1.15e+03 |\n", "| LossPi | 85.8 |\n", "| LossQ | 263 |\n", "| Time | 2.31e+03 |\n", "---------------------------------------\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "---------------------------------------\n", "| Epoch | 82 |\n", "| AverageEpRet | -505 |\n", "| StdEpRet | 251 |\n", "| MaxEpRet | -79.9 |\n", "| MinEpRet | -1.01e+03 |\n", "| AverageTestEpRet | -734 |\n", "| StdTestEpRet | 289 |\n", "| MaxTestEpRet | -227 |\n", "| MinTestEpRet | -1.22e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.8e+05 |\n", "| AverageQ1Vals | -94.2 |\n", "| StdQ1Vals | 149 |\n", "| MaxQ1Vals | 53 |\n", "| MinQ1Vals | -1.09e+03 |\n", "| AverageQ2Vals | -94.2 |\n", "| StdQ2Vals | 149 |\n", "| MaxQ2Vals | 67.3 |\n", "| MinQ2Vals | -1.08e+03 |\n", "| LossPi | 86.6 |\n", "| LossQ | 267 |\n", "| Time | 2.35e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 83 |\n", "| AverageEpRet | -585 |\n", "| StdEpRet | 348 |\n", "| MaxEpRet | -96.7 |\n", "| MinEpRet | -1.3e+03 |\n", "| AverageTestEpRet | -436 |\n", "| StdTestEpRet | 169 |\n", "| MaxTestEpRet | -212 |\n", "| MinTestEpRet | -748 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.83e+05 |\n", "| AverageQ1Vals | -92.9 |\n", "| StdQ1Vals | 147 |\n", "| MaxQ1Vals | 44.3 |\n", "| MinQ1Vals | -1.18e+03 |\n", "| AverageQ2Vals | -92.9 |\n", "| StdQ2Vals | 147 |\n", "| MaxQ2Vals | 75.2 |\n", "| MinQ2Vals | -1.15e+03 |\n", "| LossPi | 84.8 |\n", "| 
LossQ | 263 |\n", "| Time | 2.38e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 84 |\n", "| AverageEpRet | -406 |\n", "| StdEpRet | 232 |\n", "| MaxEpRet | -128 |\n", "| MinEpRet | -924 |\n", "| AverageTestEpRet | -650 |\n", "| StdTestEpRet | 236 |\n", "| MaxTestEpRet | -198 |\n", "| MinTestEpRet | -1.01e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.85e+05 |\n", "| AverageQ1Vals | -92.5 |\n", "| StdQ1Vals | 146 |\n", "| MaxQ1Vals | 46.3 |\n", "| MinQ1Vals | -1.12e+03 |\n", "| AverageQ2Vals | -92.5 |\n", "| StdQ2Vals | 146 |\n", "| MaxQ2Vals | 80.6 |\n", "| MinQ2Vals | -1.11e+03 |\n", "| LossPi | 84.4 |\n", "| LossQ | 258 |\n", "| Time | 2.41e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 85 |\n", "| AverageEpRet | -474 |\n", "| StdEpRet | 247 |\n", "| MaxEpRet | -180 |\n", "| MinEpRet | -1.22e+03 |\n", "| AverageTestEpRet | -527 |\n", "| StdTestEpRet | 163 |\n", "| MaxTestEpRet | -166 |\n", "| MinTestEpRet | -737 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.87e+05 |\n", "| AverageQ1Vals | -91.8 |\n", "| StdQ1Vals | 145 |\n", "| MaxQ1Vals | 51.6 |\n", "| MinQ1Vals | -1.09e+03 |\n", "| AverageQ2Vals | -91.8 |\n", "| StdQ2Vals | 145 |\n", "| MaxQ2Vals | 33.2 |\n", "| MinQ2Vals | -1.06e+03 |\n", "| LossPi | 84.1 |\n", "| LossQ | 249 |\n", "| Time | 2.44e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 86 |\n", "| AverageEpRet | -431 |\n", "| StdEpRet | 264 |\n", "| MaxEpRet | -112 |\n", "| MinEpRet | -1.26e+03 |\n", "| AverageTestEpRet | -665 |\n", "| StdTestEpRet | 378 |\n", "| MaxTestEpRet | -261 |\n", "| MinTestEpRet | -1.55e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.89e+05 |\n", "| AverageQ1Vals | -91.6 |\n", "| StdQ1Vals | 146 |\n", "| MaxQ1Vals | 65.2 |\n", "| MinQ1Vals | 
-1.16e+03 |\n", "| AverageQ2Vals | -91.7 |\n", "| StdQ2Vals | 146 |\n", "| MaxQ2Vals | 67.6 |\n", "| MinQ2Vals | -1.12e+03 |\n", "| LossPi | 83.5 |\n", "| LossQ | 238 |\n", "| Time | 2.47e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 87 |\n", "| AverageEpRet | -515 |\n", "| StdEpRet | 228 |\n", "| MaxEpRet | -122 |\n", "| MinEpRet | -976 |\n", "| AverageTestEpRet | -420 |\n", "| StdTestEpRet | 202 |\n", "| MaxTestEpRet | -180 |\n", "| MinTestEpRet | -829 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.91e+05 |\n", "| AverageQ1Vals | -92.1 |\n", "| StdQ1Vals | 146 |\n", "| MaxQ1Vals | 48.9 |\n", "| MinQ1Vals | -1.17e+03 |\n", "| AverageQ2Vals | -92.1 |\n", "| StdQ2Vals | 146 |\n", "| MaxQ2Vals | 54.4 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 83.6 |\n", "| LossQ | 256 |\n", "| Time | 2.51e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 88 |\n", "| AverageEpRet | -572 |\n", "| StdEpRet | 258 |\n", "| MaxEpRet | -57 |\n", "| MinEpRet | -1.07e+03 |\n", "| AverageTestEpRet | -508 |\n", "| StdTestEpRet | 163 |\n", "| MaxTestEpRet | -217 |\n", "| MinTestEpRet | -794 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.94e+05 |\n", "| AverageQ1Vals | -91.3 |\n", "| StdQ1Vals | 145 |\n", "| MaxQ1Vals | 42.6 |\n", "| MinQ1Vals | -1.12e+03 |\n", "| AverageQ2Vals | -91.3 |\n", "| StdQ2Vals | 145 |\n", "| MaxQ2Vals | 58 |\n", "| MinQ2Vals | -1.09e+03 |\n", "| LossPi | 83.7 |\n", "| LossQ | 246 |\n", "| Time | 2.54e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 89 |\n", "| AverageEpRet | -503 |\n", "| StdEpRet | 241 |\n", "| MaxEpRet | -49.9 |\n", "| MinEpRet | -1.15e+03 |\n", "| AverageTestEpRet | -562 |\n", "| StdTestEpRet | 306 |\n", "| MaxTestEpRet | -68.2 |\n", "| MinTestEpRet | -1.15e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen 
| 110 |\n", "| TotalEnvInteracts | 1.96e+05 |\n", "| AverageQ1Vals | -90.3 |\n", "| StdQ1Vals | 144 |\n", "| MaxQ1Vals | 49.8 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -90.3 |\n", "| StdQ2Vals | 144 |\n", "| MaxQ2Vals | 54.1 |\n", "| MinQ2Vals | -1.15e+03 |\n", "| LossPi | 83 |\n", "| LossQ | 243 |\n", "| Time | 2.57e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 90 |\n", "| AverageEpRet | -478 |\n", "| StdEpRet | 286 |\n", "| MaxEpRet | -68 |\n", "| MinEpRet | -1.15e+03 |\n", "| AverageTestEpRet | -603 |\n", "| StdTestEpRet | 390 |\n", "| MaxTestEpRet | -123 |\n", "| MinTestEpRet | -1.55e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 1.98e+05 |\n", "| AverageQ1Vals | -89.9 |\n", "| StdQ1Vals | 143 |\n", "| MaxQ1Vals | 36.5 |\n", "| MinQ1Vals | -1.17e+03 |\n", "| AverageQ2Vals | -89.9 |\n", "| StdQ2Vals | 143 |\n", "| MaxQ2Vals | 65.2 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 82.6 |\n", "| LossQ | 237 |\n", "| Time | 2.6e+03 |\n", "---------------------------------------\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "---------------------------------------\n", "| Epoch | 91 |\n", "| AverageEpRet | -509 |\n", "| StdEpRet | 252 |\n", "| MaxEpRet | -101 |\n", "| MinEpRet | -1.12e+03 |\n", "| AverageTestEpRet | -566 |\n", "| StdTestEpRet | 308 |\n", "| MaxTestEpRet | -62.9 |\n", "| MinTestEpRet | -1.02e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2e+05 |\n", "| AverageQ1Vals | -89.9 |\n", "| StdQ1Vals | 143 |\n", "| MaxQ1Vals | 36.4 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -89.9 |\n", "| StdQ2Vals | 143 |\n", "| MaxQ2Vals | 25.5 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 82.7 |\n", "| LossQ | 241 |\n", "| Time | 2.63e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 92 |\n", "| AverageEpRet | -425 |\n", "| StdEpRet | 205 
|\n", "| MaxEpRet | -170 |\n", "| MinEpRet | -998 |\n", "| AverageTestEpRet | -536 |\n", "| StdTestEpRet | 271 |\n", "| MaxTestEpRet | -209 |\n", "| MinTestEpRet | -1.04e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.02e+05 |\n", "| AverageQ1Vals | -88.7 |\n", "| StdQ1Vals | 143 |\n", "| MaxQ1Vals | 36 |\n", "| MinQ1Vals | -1.14e+03 |\n", "| AverageQ2Vals | -88.7 |\n", "| StdQ2Vals | 143 |\n", "| MaxQ2Vals | 32.9 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 81.3 |\n", "| LossQ | 237 |\n", "| Time | 2.67e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 93 |\n", "| AverageEpRet | -498 |\n", "| StdEpRet | 277 |\n", "| MaxEpRet | -83.8 |\n", "| MinEpRet | -1.11e+03 |\n", "| AverageTestEpRet | -523 |\n", "| StdTestEpRet | 286 |\n", "| MaxTestEpRet | -83.5 |\n", "| MinTestEpRet | -967 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.05e+05 |\n", "| AverageQ1Vals | -88.2 |\n", "| StdQ1Vals | 144 |\n", "| MaxQ1Vals | 97.3 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -88.2 |\n", "| StdQ2Vals | 144 |\n", "| MaxQ2Vals | 36.8 |\n", "| MinQ2Vals | -1.18e+03 |\n", "| LossPi | 80.8 |\n", "| LossQ | 244 |\n", "| Time | 2.7e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 94 |\n", "| AverageEpRet | -470 |\n", "| StdEpRet | 231 |\n", "| MaxEpRet | -88.9 |\n", "| MinEpRet | -946 |\n", "| AverageTestEpRet | -407 |\n", "| StdTestEpRet | 194 |\n", "| MaxTestEpRet | -167 |\n", "| MinTestEpRet | -793 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.07e+05 |\n", "| AverageQ1Vals | -87.9 |\n", "| StdQ1Vals | 143 |\n", "| MaxQ1Vals | 48.9 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -87.9 |\n", "| StdQ2Vals | 143 |\n", "| MaxQ2Vals | 65.6 |\n", "| MinQ2Vals | -1.1e+03 |\n", "| LossPi | 80.4 |\n", "| LossQ | 244 |\n", "| Time | 2.73e+03 |\n", 
"---------------------------------------\n", "---------------------------------------\n", "| Epoch | 95 |\n", "| AverageEpRet | -471 |\n", "| StdEpRet | 257 |\n", "| MaxEpRet | -113 |\n", "| MinEpRet | -994 |\n", "| AverageTestEpRet | -563 |\n", "| StdTestEpRet | 152 |\n", "| MaxTestEpRet | -261 |\n", "| MinTestEpRet | -827 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.09e+05 |\n", "| AverageQ1Vals | -87.2 |\n", "| StdQ1Vals | 141 |\n", "| MaxQ1Vals | 30.3 |\n", "| MinQ1Vals | -1.14e+03 |\n", "| AverageQ2Vals | -87.2 |\n", "| StdQ2Vals | 141 |\n", "| MaxQ2Vals | 45.3 |\n", "| MinQ2Vals | -1.11e+03 |\n", "| LossPi | 80.3 |\n", "| LossQ | 243 |\n", "| Time | 2.76e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 96 |\n", "| AverageEpRet | -473 |\n", "| StdEpRet | 268 |\n", "| MaxEpRet | -76.1 |\n", "| MinEpRet | -1.03e+03 |\n", "| AverageTestEpRet | -392 |\n", "| StdTestEpRet | 191 |\n", "| MaxTestEpRet | -90.2 |\n", "| MinTestEpRet | -713 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.11e+05 |\n", "| AverageQ1Vals | -86.8 |\n", "| StdQ1Vals | 139 |\n", "| MaxQ1Vals | 32.9 |\n", "| MinQ1Vals | -1.09e+03 |\n", "| AverageQ2Vals | -86.8 |\n", "| StdQ2Vals | 139 |\n", "| MaxQ2Vals | 40.5 |\n", "| MinQ2Vals | -1.1e+03 |\n", "| LossPi | 79.5 |\n", "| LossQ | 233 |\n", "| Time | 2.79e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 97 |\n", "| AverageEpRet | -497 |\n", "| StdEpRet | 345 |\n", "| MaxEpRet | -37.1 |\n", "| MinEpRet | -1.17e+03 |\n", "| AverageTestEpRet | -420 |\n", "| StdTestEpRet | 227 |\n", "| MaxTestEpRet | -72.6 |\n", "| MinTestEpRet | -742 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.13e+05 |\n", "| AverageQ1Vals | -86.5 |\n", "| StdQ1Vals | 140 |\n", "| MaxQ1Vals | 43 |\n", "| MinQ1Vals | -1.17e+03 |\n", "| AverageQ2Vals | -86.5 |\n", "| 
StdQ2Vals | 140 |\n", "| MaxQ2Vals | 38.9 |\n", "| MinQ2Vals | -1.18e+03 |\n", "| LossPi | 79.6 |\n", "| LossQ | 234 |\n", "| Time | 2.82e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 98 |\n", "| AverageEpRet | -429 |\n", "| StdEpRet | 215 |\n", "| MaxEpRet | -135 |\n", "| MinEpRet | -848 |\n", "| AverageTestEpRet | -511 |\n", "| StdTestEpRet | 337 |\n", "| MaxTestEpRet | -92.5 |\n", "| MinTestEpRet | -1.37e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.16e+05 |\n", "| AverageQ1Vals | -86.1 |\n", "| StdQ1Vals | 139 |\n", "| MaxQ1Vals | 30.3 |\n", "| MinQ1Vals | -1.25e+03 |\n", "| AverageQ2Vals | -86.1 |\n", "| StdQ2Vals | 139 |\n", "| MaxQ2Vals | 43.7 |\n", "| MinQ2Vals | -1.21e+03 |\n", "| LossPi | 79.1 |\n", "| LossQ | 226 |\n", "| Time | 2.85e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 99 |\n", "| AverageEpRet | -514 |\n", "| StdEpRet | 278 |\n", "| MaxEpRet | -141 |\n", "| MinEpRet | -1.21e+03 |\n", "| AverageTestEpRet | -633 |\n", "| StdTestEpRet | 489 |\n", "| MaxTestEpRet | -181 |\n", "| MinTestEpRet | -1.66e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.18e+05 |\n", "| AverageQ1Vals | -84.8 |\n", "| StdQ1Vals | 139 |\n", "| MaxQ1Vals | 30.2 |\n", "| MinQ1Vals | -1.19e+03 |\n", "| AverageQ2Vals | -84.8 |\n", "| StdQ2Vals | 139 |\n", "| MaxQ2Vals | 27.5 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 77.7 |\n", "| LossQ | 225 |\n", "| Time | 2.88e+03 |\n", "---------------------------------------\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "---------------------------------------\n", "| Epoch | 100 |\n", "| AverageEpRet | -557 |\n", "| StdEpRet | 280 |\n", "| MaxEpRet | -26 |\n", "| MinEpRet | -1.17e+03 |\n", "| AverageTestEpRet | -544 |\n", "| StdTestEpRet | 372 |\n", "| MaxTestEpRet | -148 |\n", "| MinTestEpRet | -1.24e+03 |\n", "| EpLen | 
110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.2e+05 |\n", "| AverageQ1Vals | -84 |\n", "| StdQ1Vals | 139 |\n", "| MaxQ1Vals | 51.4 |\n", "| MinQ1Vals | -1.18e+03 |\n", "| AverageQ2Vals | -84 |\n", "| StdQ2Vals | 139 |\n", "| MaxQ2Vals | 43 |\n", "| MinQ2Vals | -1.22e+03 |\n", "| LossPi | 76.6 |\n", "| LossQ | 220 |\n", "| Time | 2.92e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 101 |\n", "| AverageEpRet | -434 |\n", "| StdEpRet | 192 |\n", "| MaxEpRet | -155 |\n", "| MinEpRet | -806 |\n", "| AverageTestEpRet | -418 |\n", "| StdTestEpRet | 152 |\n", "| MaxTestEpRet | -244 |\n", "| MinTestEpRet | -730 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.22e+05 |\n", "| AverageQ1Vals | -82.7 |\n", "| StdQ1Vals | 138 |\n", "| MaxQ1Vals | 35.3 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -82.7 |\n", "| StdQ2Vals | 138 |\n", "| MaxQ2Vals | 54.9 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 76.3 |\n", "| LossQ | 219 |\n", "| Time | 2.95e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 102 |\n", "| AverageEpRet | -625 |\n", "| StdEpRet | 341 |\n", "| MaxEpRet | -120 |\n", "| MinEpRet | -1.24e+03 |\n", "| AverageTestEpRet | -490 |\n", "| StdTestEpRet | 223 |\n", "| MaxTestEpRet | -73.4 |\n", "| MinTestEpRet | -824 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.24e+05 |\n", "| AverageQ1Vals | -81.2 |\n", "| StdQ1Vals | 137 |\n", "| MaxQ1Vals | 96.8 |\n", "| MinQ1Vals | -1.19e+03 |\n", "| AverageQ2Vals | -81.2 |\n", "| StdQ2Vals | 137 |\n", "| MaxQ2Vals | 71.4 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 74.2 |\n", "| LossQ | 213 |\n", "| Time | 2.99e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 103 |\n", "| AverageEpRet | -617 |\n", "| StdEpRet | 327 |\n", "| MaxEpRet | -104 |\n", "| MinEpRet | 
-1.32e+03 |\n", "| AverageTestEpRet | -561 |\n", "| StdTestEpRet | 214 |\n", "| MaxTestEpRet | -248 |\n", "| MinTestEpRet | -906 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.27e+05 |\n", "| AverageQ1Vals | -80.7 |\n", "| StdQ1Vals | 138 |\n", "| MaxQ1Vals | 70.5 |\n", "| MinQ1Vals | -1.15e+03 |\n", "| AverageQ2Vals | -80.7 |\n", "| StdQ2Vals | 138 |\n", "| MaxQ2Vals | 41 |\n", "| MinQ2Vals | -1.13e+03 |\n", "| LossPi | 74.1 |\n", "| LossQ | 204 |\n", "| Time | 3.02e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 104 |\n", "| AverageEpRet | -527 |\n", "| StdEpRet | 254 |\n", "| MaxEpRet | -65.7 |\n", "| MinEpRet | -1.01e+03 |\n", "| AverageTestEpRet | -425 |\n", "| StdTestEpRet | 224 |\n", "| MaxTestEpRet | -92.5 |\n", "| MinTestEpRet | -774 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.29e+05 |\n", "| AverageQ1Vals | -79.9 |\n", "| StdQ1Vals | 137 |\n", "| MaxQ1Vals | 41.1 |\n", "| MinQ1Vals | -1.13e+03 |\n", "| AverageQ2Vals | -79.9 |\n", "| StdQ2Vals | 137 |\n", "| MaxQ2Vals | 44.5 |\n", "| MinQ2Vals | -1.11e+03 |\n", "| LossPi | 73.2 |\n", "| LossQ | 217 |\n", "| Time | 3.05e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 105 |\n", "| AverageEpRet | -469 |\n", "| StdEpRet | 235 |\n", "| MaxEpRet | -144 |\n", "| MinEpRet | -1.12e+03 |\n", "| AverageTestEpRet | -317 |\n", "| StdTestEpRet | 137 |\n", "| MaxTestEpRet | -134 |\n", "| MinTestEpRet | -541 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.31e+05 |\n", "| AverageQ1Vals | -78.8 |\n", "| StdQ1Vals | 135 |\n", "| MaxQ1Vals | 24.5 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -78.8 |\n", "| StdQ2Vals | 135 |\n", "| MaxQ2Vals | 38.7 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 72.6 |\n", "| LossQ | 200 |\n", "| Time | 3.08e+03 |\n", "---------------------------------------\n", 
"---------------------------------------\n", "| Epoch | 106 |\n", "| AverageEpRet | -509 |\n", "| StdEpRet | 244 |\n", "| MaxEpRet | -114 |\n", "| MinEpRet | -989 |\n", "| AverageTestEpRet | -542 |\n", "| StdTestEpRet | 277 |\n", "| MaxTestEpRet | -129 |\n", "| MinTestEpRet | -965 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.33e+05 |\n", "| AverageQ1Vals | -79.1 |\n", "| StdQ1Vals | 136 |\n", "| MaxQ1Vals | 40.6 |\n", "| MinQ1Vals | -1.09e+03 |\n", "| AverageQ2Vals | -79.1 |\n", "| StdQ2Vals | 136 |\n", "| MaxQ2Vals | 54 |\n", "| MinQ2Vals | -1.11e+03 |\n", "| LossPi | 72.7 |\n", "| LossQ | 207 |\n", "| Time | 3.11e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 107 |\n", "| AverageEpRet | -571 |\n", "| StdEpRet | 245 |\n", "| MaxEpRet | -189 |\n", "| MinEpRet | -969 |\n", "| AverageTestEpRet | -538 |\n", "| StdTestEpRet | 189 |\n", "| MaxTestEpRet | -255 |\n", "| MinTestEpRet | -880 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.35e+05 |\n", "| AverageQ1Vals | -78.4 |\n", "| StdQ1Vals | 135 |\n", "| MaxQ1Vals | 33.8 |\n", "| MinQ1Vals | -1.11e+03 |\n", "| AverageQ2Vals | -78.4 |\n", "| StdQ2Vals | 135 |\n", "| MaxQ2Vals | 45.3 |\n", "| MinQ2Vals | -1.16e+03 |\n", "| LossPi | 71.6 |\n", "| LossQ | 202 |\n", "| Time | 3.15e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 108 |\n", "| AverageEpRet | -481 |\n", "| StdEpRet | 187 |\n", "| MaxEpRet | -110 |\n", "| MinEpRet | -837 |\n", "| AverageTestEpRet | -399 |\n", "| StdTestEpRet | 162 |\n", "| MaxTestEpRet | -149 |\n", "| MinTestEpRet | -668 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.38e+05 |\n", "| AverageQ1Vals | -78 |\n", "| StdQ1Vals | 135 |\n", "| MaxQ1Vals | 34 |\n", "| MinQ1Vals | -1.15e+03 |\n", "| AverageQ2Vals | -78 |\n", "| StdQ2Vals | 135 |\n", "| MaxQ2Vals | 41.9 |\n", "| MinQ2Vals | 
-1.14e+03 |\n", "| LossPi | 72.1 |\n", "| LossQ | 217 |\n", "| Time | 3.18e+03 |\n", "---------------------------------------\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "---------------------------------------\n", "| Epoch | 109 |\n", "| AverageEpRet | -476 |\n", "| StdEpRet | 272 |\n", "| MaxEpRet | -63.6 |\n", "| MinEpRet | -1.04e+03 |\n", "| AverageTestEpRet | -531 |\n", "| StdTestEpRet | 326 |\n", "| MaxTestEpRet | -90.1 |\n", "| MinTestEpRet | -1.19e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.4e+05 |\n", "| AverageQ1Vals | -76.9 |\n", "| StdQ1Vals | 134 |\n", "| MaxQ1Vals | 59 |\n", "| MinQ1Vals | -1.19e+03 |\n", "| AverageQ2Vals | -76.9 |\n", "| StdQ2Vals | 134 |\n", "| MaxQ2Vals | 42.2 |\n", "| MinQ2Vals | -1.18e+03 |\n", "| LossPi | 70.7 |\n", "| LossQ | 212 |\n", "| Time | 3.21e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 110 |\n", "| AverageEpRet | -523 |\n", "| StdEpRet | 321 |\n", "| MaxEpRet | -29.2 |\n", "| MinEpRet | -1.39e+03 |\n", "| AverageTestEpRet | -583 |\n", "| StdTestEpRet | 282 |\n", "| MaxTestEpRet | -187 |\n", "| MinTestEpRet | -1.03e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.42e+05 |\n", "| AverageQ1Vals | -76.8 |\n", "| StdQ1Vals | 135 |\n", "| MaxQ1Vals | 43.9 |\n", "| MinQ1Vals | -1.19e+03 |\n", "| AverageQ2Vals | -76.8 |\n", "| StdQ2Vals | 135 |\n", "| MaxQ2Vals | 53.2 |\n", "| MinQ2Vals | -1.19e+03 |\n", "| LossPi | 70.9 |\n", "| LossQ | 202 |\n", "| Time | 3.24e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 111 |\n", "| AverageEpRet | -453 |\n", "| StdEpRet | 254 |\n", "| MaxEpRet | -81.5 |\n", "| MinEpRet | -1.13e+03 |\n", "| AverageTestEpRet | -524 |\n", "| StdTestEpRet | 105 |\n", "| MaxTestEpRet | -339 |\n", "| MinTestEpRet | -689 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 
2.44e+05 |\n", "| AverageQ1Vals | -76.5 |\n", "| StdQ1Vals | 135 |\n", "| MaxQ1Vals | 30.1 |\n", "| MinQ1Vals | -1.19e+03 |\n", "| AverageQ2Vals | -76.5 |\n", "| StdQ2Vals | 135 |\n", "| MaxQ2Vals | 41.8 |\n", "| MinQ2Vals | -1.23e+03 |\n", "| LossPi | 70.4 |\n", "| LossQ | 207 |\n", "| Time | 3.27e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 112 |\n", "| AverageEpRet | -596 |\n", "| StdEpRet | 262 |\n", "| MaxEpRet | -173 |\n", "| MinEpRet | -1.26e+03 |\n", "| AverageTestEpRet | -415 |\n", "| StdTestEpRet | 161 |\n", "| MaxTestEpRet | -137 |\n", "| MinTestEpRet | -652 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.46e+05 |\n", "| AverageQ1Vals | -76.3 |\n", "| StdQ1Vals | 134 |\n", "| MaxQ1Vals | 34.9 |\n", "| MinQ1Vals | -1.19e+03 |\n", "| AverageQ2Vals | -76.3 |\n", "| StdQ2Vals | 134 |\n", "| MaxQ2Vals | 46.7 |\n", "| MinQ2Vals | -1.18e+03 |\n", "| LossPi | 70.3 |\n", "| LossQ | 198 |\n", "| Time | 3.3e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 113 |\n", "| AverageEpRet | -482 |\n", "| StdEpRet | 333 |\n", "| MaxEpRet | -62.8 |\n", "| MinEpRet | -1.44e+03 |\n", "| AverageTestEpRet | -559 |\n", "| StdTestEpRet | 304 |\n", "| MaxTestEpRet | -142 |\n", "| MinTestEpRet | -1.28e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.49e+05 |\n", "| AverageQ1Vals | -76.2 |\n", "| StdQ1Vals | 134 |\n", "| MaxQ1Vals | 38.3 |\n", "| MinQ1Vals | -1.18e+03 |\n", "| AverageQ2Vals | -76.2 |\n", "| StdQ2Vals | 134 |\n", "| MaxQ2Vals | 50.3 |\n", "| MinQ2Vals | -1.2e+03 |\n", "| LossPi | 69.7 |\n", "| LossQ | 200 |\n", "| Time | 3.33e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 114 |\n", "| AverageEpRet | -450 |\n", "| StdEpRet | 216 |\n", "| MaxEpRet | -94.9 |\n", "| MinEpRet | -872 |\n", "| AverageTestEpRet | -432 |\n", "| 
StdTestEpRet | 132 |\n", "| MaxTestEpRet | -232 |\n", "| MinTestEpRet | -645 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.51e+05 |\n", "| AverageQ1Vals | -75.7 |\n", "| StdQ1Vals | 132 |\n", "| MaxQ1Vals | 44.9 |\n", "| MinQ1Vals | -1.16e+03 |\n", "| AverageQ2Vals | -75.7 |\n", "| StdQ2Vals | 132 |\n", "| MaxQ2Vals | 44.4 |\n", "| MinQ2Vals | -1.13e+03 |\n", "| LossPi | 69.6 |\n", "| LossQ | 201 |\n", "| Time | 3.36e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 115 |\n", "| AverageEpRet | -487 |\n", "| StdEpRet | 240 |\n", "| MaxEpRet | -108 |\n", "| MinEpRet | -932 |\n", "| AverageTestEpRet | -371 |\n", "| StdTestEpRet | 152 |\n", "| MaxTestEpRet | -143 |\n", "| MinTestEpRet | -616 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.53e+05 |\n", "| AverageQ1Vals | -75.4 |\n", "| StdQ1Vals | 132 |\n", "| MaxQ1Vals | 21.2 |\n", "| MinQ1Vals | -1.14e+03 |\n", "| AverageQ2Vals | -75.4 |\n", "| StdQ2Vals | 132 |\n", "| MaxQ2Vals | 29.5 |\n", "| MinQ2Vals | -1.11e+03 |\n", "| LossPi | 69.7 |\n", "| LossQ | 205 |\n", "| Time | 3.4e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 116 |\n", "| AverageEpRet | -538 |\n", "| StdEpRet | 220 |\n", "| MaxEpRet | -110 |\n", "| MinEpRet | -960 |\n", "| AverageTestEpRet | -475 |\n", "| StdTestEpRet | 311 |\n", "| MaxTestEpRet | -173 |\n", "| MinTestEpRet | -1.23e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.55e+05 |\n", "| AverageQ1Vals | -75.4 |\n", "| StdQ1Vals | 132 |\n", "| MaxQ1Vals | 26 |\n", "| MinQ1Vals | -1.18e+03 |\n", "| AverageQ2Vals | -75.4 |\n", "| StdQ2Vals | 132 |\n", "| MaxQ2Vals | 37.1 |\n", "| MinQ2Vals | -1.17e+03 |\n", "| LossPi | 69.3 |\n", "| LossQ | 201 |\n", "| Time | 3.43e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 117 |\n", 
"| AverageEpRet | -437 |\n", "| StdEpRet | 203 |\n", "| MaxEpRet | -92.8 |\n", "| MinEpRet | -857 |\n", "| AverageTestEpRet | -582 |\n", "| StdTestEpRet | 247 |\n", "| MaxTestEpRet | -79.8 |\n", "| MinTestEpRet | -861 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.57e+05 |\n", "| AverageQ1Vals | -75.5 |\n", "| StdQ1Vals | 132 |\n", "| MaxQ1Vals | 49.5 |\n", "| MinQ1Vals | -1.13e+03 |\n", "| AverageQ2Vals | -75.5 |\n", "| StdQ2Vals | 132 |\n", "| MaxQ2Vals | 51 |\n", "| MinQ2Vals | -1.14e+03 |\n", "| LossPi | 69.4 |\n", "| LossQ | 201 |\n", "| Time | 3.47e+03 |\n", "---------------------------------------\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "---------------------------------------\n", "| Epoch | 118 |\n", "| AverageEpRet | -549 |\n", "| StdEpRet | 236 |\n", "| MaxEpRet | -111 |\n", "| MinEpRet | -1.28e+03 |\n", "| AverageTestEpRet | -588 |\n", "| StdTestEpRet | 404 |\n", "| MaxTestEpRet | -138 |\n", "| MinTestEpRet | -1.66e+03 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.6e+05 |\n", "| AverageQ1Vals | -75.1 |\n", "| StdQ1Vals | 130 |\n", "| MaxQ1Vals | 31.7 |\n", "| MinQ1Vals | -1.05e+03 |\n", "| AverageQ2Vals | -75.1 |\n", "| StdQ2Vals | 130 |\n", "| MaxQ2Vals | 38.6 |\n", "| MinQ2Vals | -1.05e+03 |\n", "| LossPi | 69 |\n", "| LossQ | 192 |\n", "| Time | 3.5e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 119 |\n", "| AverageEpRet | -491 |\n", "| StdEpRet | 247 |\n", "| MaxEpRet | -102 |\n", "| MinEpRet | -945 |\n", "| AverageTestEpRet | -535 |\n", "| StdTestEpRet | 217 |\n", "| MaxTestEpRet | -173 |\n", "| MinTestEpRet | -879 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.62e+05 |\n", "| AverageQ1Vals | -74.9 |\n", "| StdQ1Vals | 130 |\n", "| MaxQ1Vals | 60.9 |\n", "| MinQ1Vals | -1.11e+03 |\n", "| AverageQ2Vals | -74.9 |\n", "| StdQ2Vals | 130 |\n", "| MaxQ2Vals | 28.6 |\n", "| 
MinQ2Vals | -1.12e+03 |\n", "| LossPi | 69.2 |\n", "| LossQ | 204 |\n", "| Time | 3.53e+03 |\n", "---------------------------------------\n", "---------------------------------------\n", "| Epoch | 120 |\n", "| AverageEpRet | -431 |\n", "| StdEpRet | 249 |\n", "| MaxEpRet | -64.6 |\n", "| MinEpRet | -885 |\n", "| AverageTestEpRet | -519 |\n", "| StdTestEpRet | 242 |\n", "| MaxTestEpRet | -56.1 |\n", "| MinTestEpRet | -838 |\n", "| EpLen | 110 |\n", "| TestEpLen | 110 |\n", "| TotalEnvInteracts | 2.64e+05 |\n", "| AverageQ1Vals | -74.8 |\n", "| StdQ1Vals | 129 |\n", "| MaxQ1Vals | 105 |\n", "| MinQ1Vals | -1.11e+03 |\n", "| AverageQ2Vals | -74.8 |\n", "| StdQ2Vals | 129 |\n", "| MaxQ2Vals | 77.4 |\n", "| MinQ2Vals | -1.08e+03 |\n", "| LossPi | 69.1 |\n", "| LossQ | 197 |\n", "| Time | 3.56e+03 |\n", "---------------------------------------\n" ] } ], "source": [
    "# Setup experiment: spinup logs and checkpoints go under ./model\n",
    "logger_kwargs = {'output_dir': 'model', 'exp_name': 'v0'}\n",
    "\n",
    "# Run TD3 training\n",
    "spinup.td3_pytorch(\n",
    "    GyroscopeEnv,\n",
    "    seed=0,\n",
    "    steps_per_epoch=110*20,  # 20 episodes of max_ep_len steps per epoch\n",
    "    epochs=120,\n",
    "    replay_size=1000000,\n",
    "    gamma=0.95,\n",
    "    polyak=0.995,\n",
    "    batch_size=100,\n",
    "    start_steps=20000,\n",
    "    update_after=800,\n",
    "    update_every=50,\n",
    "    max_ep_len=110,\n",
    "    logger_kwargs=logger_kwargs,\n",
    ")"
] }, { "cell_type": "markdown", "metadata": { "colab_type": "text", "id": "Gn3Gp40bcOVz" }, "source": [ "## Test" ] }, { "cell_type": "code", "execution_count": 4, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 106 }, "colab_type": "code", "executionInfo": { "elapsed": 972, "status": "ok", "timestamp": 1584036455886, "user": { "displayName": "Matthieu Le Cauchois", "photoUrl": "https://lh3.googleusercontent.com/a-/AOh14GgY9gRlHHK-FHlINeRnTJw_wewJsr639GH8MAWl=s64", "userId": "10992927378504656501" }, "user_tz": -60 }, "id": "6GyY0wE-QBOj", "outputId": "9a5e9011-e024-4a65-8383-83c062cdcad9" }, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/home/matthieulc/Documents/MA2/PS1/ps1venv/lib/python3.6/site-packages/gym/logger.py:30: UserWarning: \u001b[33mWARN: Box bound precision lowered by casting to float32\u001b[0m\n", " warnings.warn(colorize('%s: %s'%('WARN', msg % args), 'yellow'))\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "-900.18321242575\n" ] } ], "source": [
    "# Create environment\n",
    "env = GyroscopeEnv()\n",
    "env.seed(2)\n",
    "\n",
    "# Create agent\n",
    "# NOTE: torch.load unpickles the file, so only load checkpoints you trust.\n",
    "agent = torch.load('model/pyt_save/model.pt')\n",
    "\n",
    "# Test parameters passed to env.reset\n",
    "x1,x2,x3,x4,x1_ref,x3_ref,w = 0,1,0,1,1,3,25\n",
    "state = env.reset(np.array([x1,x2,x3,x4,x1_ref,x3_ref,w]))\n",
    "val = []  # observation seen before each step\n",
    "act = []  # action applied at each step\n",
    "dt = 0.01  # NOTE(review): assumed to equal the environment's step size -- confirm\n",
    "time = np.arange(0, 4, dt)\n",
    "score = 0\n",
    "for i in range(len(time)):\n",
    "    val.append(state)\n",
    "    action = agent.act(torch.as_tensor(state, dtype=torch.float32))\n",
    "    act.append(action)\n",
    "    state, reward, done, _ = env.step(action)\n",
    "    score += reward\n",
    "    if done:\n",
    "        break\n",
    "\n",
    "# If the episode ended early, val/act are shorter than the planned horizon;\n",
    "# trim the time axis so the plots below get x and y of equal length.\n",
    "time = time[:len(val)]\n",
    "\n",
    "env.close()\n",
    "print(score)"
] }, { "cell_type": "markdown", "metadata": { "colab_type": "text", "id": "vvMjuRHDcfrE" }, "source": [ "## Plot" ] }, { "cell_type": "code", "execution_count": 5, "metadata": { "colab": { "base_uri": "https://localhost:8080/", "height": 1000 }, "colab_type": "code", "executionInfo": { "elapsed": 1856, "status": "ok", "timestamp": 1584036457424, "user": { "displayName": "Matthieu Le Cauchois", "photoUrl": "https://lh3.googleusercontent.com/a-/AOh14GgY9gRlHHK-FHlINeRnTJw_wewJsr639GH8MAWl=s64", "userId": "10992927378504656501" }, "user_tz": -60 }, "id": "aCZCqujgcMVA", "outputId": "05490294-aab8-4933-ca9b-e13ba85ecf6d" }, "outputs": [ { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [
    "def _plot_panel(ax, title, ylabel, series, style, reference=None):\n",
    "    \"\"\"Draw `series` (plus an optional dashed black `reference`) against `time` on `ax`.\"\"\"\n",
    "    ax.set_title(title, fontsize=20)\n",
    "    ax.set_xlabel('time (s)', fontsize=16)\n",
    "    ax.set_ylabel(ylabel, fontsize=16)\n",
    "    ax.grid()\n",
    "    ax.plot(time, series, style)\n",
    "    if reference is not None:\n",
    "        ax.plot(time, reference, color='black', linestyle='dashed')\n",
    "\n",
    "\n",
    "f, axs = plt.subplots(4, 2, figsize=(30, 30))\n",
    "\n",
    "# Row 1: gimbal angles with their reference values (dashed)\n",
    "_plot_panel(axs[0, 0], 'Red gimbal angle', r'$\\theta$ (rad)',\n",
    "            [row[0] for row in val], 'r-', reference=[row[4] for row in val])\n",
    "_plot_panel(axs[0, 1], 'Blue gimbal angle', r'$\\phi$ (rad)',\n",
    "            [row[2] for row in val], 'b-', reference=[row[5] for row in val])\n",
    "\n",
    "# Row 2: gimbal speeds\n",
    "_plot_panel(axs[1, 0], 'Red gimbal speed', r'$\\dot \\theta$ (rad/s)',\n",
    "            [row[1] for row in val], 'r-')\n",
    "_plot_panel(axs[1, 1], 'Blue gimbal speed', r'$\\dot \\phi$ (rad/s)',\n",
    "            [row[3] for row in val], 'b-')\n",
    "\n",
    "# Row 3: tracking errors (angle minus reference, passed through angle_normalize)\n",
    "_plot_panel(axs[2, 0], 'Red gimbal tracking error', r'$\\theta$ error (rad)',\n",
    "            [angle_normalize(row[0]- row[4]) for row in val], 'r-')\n",
    "_plot_panel(axs[2, 1], 'Blue gimbal tracking error', r'$\\phi$ error (rad)',\n",
    "            [angle_normalize(row[2]- row[5]) for row in val], 'b-')\n",
    "\n",
    "# Row 4: control inputs applied by the agent\n",
    "_plot_panel(axs[3, 0], 'Red gimbal input', r'u1 (V)',\n",
    "            [row[0] for row in act], 'r-')\n",
    "_plot_panel(axs[3, 1], 'Blue gimbal input', r'u2 (V)',\n",
    "            [row[1] for row in act], 'b-')\n",
    "\n",
    "plt.show()"
] }, { "cell_type": "markdown", "metadata": { "colab_type": "text", "id": "fz9r-gaStzpk" }, "source": [ "## 3D rendering" ] }, { "cell_type": "code", "execution_count": 8, "metadata": { "colab": {}, "colab_type": "code", "id": "HQM1E8JYc-cC" }, "outputs": [ { "data": { "text/html": [ "
" ], "text/plain": [ "" ] }, "metadata": {}, "output_type": "display_data" }, { "data": { "application/javascript": [ "if (typeof Jupyter !== \"undefined\") { window.__context = { glowscript_container: $(\"#glowscript\").removeAttr(\"id\")};}else{ element.textContent = ' ';}" ], "text/plain": [ "" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "# Scene\n", "scene = canvas(background=color.white) \n", "\n", "# Objects\n", "redGimbal = ring(pos=vector(0,0,0), axis=vector(0,0,1), radius=2, thickness=0.2,color=vector(0.9,0,0))\n", "blueGimbal1 = cylinder(pos=vector(0,0,0), axis=vector(0,2,0), radius=0.3,color=color.blue)\n", "blueGimbal2 = cylinder(pos=vector(0,0,0), axis=vector(0,-2,0), radius=0.3,color=color.blue)\n", "disk1 = cylinder(pos=vector(0,0,0), axis=vector(0,0,0.15), radius=1.3,color=color.yellow)\n", "disk2 = cylinder(pos=vector(0,0,0), axis=vector(0,0,-0.15), radius=1.3,color=color.yellow)\n", "baseR = extrusion(path=[vec(0,0,0), vec(0.7,0,0)],shape=[ shapes.circle(radius=0.5) ], pos=vec(2,0,0), color=color.black)\n", "baseL = extrusion(path=[vec(-0.7,0,0), vec(0,0,0)],shape=[ shapes.circle(radius=0.5) ], pos=vec(-2,0,0), color=color.black)\n", "\n", "loops = 0\n", "ctime = 0\n", "start = clock()\n", "N = 400\n", "\n", "for k in range(len(time)):\n", " rate(N)\n", " ct = clock()\n", " theta = val[k][0]\n", " phi = val[k][2]\n", " redGimbal.axis = vector(0,-sin(theta), cos(theta))\n", " blueGimbal1.axis = 2*vector(0,cos(theta), sin(theta))\n", " blueGimbal2.axis = -2*vector(0,cos(theta), sin(theta))\n", " disk1.axis = 0.15*vector(-sin(phi),-sin(theta)*cos(phi),cos(theta)*cos(phi))\n", " disk2.axis = -0.15*vector(-sin(phi),-sin(theta)*cos(phi),cos(theta)*cos(phi))\n", " ctime += clock()-ct\n", " loops += 1" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "accelerator": "GPU", "colab": { "collapsed_sections": [], "name": "gyroscope_ddpg_testing.ipynb", "provenance": [] 
}, "kernelspec": { "display_name": "ps1venv", "language": "python", "name": "ps1venv" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.6.9" } }, "nbformat": 4, "nbformat_minor": 1 }