mirror of
https://github.com/wassname/Run-Skeleton-Run.git
synced 2026-06-27 17:14:10 +08:00
add debug, vs multithread
This commit is contained in:
@@ -5,9 +5,10 @@
|
||||
"execution_count": 1,
|
||||
"metadata": {
|
||||
"ExecuteTime": {
|
||||
"end_time": "2018-01-18T08:48:06.489049Z",
|
||||
"start_time": "2018-01-18T08:48:06.486256Z"
|
||||
}
|
||||
"end_time": "2018-01-19T02:03:04.176331Z",
|
||||
"start_time": "2018-01-19T02:03:04.170597Z"
|
||||
},
|
||||
"collapsed": true
|
||||
},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
@@ -21,8 +22,8 @@
|
||||
"execution_count": 2,
|
||||
"metadata": {
|
||||
"ExecuteTime": {
|
||||
"end_time": "2018-01-18T08:48:06.842630Z",
|
||||
"start_time": "2018-01-18T08:48:06.490286Z"
|
||||
"end_time": "2018-01-19T02:03:04.586375Z",
|
||||
"start_time": "2018-01-19T02:03:04.178204Z"
|
||||
}
|
||||
},
|
||||
"outputs": [
|
||||
@@ -45,8 +46,8 @@
|
||||
"execution_count": 3,
|
||||
"metadata": {
|
||||
"ExecuteTime": {
|
||||
"end_time": "2018-01-18T08:48:06.881370Z",
|
||||
"start_time": "2018-01-18T08:48:06.844048Z"
|
||||
"end_time": "2018-01-19T02:03:04.627472Z",
|
||||
"start_time": "2018-01-19T02:03:04.587944Z"
|
||||
},
|
||||
"scrolled": true
|
||||
},
|
||||
@@ -56,32 +57,30 @@
|
||||
"text/plain": [
|
||||
"['ddpg/train.py',\n",
|
||||
" '--logdir',\n",
|
||||
" './outputs/logs_ddpg',\n",
|
||||
" './outputs/logs_ddpg2',\n",
|
||||
" '--num-threads',\n",
|
||||
" '1',\n",
|
||||
" '--ddpg-wrapper',\n",
|
||||
" '--skip-frames',\n",
|
||||
" '5',\n",
|
||||
" '--fail-reward',\n",
|
||||
" '-0.2',\n",
|
||||
" '3',\n",
|
||||
" '--reward-scale',\n",
|
||||
" '1',\n",
|
||||
" '--flip-state-action',\n",
|
||||
" '0.001',\n",
|
||||
" '--actor-layers',\n",
|
||||
" '64-64',\n",
|
||||
" '64-64-64',\n",
|
||||
" '--actor-layer-norm',\n",
|
||||
" '--actor-parameters-noise',\n",
|
||||
" '--actor-lr',\n",
|
||||
" '0.001',\n",
|
||||
" '--actor-lr-end',\n",
|
||||
" '0.00001',\n",
|
||||
" '0.000001',\n",
|
||||
" '--dynamics-lr',\n",
|
||||
" '0.0001',\n",
|
||||
" '--dynamics-lr-end',\n",
|
||||
" '0.0000001',\n",
|
||||
" '--critic-layers',\n",
|
||||
" '64-32',\n",
|
||||
" '--critic-layer-norm',\n",
|
||||
" '--critic-lr',\n",
|
||||
" '0.002',\n",
|
||||
" '--critic-lr-end',\n",
|
||||
" '0.00001',\n",
|
||||
" '0.000001',\n",
|
||||
" '--initial-epsilon',\n",
|
||||
" '0.5',\n",
|
||||
" '--final-epsilon',\n",
|
||||
@@ -96,18 +95,24 @@
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"os.sys.argv=\"ddpg/train.py --logdir ./outputs/logs_ddpg --num-threads 1 --ddpg-wrapper --skip-frames 5 --fail-reward -0.2 --reward-scale 1 --flip-state-action --actor-layers 64-64 --actor-layer-norm --actor-parameters-noise --actor-lr 0.001 --actor-lr-end 0.00001 --critic-layers 64-32 --critic-layer-norm --critic-lr 0.002 --critic-lr-end 0.00001 --initial-epsilon 0.5 --final-epsilon 0.001 --tau 0.0001\".split(\" \")\n",
|
||||
"os.sys.argv=\"ddpg/train.py --logdir ./outputs/logs_ddpg2 \\\n",
|
||||
"--num-threads 3 --num-train-threads 3 \\\n",
|
||||
"--reward-scale 0.001 \\\n",
|
||||
"--actor-layers 64-64-64 --actor-layer-norm --actor-parameters-noise --actor-lr 0.001 --actor-lr-end 0.000001 \\\n",
|
||||
"--dynamics-lr 0.0001 --dynamics-lr-end 0.0000001 \\\n",
|
||||
"--critic-layers 64-32 --critic-layer-norm --critic-lr 0.002 --critic-lr-end 0.000001 \\\n",
|
||||
"--initial-epsilon 0.5 --final-epsilon 0.001 --tau 0.0001\".split(\" \")\n",
|
||||
"os.sys.argv"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 5,
|
||||
"execution_count": null,
|
||||
"metadata": {
|
||||
"ExecuteTime": {
|
||||
"end_time": "2018-01-18T08:49:02.648421Z",
|
||||
"start_time": "2018-01-18T08:49:02.573206Z"
|
||||
}
|
||||
"start_time": "2018-01-19T02:03:03.852Z"
|
||||
},
|
||||
"collapsed": true
|
||||
},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
@@ -119,7 +124,7 @@
|
||||
"execution_count": null,
|
||||
"metadata": {
|
||||
"ExecuteTime": {
|
||||
"start_time": "2018-01-18T08:49:03.555Z"
|
||||
"start_time": "2018-01-19T02:03:03.855Z"
|
||||
},
|
||||
"scrolled": true
|
||||
},
|
||||
@@ -128,9 +133,7 @@
|
||||
"name": "stderr",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"[2018-01-18 16:49:08,700] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-18 16:49:08,777] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-18 16:49:08,780] Making new env: Pendulum-v0\n"
|
||||
"[2018-01-19 10:03:05,421] Making new env: Pendulum-v0\n"
|
||||
]
|
||||
},
|
||||
{
|
||||
@@ -148,6 +151,10 @@
|
||||
" (layer_norm_1): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_1): ReLU ()\n",
|
||||
" (linear_2): NoisyLinear (64 -> 64)\n",
|
||||
" (layer_norm_2): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_2): ReLU ()\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
")\n",
|
||||
@@ -163,13 +170,17 @@
|
||||
" (layer_norm_1): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_1): ReLU ()\n",
|
||||
" (linear_2): NoisyLinear (64 -> 64)\n",
|
||||
" (layer_norm_2): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_2): ReLU ()\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
" (policy_net): LinearNet (\n",
|
||||
" (net): Sequential (\n",
|
||||
" (linear_0): Linear (64 -> 1)\n",
|
||||
" (act_0): Tanh ()\n",
|
||||
" (act_0): ELU (alpha=1.0)\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
")\n",
|
||||
@@ -185,6 +196,10 @@
|
||||
" (layer_norm_1): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_1): ReLU ()\n",
|
||||
" (linear_2): NoisyLinear (64 -> 64)\n",
|
||||
" (layer_norm_2): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_2): ReLU ()\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
@@ -202,16 +217,123 @@
|
||||
" (layer_norm_1): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_1): ReLU ()\n",
|
||||
" (linear_2): NoisyLinear (64 -> 64)\n",
|
||||
" (layer_norm_2): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_2): ReLU ()\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
" (value_net): Linear (65 -> 3)\n",
|
||||
" (value_net): LinearNet (\n",
|
||||
" (net): Sequential (\n",
|
||||
" (linear_0): Linear (65 -> 64)\n",
|
||||
" (layer_norm_0): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_0): ReLU ()\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
" (value_net2): Linear (64 -> 3)\n",
|
||||
")\n"
|
||||
]
|
||||
},
|
||||
{
|
||||
"name": "stderr",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"[2018-01-19 10:03:05,570] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:03:05,589] Making new env: Pendulum-v0\n",
|
||||
"Process Process-1:\n",
|
||||
"Traceback (most recent call last):\n",
|
||||
" File \"/home/isisilon/.pyenv/versions/3.6.0/lib/python3.6/multiprocessing/process.py\", line 249, in _bootstrap\n",
|
||||
" self.run()\n",
|
||||
" File \"/home/isisilon/.pyenv/versions/3.6.0/lib/python3.6/multiprocessing/process.py\", line 93, in run\n",
|
||||
" self._target(*self._args, **self._kwargs)\n",
|
||||
" File \"/media/isisilon/Data/My_Documents/Documents/eclipse-workspace/ddpg_implicit_state/Run-Skeleton-Run/ddpg/model.py\", line 440, in train_single_thread\n",
|
||||
" logger.scalar_summary(key, value, update_step)\n",
|
||||
" File \"/media/isisilon/Data/My_Documents/Documents/eclipse-workspace/ddpg_implicit_state/Run-Skeleton-Run/common/logger.py\", line 17, in scalar_summary\n",
|
||||
" self.writer.add_scalar(tag, value, step)\n",
|
||||
" File \"/home/isisilon/.pyenv/versions/3.6.0/envs/jupyter3/lib/python3.6/site-packages/tensorboardX/writer.py\", line 262, in add_scalar\n",
|
||||
" self.file_writer.add_summary(scalar(tag, scalar_value), global_step)\n",
|
||||
" File \"/home/isisilon/.pyenv/versions/3.6.0/envs/jupyter3/lib/python3.6/site-packages/tensorboardX/summary.py\", line 88, in scalar\n",
|
||||
" assert(scalar.squeeze().ndim==0), 'scalar should be 0D'\n",
|
||||
"AttributeError: 'NoneType' object has no attribute 'squeeze'\n",
|
||||
"[2018-01-19 10:04:01,980] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:04:05,897] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:04:56,915] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:04:59,842] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:05:51,136] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:05:54,795] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:06:58,471] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:07:01,303] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:08:06,776] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:08:11,823] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:09:24,555] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:09:28,326] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:10:25,677] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:10:28,134] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:11:21,746] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:11:22,767] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:12:19,668] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:12:20,498] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:13:16,087] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:13:19,701] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:14:20,287] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:14:25,255] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:15:25,534] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:15:30,307] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:16:24,529] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:16:27,554] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:17:23,602] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:17:24,952] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:18:19,517] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:18:21,783] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:19:17,384] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:19:19,827] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:20:15,270] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:20:15,364] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:21:09,305] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:21:12,535] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:22:03,694] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:22:05,211] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:22:59,166] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:23:03,510] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:23:52,806] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:23:58,895] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:24:44,687] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:24:52,964] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:25:37,681] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:25:51,033] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:26:34,755] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:26:45,860] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:27:27,254] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:27:44,223] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:28:25,083] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:28:40,452] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:29:21,854] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:29:40,183] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:30:20,224] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:30:43,777] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:31:21,376] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:31:43,822] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:32:19,617] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:32:42,093] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:33:13,267] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:33:38,685] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:34:08,173] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:34:36,100] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:35:03,554] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:35:31,869] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:36:02,086] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:36:30,077] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:37:04,189] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:37:33,748] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:38:03,424] Making new env: Pendulum-v0\n",
|
||||
"[2018-01-19 10:38:35,036] Making new env: Pendulum-v0\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"os.environ['OMP_NUM_THREADS'] = '1'\n",
|
||||
"os.environ['OMP_NUM_THREADS'] = '3'\n",
|
||||
"torch.set_num_threads(1)\n",
|
||||
"args = parse_args()\n",
|
||||
"train(args,\n",
|
||||
@@ -227,7 +349,8 @@
|
||||
"execution_count": null,
|
||||
"metadata": {
|
||||
"ExecuteTime": {
|
||||
"start_time": "2018-01-18T08:39:00.927Z"
|
||||
"end_time": "2018-01-19T02:01:33.149379Z",
|
||||
"start_time": "2018-01-19T02:01:30.923966Z"
|
||||
}
|
||||
},
|
||||
"outputs": [],
|
||||
@@ -239,7 +362,8 @@
|
||||
"metadata": {
|
||||
"ExecuteTime": {
|
||||
"start_time": "2018-01-18T08:39:00.929Z"
|
||||
}
|
||||
},
|
||||
"collapsed": true
|
||||
},
|
||||
"outputs": [],
|
||||
"source": []
|
||||
|
||||
@@ -0,0 +1,362 @@
|
||||
{
|
||||
"cells": [
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 6,
|
||||
"metadata": {
|
||||
"ExecuteTime": {
|
||||
"end_time": "2018-01-19T02:39:09.387985Z",
|
||||
"start_time": "2018-01-19T02:39:09.291235Z"
|
||||
},
|
||||
"collapsed": true
|
||||
},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"import os\n",
|
||||
"os.environ['CUDA_VISIBLE_DEVICES']=\"\"\n",
|
||||
"os.environ[\"PYTHONPATH\"]='.'"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 7,
|
||||
"metadata": {
|
||||
"ExecuteTime": {
|
||||
"end_time": "2018-01-19T02:39:09.542108Z",
|
||||
"start_time": "2018-01-19T02:39:09.390592Z"
|
||||
}
|
||||
},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"Populating the interactive namespace from numpy and matplotlib\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"%pylab --no-import-all inline\n",
|
||||
"%reload_ext autoreload\n",
|
||||
"%autoreload 2"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 8,
|
||||
"metadata": {
|
||||
"ExecuteTime": {
|
||||
"end_time": "2018-01-19T02:39:09.722311Z",
|
||||
"start_time": "2018-01-19T02:39:09.552596Z"
|
||||
},
|
||||
"scrolled": true
|
||||
},
|
||||
"outputs": [
|
||||
{
|
||||
"data": {
|
||||
"text/plain": [
|
||||
"['ddpg/train.py',\n",
|
||||
" '--logdir',\n",
|
||||
" './outputs/logs_ddpg',\n",
|
||||
" '--num-threads',\n",
|
||||
" '1',\n",
|
||||
" '--reward-scale',\n",
|
||||
" '1',\n",
|
||||
" '--actor-layers',\n",
|
||||
" '64-64-64',\n",
|
||||
" '--actor-layer-norm',\n",
|
||||
" '--actor-parameters-noise',\n",
|
||||
" '--actor-lr',\n",
|
||||
" '0.001',\n",
|
||||
" '--actor-lr-end',\n",
|
||||
" '0.000001',\n",
|
||||
" '--dynamics-lr',\n",
|
||||
" '0.0001',\n",
|
||||
" '--dynamics-lr-end',\n",
|
||||
" '0.0000001',\n",
|
||||
" '--critic-layers',\n",
|
||||
" '64-32',\n",
|
||||
" '--critic-layer-norm',\n",
|
||||
" '--critic-lr',\n",
|
||||
" '0.002',\n",
|
||||
" '--critic-lr-end',\n",
|
||||
" '0.000001',\n",
|
||||
" '--initial-epsilon',\n",
|
||||
" '0.5',\n",
|
||||
" '--final-epsilon',\n",
|
||||
" '0.001',\n",
|
||||
" '--tau',\n",
|
||||
" '0.0001']"
|
||||
]
|
||||
},
|
||||
"execution_count": 8,
|
||||
"metadata": {},
|
||||
"output_type": "execute_result"
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"os.sys.argv=\"ddpg/train.py --logdir ./outputs/logs_ddpg \\\n",
|
||||
"--num-threads 1 \\\n",
|
||||
"--reward-scale 1 \\\n",
|
||||
"--actor-layers 64-64-64 --actor-layer-norm --actor-parameters-noise --actor-lr 0.001 --actor-lr-end 0.000001 \\\n",
|
||||
"--dynamics-lr 0.0001 --dynamics-lr-end 0.0000001 \\\n",
|
||||
"--critic-layers 64-32 --critic-layer-norm --critic-lr 0.002 --critic-lr-end 0.000001 \\\n",
|
||||
"--initial-epsilon 0.5 --final-epsilon 0.001 --tau 0.0001\".split(\" \")\n",
|
||||
"os.sys.argv"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 9,
|
||||
"metadata": {
|
||||
"ExecuteTime": {
|
||||
"end_time": "2018-01-19T02:39:09.829347Z",
|
||||
"start_time": "2018-01-19T02:39:09.724292Z"
|
||||
},
|
||||
"collapsed": true
|
||||
},
|
||||
"outputs": [],
|
||||
"source": [
|
||||
"from ddpg.train import *"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": 10,
|
||||
"metadata": {
|
||||
"ExecuteTime": {
|
||||
"end_time": "2018-01-19T02:39:18.905244Z",
|
||||
"start_time": "2018-01-19T02:39:09.834586Z"
|
||||
},
|
||||
"scrolled": true
|
||||
},
|
||||
"outputs": [
|
||||
{
|
||||
"name": "stderr",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"[2018-01-19 10:39:09,999] Making new env: Pendulum-v0\n"
|
||||
]
|
||||
},
|
||||
{
|
||||
"name": "stdout",
|
||||
"output_type": "stream",
|
||||
"text": [
|
||||
"Base (\n",
|
||||
" (feature_net): LinearNet (\n",
|
||||
" (net): Sequential (\n",
|
||||
" (linear_0): NoisyLinear (3 -> 64)\n",
|
||||
" (layer_norm_0): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_0): ReLU ()\n",
|
||||
" (linear_1): NoisyLinear (64 -> 64)\n",
|
||||
" (layer_norm_1): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_1): ReLU ()\n",
|
||||
" (linear_2): NoisyLinear (64 -> 64)\n",
|
||||
" (layer_norm_2): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_2): ReLU ()\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
")\n",
|
||||
"ActorHead (\n",
|
||||
" (base): Base (\n",
|
||||
" (feature_net): LinearNet (\n",
|
||||
" (net): Sequential (\n",
|
||||
" (linear_0): NoisyLinear (3 -> 64)\n",
|
||||
" (layer_norm_0): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_0): ReLU ()\n",
|
||||
" (linear_1): NoisyLinear (64 -> 64)\n",
|
||||
" (layer_norm_1): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_1): ReLU ()\n",
|
||||
" (linear_2): NoisyLinear (64 -> 64)\n",
|
||||
" (layer_norm_2): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_2): ReLU ()\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
" (policy_net): LinearNet (\n",
|
||||
" (net): Sequential (\n",
|
||||
" (linear_0): Linear (64 -> 1)\n",
|
||||
" (act_0): ELU (alpha=1.0)\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
")\n",
|
||||
"CriticHead (\n",
|
||||
" (base): Base (\n",
|
||||
" (feature_net): LinearNet (\n",
|
||||
" (net): Sequential (\n",
|
||||
" (linear_0): NoisyLinear (3 -> 64)\n",
|
||||
" (layer_norm_0): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_0): ReLU ()\n",
|
||||
" (linear_1): NoisyLinear (64 -> 64)\n",
|
||||
" (layer_norm_1): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_1): ReLU ()\n",
|
||||
" (linear_2): NoisyLinear (64 -> 64)\n",
|
||||
" (layer_norm_2): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_2): ReLU ()\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
" (value_net): Linear (64 -> 1)\n",
|
||||
")\n",
|
||||
"DynamicsHead (\n",
|
||||
" (base): Base (\n",
|
||||
" (feature_net): LinearNet (\n",
|
||||
" (net): Sequential (\n",
|
||||
" (linear_0): NoisyLinear (3 -> 64)\n",
|
||||
" (layer_norm_0): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_0): ReLU ()\n",
|
||||
" (linear_1): NoisyLinear (64 -> 64)\n",
|
||||
" (layer_norm_1): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_1): ReLU ()\n",
|
||||
" (linear_2): NoisyLinear (64 -> 64)\n",
|
||||
" (layer_norm_2): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_2): ReLU ()\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
" (value_net): LinearNet (\n",
|
||||
" (net): Sequential (\n",
|
||||
" (linear_0): Linear (65 -> 64)\n",
|
||||
" (layer_norm_0): LayerNorm (\n",
|
||||
" )\n",
|
||||
" (act_0): ReLU ()\n",
|
||||
" )\n",
|
||||
" )\n",
|
||||
" (value_net2): Linear (64 -> 3)\n",
|
||||
")\n"
|
||||
]
|
||||
}
|
||||
],
|
||||
"source": [
|
||||
"os.environ['OMP_NUM_THREADS'] = '1'\n",
|
||||
"torch.set_num_threads(1)\n",
|
||||
"args = parse_args()\n",
|
||||
"train(args,\n",
|
||||
" create_model,\n",
|
||||
" create_act_update_fns,\n",
|
||||
" train_multi_thread,\n",
|
||||
" train_single_thread,\n",
|
||||
" play_single_thread)"
|
||||
]
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": null,
|
||||
"metadata": {
|
||||
"ExecuteTime": {
|
||||
"start_time": "2018-01-18T08:39:00.927Z"
|
||||
},
|
||||
"collapsed": true
|
||||
},
|
||||
"outputs": [],
|
||||
"source": []
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": null,
|
||||
"metadata": {
|
||||
"ExecuteTime": {
|
||||
"start_time": "2018-01-18T08:39:00.929Z"
|
||||
},
|
||||
"collapsed": true
|
||||
},
|
||||
"outputs": [],
|
||||
"source": []
|
||||
},
|
||||
{
|
||||
"cell_type": "code",
|
||||
"execution_count": null,
|
||||
"metadata": {
|
||||
"collapsed": true
|
||||
},
|
||||
"outputs": [],
|
||||
"source": []
|
||||
}
|
||||
],
|
||||
"metadata": {
|
||||
"kernelspec": {
|
||||
"display_name": "jupyter3",
|
||||
"language": "python",
|
||||
"name": "jupyter3"
|
||||
},
|
||||
"language_info": {
|
||||
"codemirror_mode": {
|
||||
"name": "ipython",
|
||||
"version": 3
|
||||
},
|
||||
"file_extension": ".py",
|
||||
"mimetype": "text/x-python",
|
||||
"name": "python",
|
||||
"nbconvert_exporter": "python",
|
||||
"pygments_lexer": "ipython3",
|
||||
"version": "3.6.0"
|
||||
},
|
||||
"toc": {
|
||||
"colors": {
|
||||
"hover_highlight": "#DAA520",
|
||||
"navigate_num": "#000000",
|
||||
"navigate_text": "#333333",
|
||||
"running_highlight": "#FF0000",
|
||||
"selected_highlight": "#FFD700",
|
||||
"sidebar_border": "#EEEEEE",
|
||||
"wrapper_background": "#FFFFFF"
|
||||
},
|
||||
"moveMenuLeft": true,
|
||||
"nav_menu": {
|
||||
"height": "12px",
|
||||
"width": "252px"
|
||||
},
|
||||
"navigate_menu": true,
|
||||
"number_sections": true,
|
||||
"sideBar": true,
|
||||
"threshold": 4,
|
||||
"toc_cell": false,
|
||||
"toc_section_display": "block",
|
||||
"toc_window_display": false,
|
||||
"widenNotebook": false
|
||||
},
|
||||
"varInspector": {
|
||||
"cols": {
|
||||
"lenName": 16,
|
||||
"lenType": 16,
|
||||
"lenVar": 40
|
||||
},
|
||||
"kernels_config": {
|
||||
"python": {
|
||||
"delete_cmd_postfix": "",
|
||||
"delete_cmd_prefix": "del ",
|
||||
"library": "var_list.py",
|
||||
"varRefreshCmd": "print(var_dic_list())"
|
||||
},
|
||||
"r": {
|
||||
"delete_cmd_postfix": ") ",
|
||||
"delete_cmd_prefix": "rm(",
|
||||
"library": "var_list.r",
|
||||
"varRefreshCmd": "cat(var_dic_list()) "
|
||||
}
|
||||
},
|
||||
"types_to_exclude": [
|
||||
"module",
|
||||
"function",
|
||||
"builtin_function_or_method",
|
||||
"instance",
|
||||
"_Feature"
|
||||
],
|
||||
"window_display": false
|
||||
}
|
||||
},
|
||||
"nbformat": 4,
|
||||
"nbformat_minor": 2
|
||||
}
|
||||
Reference in New Issue
Block a user