try plan2explore

This commit is contained in:
wassname
2024-06-08 11:04:39 +08:00
parent 66440b0e48
commit d8a207144f
2 changed files with 32 additions and 25 deletions
+27 -24
View File
@@ -149,30 +149,33 @@ craftax:
imag_gradient: 'reinforce' imag_gradient: 'reinforce'
time_limit: 4000 time_limit: 4000
# craftax_small: craftax_small:
# task: craftax_Craftax-Symbolic-AutoReset-v1 task: craftax_Craftax-Symbolic-AutoReset-v1
# step: 1e6 step: 1e6
# action_repeat: 1 action_repeat: 1
# envs: 1 envs: 1
# train_ratio: 512 train_ratio: 512
# video_pred_log: false video_pred_log: true
# dyn_hidden: 256 dyn_hidden: 256
# dyn_deter: 256 dyn_deter: 512
# dyn_stoch: 24 dyn_stoch: 24
# dyn_discrete: 24 dyn_discrete: 24
# # note: depth is cnn hidden_dim # note: depth is cnn hidden_dim
# encoder: {cnn_keys: 'state_map', cnn_depth: 32, kernel_size: 4, minres: 2, mlp_keys: "state_inventory", mlp_layers: 2, mlp_units: 16} encoder: {cnn_keys: 'state_map', cnn_depth: 48, kernel_size: 4, minres: 2, mlp_keys: "state_inventory", mlp_layers: 2, mlp_units: 128}
# decoder: {cnn_keys: 'state_map', cnn_depth: 32, kernel_size: 4, minres: 2, mlp_keys: "state_inventory", mlp_layers: 2, mlp_units: 16} decoder: {cnn_keys: 'state_map', cnn_depth: 48, kernel_size: 4, minres: 2, mlp_keys: "state_inventory", mlp_layers: 2, mlp_units: 128}
# actor: {layers: 3, dist: 'onehot', std: 'none'} actor: {layers: 3, dist: 'onehot', std: 'none'}
# value: {layers: 3} value: {layers: 3}
# # note units is the head hidden_dim # note units is the head hidden_dim
# units: 256 units: 256
# reward_head: {layers: 3} reward_head: {layers: 4}
# cont_head: {layers: 3} cont_head: {layers: 4}
# imag_gradient: 'reinforce' imag_gradient: 'reinforce'
# batch_size: 256 batch_size: 96
# batch_length: 32 batch_length: 48
# time_limit: 4000 time_limit: 6000
dataset_size: 20_000
precision: 16
expl_behavior: plan2explore
craftax_smaller: craftax_smaller:
task: craftax_Craftax-Symbolic-AutoReset-v1 task: craftax_Craftax-Symbolic-AutoReset-v1
+5 -1
View File
@@ -4,9 +4,13 @@ set export
export OSTYPE := "linux-gnu" export OSTYPE := "linux-gnu"
export TQDM_MININTERVAL := "30" export TQDM_MININTERVAL := "30"
main: craftax_smaller:
. ./.venv/bin/activate . ./.venv/bin/activate
python dreamer.py --configs craftax_smaller --logdir ./logdir/craftax_smaller python dreamer.py --configs craftax_smaller --logdir ./logdir/craftax_smaller
craftax_small:
. ./.venv/bin/activate
python dreamer.py --configs craftax_small --logdir ./logdir/craftax_small2
logs: logs:
tensorboard --logdir logdir/craftax tensorboard --logdir logdir/craftax