-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathconfig.yaml
111 lines (108 loc) · 2.58 KB
/
config.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
# Settings for the CartPole-v0 entry (keyed by environment id).
CartPole-v0:
  env: CartPole-v0
  max_epochs: 10
  batch_size: 32
  abstract_state_dim: 128
  lr_decay: 0.95
  optimizer:
    name: Adam
    # Plain float instead of `!!python/float 1e-2`: same value, but it also
    # loads under safe loaders, which reject language-specific tags.
    params:
      lr: 0.01
  # NOTE(review): the original nesting of the commented-out keys below could
  # not be recovered; they are kept at entry level — confirm before enabling.
  # grad_clip_norm: 1.0
  # qnet_lr: 0.0005
  # encoder_lr: 0.0005
  gamma: 0.99
  sync_rate: 20
  replay_size: 1000
  warm_start_size: 1000
  eps_last_frame: 500
  eps_start: 1.0
  eps_end: 0.01
  max_episode_length: 200
  max_episode_reward: 200
  planning_depth: 0
  is_atari: false
  replace: true
  update_experience: true
  logger_dir: lightning_dirs/cartpole
  # NOTE(review): machine-specific absolute path; value left unchanged, but a
  # repo-relative path (like logger_dir) would be portable — confirm.
  plot_dir: /home/aayn/Programming/crar-pytorch/plots/cartpole
# Settings for the PongNoFrameskip-v4 entry (keyed by environment id).
# NOTE(review): unlike the other entries in this file, no plot_dir is set
# here — confirm the consumer treats that key as optional.
PongNoFrameskip-v4:
  env: PongNoFrameskip-v4
  max_epochs: 50000
  batch_size: 32
  abstract_state_dim: 100
  lr_decay: 0.95
  optimizer:
    name: Adam
    # Plain float instead of `!!python/float 1e-4`: same value, but it also
    # loads under safe loaders, which reject language-specific tags.
    params:
      lr: 0.0001
  # NOTE(review): the original nesting of the commented-out keys below could
  # not be recovered; they are kept at entry level — confirm before enabling.
  # qnet_lr: 0.0005
  # encoder_lr: 0.0005
  gamma: 0.99
  sync_rate: 1000
  replay_size: 10000
  warm_start_size: 10000
  eps_last_frame: 50000
  eps_start: 1.0
  eps_end: 0.01
  max_episode_length: 5000
  max_episode_reward: 21
  planning_depth: 0
  is_atari: true
  replace: true
  update_experience: true
  logger_dir: lightning_dirs/pong
# Settings for the SimpleMaze-v0 entry (keyed by environment id).
SimpleMaze-v0:
  env: SimpleMaze-v0
  max_epochs: 500
  batch_size: 32
  abstract_state_dim: 2
  # NOTE(review): lr is set both here and in optimizer.params (same value);
  # which one the consumer reads is not visible here — keep them in sync.
  # Written as a plain float instead of `!!python/float 5e-4` so that safe
  # loaders, which reject language-specific tags, can read it.
  lr: 0.0005
  lr_decay: 0.95
  optimizer:
    name: RMSprop
    params:
      lr: 0.0005
  # NOTE(review): the original nesting of grad_clip_norm (entry level vs.
  # under optimizer) could not be recovered; placed at entry level — confirm
  # against the code that reads it.
  grad_clip_norm: 1.0
  # qnet_lr: 0.0005
  # encoder_lr: 0.0005
  gamma: 0.99
  sync_rate: 1000  # freeze interval
  replay_size: 5000
  warm_start_size: 5000
  eps_last_frame: 10000
  eps_start: 1.0
  eps_end: 1.0  # Random actions
  max_episode_length: 2000
  max_episode_reward: 0
  planning_depth: 0
  is_atari: false
  replace: true
  update_experience: false
  logger_dir: lightning_dirs/simple_mazev0
  # NOTE(review): machine-specific absolute path; value left unchanged, but a
  # repo-relative path (like logger_dir) would be portable — confirm.
  plot_dir: /home/aayn/Programming/crar-pytorch/plots/simple_maze_v0
# Settings for the SimpleMaze-v1 entry (keyed by environment id).
SimpleMaze-v1:
  env: SimpleMaze-v1
  max_epochs: 500
  batch_size: 32
  abstract_state_dim: 2
  # NOTE(review): lr is set both here and in optimizer.params (same value);
  # which one the consumer reads is not visible here — keep them in sync.
  # Written as a plain float instead of `!!python/float 5e-4` so that safe
  # loaders, which reject language-specific tags, can read it.
  lr: 0.0005
  lr_decay: 0.95
  optimizer:
    name: RMSprop
    params:
      lr: 0.0005
  # NOTE(review): the original nesting of grad_clip_norm (entry level vs.
  # under optimizer) could not be recovered; placed at entry level — confirm
  # against the code that reads it.
  grad_clip_norm: 1.0
  # qnet_lr: 0.0005
  # encoder_lr: 0.0005
  gamma: 0.99
  sync_rate: 1000  # freeze interval
  replay_size: 5000
  warm_start_size: 5000
  eps_last_frame: 10000
  eps_start: 1.0
  # NOTE(review): this line used to carry the comment "Random actions", which
  # matches the SimpleMaze-v0 entry (eps_end: 1.0) but looks stale for 0.01
  # — confirm.
  eps_end: 0.01
  max_episode_length: 500
  max_episode_reward: 100
  planning_depth: 0
  is_atari: false
  replace: true
  update_experience: true
  logger_dir: lightning_dirs/simple_mazev1
  # NOTE(review): machine-specific absolute path; value left unchanged, but a
  # repo-relative path (like logger_dir) would be portable — confirm.
  plot_dir: /home/aayn/Programming/crar-pytorch/plots/simple_maze_v1