-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathtrain_kill_enemies.ron
64 lines (64 loc) · 1.38 KB
/
train_kill_enemies.ron
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
// Training run configuration: one `TrainConfig` value with nested sections for
// the environment, network, optimizer, PPO and rollout settings, followed by
// top-level run options.
// NOTE(review): the sizes below (2 layers, d_model 32, 2000 total timesteps)
// look like a quick smoke-test setup rather than a real training run — confirm.
TrainConfig(
version: 4,
// Environment selection.
// NOTE(review): the page this file was captured from names it
// train_kill_enemies.ron, yet the env id here is "MoveToOrigin" — confirm
// that the id is the intended one.
env: EnvConfig(
// A string containing "{}" — presumably serialized keyword arguments for the
// environment, empty here. TODO confirm the expected encoding.
kwargs: "{}",
id: "MoveToOrigin",
validate: true,
),
// Network settings.
net: RogueNetConfig(
// All three *_pdrop values are 0.0 (presumably dropout probabilities, i.e.
// dropout disabled — verify against the network implementation).
embd_pdrop: 0.0,
resid_pdrop: 0.0,
attn_pdrop: 0.0,
n_layer: 2,
n_head: 2,
d_model: 32,
pooling: None,
relpos_encoding: None,
// 16 equals d_model / n_head (32 / 2); whether the two must stay in sync is
// not visible from this file — TODO confirm before changing either.
d_qk: 16,
translation: None,
),
// Optimizer settings.
optim: OptimizerConfig(
lr: 0.0001,
lr_warmup_steps: None,
// 256 divides rollout.steps * rollout.num_envs (1024 * 1) into 4 equal parts;
// presumably the minibatch size — verify.
bs: 256,
weight_decay: 0.0,
micro_bs: None,
anneal_lr: true,
update_epochs: 3,
max_grad_norm: 2.0,
),
// PPO settings.
ppo: PPOConfig(
gae: true,
gamma: 0.99,
gae_lambda: 0.95,
norm_adv: true,
clip_coef: 0.2,
clip_vloss: true,
ent_coef: 0.1,
vf_coef: 0.5,
target_kl: None,
// NOTE(review): presumably decays ent_coef over the run; the schedule and
// final value are not specified in this file — confirm in the trainer.
anneal_entropy: true,
),
// Rollout settings.
rollout: RolloutConfig(
// steps * num_envs = 1024. total_timesteps below is 2000, which is less than
// two such rollouts (2048) — NOTE(review): confirm how the trainer rounds.
steps: 1024,
num_envs: 1,
processes: 1,
),
// Optional sections left unset.
eval: None,
vf_net: None,
// Top-level run options.
name: "config",
seed: 1,
total_timesteps: 2000,
max_train_time: None,
torch_deterministic: true,
// NOTE(review): cuda is enabled together with torch_deterministic; behaviour
// on a machine without a GPU is not visible from this file — confirm.
cuda: true,
// track is false; the two wandb_* values below are presumably only used when
// it is true — verify.
track: false,
wandb_project_name: "enn-ppo",
wandb_entity: "entity-neural-network",
capture_samples: None,
capture_logits: false,
capture_samples_subsample: 1,
trial: None,
// "." — presumably resolved relative to the working directory; TODO confirm.
data_dir: ".",
cuda_empty_cache: false,
)