# config.yml
# Environment settings. Every key below is a child of `environment_config`.
environment_config:
  n_agents: 20
  n_dim: 2
  ep_length: 20
  freeze: true
  fps: 0.8
  use_actual_best: true
  reward_type: full
  opt_bound: 0.9
  envs_cache_path: 'envRegistry.pkl'
# Policy hyperparameters. Every key below is a child of `policy_config`.
policy_config:
  state_dim: 4
  action_dim: 1
  init_std: 0.3
  std_min: 0.05
  std_max: 0.3
  std_type: 'linear_decay'
  fixed_std: true
  std_pow: 1
  std_switch_time: 4000
  hidden_dim: [32, 32]
  lr: 0.00001
  # NOTE(review): a single scalar is given here; confirm the consumer does not
  # expect a pair of beta coefficients.
  betas: 0.999
  gamma: 0.9
  K_epochs: 32
  eps_clip: 0.2
  # Quoted on purpose: a plain `None` is the string "None" in YAML, not null.
  # NOTE(review): confirm the consumer expects the string rather than null.
  initialization: 'None'
  pretrained: false
  learn_std: false
  # Same as `initialization`: this is the string "None", not null.
  activation: 'None'
  decay_rate: 0.001
  # Explicit null; a bare `ckpt_folder:` parses to the same value.
  ckpt_folder: null
  std_mode: hybrid
# Policy settings under `test_policy_config`. Every key below is a child of
# that mapping.
test_policy_config:
  init_std: 0.3
  std_min: 0.05
  std_max: 0.3
  # `std_type` used to be declared twice in this mapping: first 'euclidean',
  # later linear_decay. Duplicate keys are invalid YAML; parsers that accept
  # them keep the last value, so linear_decay is the one retained here.
  # NOTE(review): confirm 'euclidean' was not the intended setting.
  std_type: linear_decay
  fixed_std: true
  std_decay_rate: 0.02
  learn_std: true
  std_mode: hybrid
  # NOTE(review): the key says "folder" but the value looks like a file path;
  # confirm how the consumer resolves it.
  ckpt_folder: models/model.pth
  state_dim: 4
  action_dim: 1
  hidden_dim: [32, 32]
  pretrained: true
  # Quoted on purpose: a plain `None` is the string "None" in YAML, not null.
  # NOTE(review): confirm the consumer expects the string rather than null.
  initialization: 'None'
  lr: 0.00001
  betas: 0.999
  gamma: 0.9
  K_epochs: 32
  eps_clip: 0.2
# Run settings. `n_run` is a child of `run_config`.
run_config:
  n_run: 5
# Training-loop settings. Every key below is a child of `train_config`.
# NOTE(review): units of the *_interval / *_timestep / save_cutoff values
# (episodes vs. steps) are not visible here; check the consumer.
train_config:
  max_episodes: 1000
  use_gbest: false
  update_timestep: 50
  save_interval: 100
  render_interval: 100
  decay_timestep: 50
  log_interval: 100
  save_cutoff: 50