AnnaMats committed on
Commit
df142c3
·
1 Parent(s): ff1137d

Upload configuration.yaml

Browse files
Files changed (1) hide show
  1. configuration.yaml +32 -0
configuration.yaml ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
+behaviors:
+  Pyramids:
+    trainer_type: ppo
+    hyperparameters:
+      batch_size: 128
+      buffer_size: 2048
+      learning_rate: 0.0003
+      beta: 0.01
+      epsilon: 0.2
+      lambd: 0.95
+      num_epoch: 3
+      learning_rate_schedule: linear
+    network_settings:
+      normalize: false
+      hidden_units: 512
+      num_layers: 2
+      vis_encode_type: simple
+    reward_signals:
+      extrinsic:
+        gamma: 0.99
+        strength: 1.0
+      rnd:
+        gamma: 0.99
+        strength: 0.01
+        network_settings:
+          hidden_units: 64
+          num_layers: 3
+        learning_rate: 0.0001
+    keep_checkpoints: 5
+    max_steps: 1000000
+    time_horizon: 128
+    summary_freq: 30000