available_demo_1
This commit is contained in:
@@ -17,7 +17,7 @@ params:
|
||||
name: default
|
||||
sigma_init:
|
||||
name: const_initializer
|
||||
val: 1.0
|
||||
val: 0.80
|
||||
fixed_sigma: False
|
||||
mlp:
|
||||
units: [512, 256, 128]
|
||||
@@ -41,20 +41,20 @@ params:
|
||||
normalize_advantage: True
|
||||
gamma: 0.99
|
||||
tau: 0.95
|
||||
learning_rate: 5e-4
|
||||
learning_rate: 3e-4
|
||||
lr_schedule: adaptive
|
||||
kl_threshold: 0.01
|
||||
kl_threshold: 0.013
|
||||
score_to_win: 20000
|
||||
max_epochs: 500000
|
||||
save_best_after: 50
|
||||
save_frequency: 100
|
||||
grad_norm: 1.0
|
||||
entropy_coef: 0.01
|
||||
grad_norm: 0.8
|
||||
entropy_coef: 0.00008
|
||||
truncate_grads: True
|
||||
bounds_loss_coef: 0.01
|
||||
e_clip: 0.2
|
||||
horizon_length: 256
|
||||
minibatch_size: 65536
|
||||
horizon_length: 192
|
||||
minibatch_size: 49152
|
||||
mini_epochs: 4
|
||||
critic_coef: 1
|
||||
clip_value: True
|
||||
Reference in New Issue
Block a user