-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathparams.yaml_old
46 lines (46 loc) · 1.03 KB
/
params.yaml_old
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
# Top-level run settings: environment id, seeding, device and schedule.
env_name: ASTEnv
seed: 1
cuda: true
cuda_deterministic: false
num_processes: 8
num_steps: 128
# NOTE(review): interval units (updates vs. environment steps) are not
# visible in this file - confirm against the training loop.
log_interval: 1
eval_interval: 1000
save_interval: 100
# Exponent notation is read as a float (1e8) by YAML parsers; presumably the
# consumer casts it to an integer - verify.
num_env_steps: 1.0e+8
use_linear_lr_decay: true
# Training environment settings.
# The keys are nested under `env` so the section is a real mapping rather
# than a null value followed by loose top-level keys, and so they cannot
# collide with same-named keys belonging to other sections.
env:
  max_episode_steps: 1
  perturbation: 0
  assignment_dir: /RL_env/data/generated_tests/binary_tests/train
  num_assignments: 7
  # Both lists carry one entry per assignment (7 entries each).
  code_per_assignment: [117, 28, 48, 15, 7, 2, 2]
  cursor_start_pos: [1, 4, 2, 6, 8, 10, 12]
  # Alternative single-assignment setup, kept for reference:
  # num_assignments: 1
  # code_per_assignment: [9]
  # cursor_start_pos: [6]
# Evaluation environment settings.
# The keys are nested under `eval` so the section is a real mapping rather
# than a null value followed by loose top-level keys.
# NOTE(review): `eval` is kept as a top-level section; if the loader expects
# it inside the environment section instead, move it there - confirm.
eval:
  perturbation: 0
  assignment_dir: /RL_env/data/generated_tests/binary_tests/test
  num_assignments: 6
  # Both lists carry one entry per assignment (6 entries each).
  code_per_assignment: [26, 4, 14, 4, 2, 1]
  cursor_start_pos: [1, 4, 2, 6, 8, 10]
# Settings grouped under `base` (presumably the policy network base -
# confirm against the model code).
base:
  hidden_size: 128
  # A list of four values rather than a scalar; presumably candidate values
  # for a sweep - verify how the loader selects one.
  num_layers: [11, 12, 13, 14]
  embedding_size: 100
  cursor: true
# PPO hyperparameters, nested under `ppo` so the section is a mapping rather
# than a null value followed by loose top-level keys.
ppo:
  # A list of four learning rates rather than a scalar; presumably candidate
  # values for a sweep - verify how the loader selects one.
  lr: [5.0e-5, 1.0e-5, 5.0e-6, 1.0e-6]
  eps: 1.0e-5
  value_loss_coef: 0.5
  max_grad_norm: 0.5
  ppo_epoch: 4
  num_mini_batch: 4
  clip_param: 0.1
  entropy_coef: 0.01
# Return-computation settings, nested under `return` so the section is a
# mapping rather than a null value followed by loose top-level keys.
# NOTE(review): `use_proper_time_limits` is grouped here because it is the
# last key after `return:`; confirm the loader reads it from this section.
return:
  gamma: 0.99
  use_gae: true
  gae_lambda: 0.95
  use_proper_time_limits: false