-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathconfig-example.jsonc
107 lines (107 loc) · 2.04 KB
/
config-example.jsonc
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
// Example configuration: a PPO-trained ActorCritic model on the Ms. Pac-Man ROM.
// This file is JSONC (JSON with comments); a strict JSON parser will reject it.
{
// Emulator / observation preprocessing settings.
"environment": {
"rom_file": "roms/ms_pacman/ms_pacman.bin",
// NOTE(review): presumably controls whether losing a life is reported as episode end - confirm against the environment code.
"end_episode_on_life_loss": false,
"clip_reward": false, // clip with the agent instead so the displayed score is correct (see agent.rewards below)
// NOTE(review): presumably the number of emulator frames each action is repeated for - confirm.
"frame_skip": 4,
// NOTE(review): presumably the upper bound on no-op frames applied at reset - confirm.
"noop_reset_max_frames": 10,
// NOTE(review): presumably the number of consecutive frames stacked into one observation - confirm.
"frame_stack": 4,
"grayscale": true,
// NOTE(review): presumably selects float vs integer observation storage - confirm.
"use_float": false,
// Both dimensions are 84, so the width/height ordering cannot be determined from this example.
"output_resolution": [
84,
84
]
},
// NOTE(review): units of the two save periods (steps, episodes, updates) are not stated here - confirm.
"observation_save_period": 500,
"observation_gif_save_period": 1000,
// Agent settings: parallel environments, devices, training algorithm, reward handling and model.
"agent": {
// NOTE(review): presumably the number of environments run in parallel - confirm.
"env_count": 8,
"cuda_devices": [
-1 // use all available cuda devices
],
"train_algorithm": {
"train_algorithm_type": "PPO",
// NOTE(review): presumably rollout length per environment between updates - confirm.
"horizon_steps": 256,
// NOTE(review): 5000 is small next to horizon_steps * env_count (256 * 8 = 2048);
// if this counts environment steps, training ends after only a few updates.
// Likely intentional for a quick example run - raise it for real training.
"total_timesteps": 5000,
// NOTE(review): presumably a nonzero value resumes from that timestep - confirm.
"start_timestep": 0,
// NOTE(review): presumably optimisation epochs per rollout and mini-batches per epoch - confirm.
"num_epoch": 4,
"num_mini_batch": 4,
// NOTE(review): how kl_target is used (early stop vs. adaptive penalty) is not visible here - confirm.
"kl_target": 0.03,
"clip_range_policy": 0.1,
// clip_range_vf presumably only takes effect when clip_vf is true - confirm.
"clip_vf": true,
"clip_range_vf": 0.1,
// Weights of the individual loss terms.
"entropy_coef": 0.01,
"policy_loss_coef": 1.0,
"value_loss_coef": 0.5,
// gamma is a list; presumably one discount factor per reward stream
// (compare rewards.combine_rewards below) - confirm.
"gamma": [
0.996
],
"gae_lambda": 0.95,
"optimiser": {
"type": "Adam",
"epsilon": 1e-8,
"learning_rate": 0.00025,
// NOTE(review): presumably the floor the schedule decays towards - confirm.
"learning_rate_min": 0.000001,
"lr_schedule_type": "Linear",
// NOTE(review): how lr_decay_rate interacts with the Linear schedule is not visible here - confirm.
"lr_decay_rate": 1.0,
"grad_norm_clip": 0.5
}
},
// Reward clamping done on the agent side; environment.clip_reward is false above so the displayed score stays unclipped.
"rewards": {
"reward_clamp_min": -1.0,
"reward_clamp_max": 1.0,
// NOTE(review): presumably merges multiple reward streams into one when true - confirm.
"combine_rewards": false
},
"model": {
"model_type": "ActorCritic",
// "gru_hidden_size": 512, // Uncomment to use recurrent model
// Ordered list of feature extractor stages; only one (a CNN) is configured here.
"feature_extractor": [
{
// Nature CNN
"type": "CNN",
// Layer entries alternate between a Conv2d definition and an activation-only entry.
"layers": [
{
"type": "Conv2d",
"out_channels": 32,
"kernel_size": 8,
"stride": 4
},
{
"activation": "ReLU"
},
{
"type": "Conv2d",
"out_channels": 64,
"kernel_size": 4,
"stride": 2
},
{
"activation": "ReLU"
},
{
"type": "Conv2d",
"out_channels": 64,
"kernel_size": 3,
"stride": 1
},
{
"activation": "ReLU"
}
]
}
],
// NOTE(review): presumably the trunk shared by the actor and critic heads, applied after the feature extractor - confirm.
"shared": {
"layers": [
{
"type": "Linear",
"size": 512
},
{
"activation": "ReLU"
}
]
}
}
}
}