forked from kakaoenterprise/JORLDY
-
Notifications
You must be signed in to change notification settings - Fork 0
/
atari.py
50 lines (46 loc) · 1.03 KB
/
atari.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
### PPO Atari Config ###
# Environment settings for the PPO Atari configuration.
env = {
    # "name" is deliberately not set here; supply it on the command line, e.g.
    #   python main.py --config config.AGENT.atari --env.name breakout
    "render": False,
    # Observation image options.
    "gray_img": True,
    "img_width": 84,
    "img_height": 84,
    "stack_frame": 4,
    # Stepping / episode options (semantics live in the env wrapper;
    # presumably the usual Atari preprocessing switches -- confirm there).
    "no_op": True,
    "skip_frame": 4,
    "reward_clip": True,
    "episodic_life": True,
}
# Agent settings for the PPO Atari configuration.
agent = {
    # Agent / model selection. These are string identifiers; presumably they
    # are resolved by the project's agent and network registries -- confirm
    # against the config loader.
    "name": "ppo",
    "network": "discrete_policy_value",
    "head": "cnn",
    # Numeric hyperparameters.
    "gamma": 0.99,
    "batch_size": 32,
    "n_step": 128,  # also reused by train["update_period"] in this file
    "n_epoch": 3,
    "_lambda": 0.95,
    "epsilon_clip": 0.1,
    "vf_coef": 1.0,
    "ent_coef": 0.01,
    "clip_grad_norm": 1.0,
    "use_standardization": True,
}
# Optimizer settings for the PPO Atari configuration: the optimizer is picked
# by its string name and given a single learning-rate value.
optim = {
    "name": "adam",
    "lr": 2.5e-4,
}
# Training-run settings for the PPO Atari configuration.
train = {
    "training": True,
    "load_path": None,
    # Step budget and reporting / checkpoint / recording intervals.
    "run_step": 10_000_000,
    "print_period": 10_000,
    "save_period": 100_000,
    "eval_iteration": 5,
    "record": True,
    "record_period": 500_000,
    # distributed setting
    "distributed_batch_size": 256,
    # Reuses agent["n_step"] instead of repeating the literal, so the two
    # values stay in sync when the agent setting is edited.
    "update_period": agent["n_step"],
    "num_workers": 8,
}