-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathconfig1.py
51 lines (40 loc) · 1.82 KB
/
config1.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
#path variables
import os
abs_path = os.path.dirname(__file__)
args = {
# env setting
"game_url": "http://www.aboutsamyuen.com/projects/chrome_dino_js/index.html",
"chrome_driver_path": "/usr/lib/chromium-browser/chromedriver",
"train": 'test', # 'train', 'test'
"init_script": "document.getElementsByClassName('runner-canvas')[0].id = 'runner-canvas'", #create id for canvas for faster selection from DOM
"getbase64Script": "canvasRunner = document.getElementById('runner-canvas'); \
return canvasRunner.toDataURL().substring(22)", #get image from canvas
"img_rows": 80,
"img_cols": 80,
"img_channels": 4, #We stack 4 frames
"checkpoint" : "./weights/double_dqn_high1.pth",
"SAVE_EVERY": 100000,
"num_test_episode": 100,
"cam_visualization": False, # real-time Grad CAM visualization (XAI)
"TEST_EVERY": 50,
"SAVE_GIF": False,
"SLEEP": 0.007, # using sleep() to control the fps in testing
# hypyerparameter
"algorithm": "DoubleDQN",
"EPISODE": 5000,
"ACTIONS": 2, # possible actions: jump, duck () and do nothing
"GAMMA": 0.99, # decay rate of past observations original 0.99
"OBSERVATION": 2000, # timesteps to observe before training
"FINAL_EPSILON": 1e-1, # final value of epsilon
"INITIAL_EPSILON": 1, # starting value of epsilon (initial randomness)
"EPSILON_DECAY": 0.9999925, #0.999975
"REPLAY_MEMORY": 100000, # number of previous transitions to remember
"BATCH": 32, # size of minibatch
"FRAME_PER_ACTION": 1,
"lr": 1e-4,
"weight_decay": 1e-4,
"SYNC_EVERY": 1e4, # no. of experiences between Q_target & Q_online sync
"TRAIN_EVERY": 3,
"prioritized_replay": False, # FPS is slower than unprioritized and needs larger RAM (>40GB) otherwise killed
"grad_norm_clipping": 10, # prevent gradien explosion
}