-
Notifications
You must be signed in to change notification settings - Fork 7
/
Copy pathdagger_constants.py
75 lines (64 loc) · 2.28 KB
/
dagger_constants.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
# -*- coding: utf-8 -*-
LOCAL_T_MAX = 5 # repeat step size
RMSP_ALPHA = 0.99 # decay parameter for RMSProp
RMSP_EPSILON = 0.1 # epsilon parameter for RMSProp
CHECKPOINT_DIR = 'checkpoints'
LOG_FILE = 'logs'
INITIAL_ALPHA_LOW = 1e-4 # log_uniform low limit for learning rate
INITIAL_ALPHA_HIGH = 1e-2 # log_uniform high limit for learning rate
ACTION_SIZE = 4 # action size
# log_uniform interpolate rate for learning rate (around 7 * 10^-4)
INITIAL_ALPHA_LOG_RATE = 0.4226
GAMMA = 0.99 # discount factor for rewards
ENTROPY_BETA = 0.01 # entropy regurarlization constant
MAX_TIME_STEP = 10.0 * 10**6 # 10 million frames
GRAD_NORM_CLIP = 40.0 # gradient norm clipping
USE_GPU = True # To use GPU, set True
NUM_CPU = 8
VERBOSE = True
SCREEN_WIDTH = 84
SCREEN_HEIGHT = 84
HISTORY_LENGTH = 4
NUM_EVAL_EPISODES = 1 # number of episodes for evaluation
VERBOSE_EVAL = True
EVAL_INIT_LOC = 433
TASK_TYPE = 'navigation' # no need to change
# DAGGER IMITATION LEARNING SPECIFIC
INITIAL_DIFFIDENCE_RATE = 0
PARALLEL_SIZE = 32 # parallel thread size
# TRAIN_TASK_LIST = {
# 'bathroom_02' : ['26', '37', '43', '53'],
# 'bedroom_04' : ['134', '264', '320', '384'],
# 'kitchen_02' : ['90', '136', '157', '207'],
# 'living_room_08' : ['92', '135', '193', '228']
# }
# TEST_TASK_LIST = {
# 'bathroom_02' : ['26', '37', '43', '53', '69'],
# 'bedroom_04' : ['134', '264', '320', '384', '387'],
# 'kitchen_02' : ['90', '136', '157', '207', '329'],
# 'living_room_08' : ['92', '135', '193', '228', '254']
# }
# VALID_TASK_LIST = {
# 'bathroom_02' : ['26', '69'],
# 'bedroom_04' : ['134', '387'],
# 'kitchen_02' : ['90', '329'],
# 'living_room_08' : ['92', '254']
# }
TRAIN_TASK_LIST = {
'bathroom_02': ['26', '37', '43', '53', '16', '28', '32', '41']
# 'living_room_08': ['92', '135', '193', '228', '132', '251', '303', '13'],
}
VALID_TASK_LIST = {
'bathroom_02': ['27', '38', '40', '54', '32', '48', '52', '45']
# 'living_room_08': ['104', '131', '197', '240', '164', '247', '300', '17'],
}
TEST_TASK_LIST = {
'living_room_08': ['256', '252', '171', '393', '312', '344', '387', '79'],
}
NUM_VAL_EPISODES = 20
VALIDATE = False
DYNAMIC_VALIDATE = True
VALIDATE_FREQUENCY = 50000
SUCCESS_CUTOFF = 500
MAX_VALID_STEPS = 1000
ENCOURAGE_SYMMETRY = False