forked from miyosuda/unreal
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathconstants.py
More file actions
33 lines (27 loc) · 1.13 KB
/
constants.py
File metadata and controls
33 lines (27 loc) · 1.13 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
# -*- coding: utf-8 -*-
# Hyper-parameters and run-time settings, grouped by purpose.

# --- Environment -------------------------------------------------------------
# ENV_TYPE is one of 'lab', 'gym' or 'maze'.
ENV_TYPE = 'lab'
ENV_NAME = 'seekavoid_arena_01'
# Alternative settings kept from the original file:
#   ENV_NAME = 'stairway_to_melon'
#   ENV_NAME = 'nav_maze_static_01'
#   ENV_TYPE = 'gym' together with ENV_NAME = 'Breakout-v0'

# --- Output locations --------------------------------------------------------
CHECKPOINT_DIR = '/tmp/unreal_checkpoints'
LOG_FILE = '/tmp/unreal_log/unreal_log'

# --- Execution ---------------------------------------------------------------
USE_GPU = True               # set True to use the GPU
PARALLEL_SIZE = 8            # parallel thread size
LOCAL_T_MAX = 20             # repeat step size
MAX_TIME_STEP = 10 ** 8
SAVE_INTERVAL_STEP = 100000

# --- Learning rate (sampled log-uniformly) -----------------------------------
INITIAL_ALPHA_LOW = 0.0001       # log_uniform low limit for learning rate
INITIAL_ALPHA_HIGH = 0.005       # log_uniform high limit for learning rate
INITIAL_ALPHA_LOG_RATE = 0.5     # log_uniform interpolate rate for learning rate

# --- RMSProp / gradients -----------------------------------------------------
RMSP_ALPHA = 0.99            # decay parameter for RMSProp
RMSP_EPSILON = 0.1           # epsilon parameter for RMSProp
GRAD_NORM_CLIP = 40.0        # gradient norm clipping

# --- Loss terms --------------------------------------------------------------
GAMMA = 0.99                 # discount factor for rewards
ENTROPY_BETA = 0.001         # entropy regularization constant
PIXEL_CHANGE_LAMBDA = 0.05   # 0.01 ~ 0.1 for Lab, 0.0001 ~ 0.01 for Gym

# --- Experience replay and auxiliary tasks -----------------------------------
EXPERIENCE_HISTORY_SIZE = 2000   # experience replay buffer size
USE_PIXEL_CHANGE = True
USE_VALUE_REPLAY = True
USE_REWARD_PREDICTION = True