-
Notifications
You must be signed in to change notification settings - Fork 0
/
config.yaml
34 lines (30 loc) · 1.3 KB
/
config.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
# Filename: config.yaml
# Description: Contains the configuration variables for the navigation project
# Author: Thomas Wood (odell.wood@gmail.com)
# Settings for the Unity environment
Environment:
  # Location of the environment executable
  Filepath: '/data/Banana_Linux_NoVis/Banana.x86_64'
  # Score cutoff that counts as success
  Success: 13.0
# Settings for the DQN agent
Agent:
  # Size of the replay buffer
  Buffer_size: 100000
  # Size of each minibatch
  Batch_size: 64
  # Discount factor
  Gamma: 0.99
  # Coefficient for the soft update of the target parameters
  Tau: 0.001
  # Learning rate
  Lr: 0.0005
  # How often the network is updated
  Update_every: 4
  # Index of the agent in the environment
  Brain_index: 0
# Hyperparameters used during optimization
Training:
  # Number of episodes
  Number_episodes: 2000
  # Maximum number of timesteps per episode
  Max_timesteps: 1000
  # Starting epsilon value for the e-Greedy agent
  Eps_start: 1.0
  # Minimum epsilon value for the e-Greedy agent.
  # NOTE(review): this key previously had no value and therefore loaded as
  # null. 0.01 is the customary DQN floor -- confirm it matches the value
  # used for the reported results.
  Eps_end: 0.01
  # How much epsilon decays during each episode
  Eps_decay: 0.995
  # Presumably selects training (vs. evaluation) mode -- TODO confirm
  # against the code that reads this key.
  Train_mode: true
  # Presumably the number of recent episodes in the score window that is
  # compared against Environment.Success -- TODO confirm.
  Score_window: 100
# Hyperparameters that define the network architecture
Model:
  # Dimensionality of the first fully connected layer
  fc1_size: 100
  # Dimensionality of the second fully connected layer
  fc2_size: 100