# Importing libraries
import os
import numpy as np
import random
import math
from collections import deque
import collections
import pickle
# for building DQN model
from keras import layers
from keras import Sequential
from keras.layers import Dense, Activation, Flatten
from tensorflow.keras.optimizers import Adam
# for plotting graphs
import matplotlib.pyplot as plt
# Import the environment
from Env import CabDriver
import glob
import os
# Module-level environment instance; the tracking helper save_tracking_states()
# and the DQNAgent methods read this global `env` directly.
# (It is created again, under the same name, in the training script further down.)
env = CabDriver()
# Loading the time matrix provided
# Read from "TM.npy" in the current working directory; it is later passed to
# env.reward_func() and env.next_state_func() by the training loop.
Time_matrix = np.load("TM.npy")
# Nested mapping state -> action -> list of Q-values recorded over training.
states_track = collections.defaultdict(dict)


def initialise_states_for_tracking():
    """Register the sample (state, action) pairs whose Q-values are tracked.

    Each pair gets a fresh, empty list in ``states_track``; calling this
    again resets any history already stored for those pairs.
    save_tracking_states() appends to these lists.
    """
    tracked_pairs = (
        ((4, 3, 2), (4, 1)),
        ((0, 0, 0), (0, 4)),
    )
    for tracked_state, tracked_action in tracked_pairs:
        # One history list per (state, action) pair.
        states_track[tracked_state][tracked_action] = []
# Defining a function to save the tracked Q-values in the dictionary
def save_tracking_states():
    """Record the network's current Q-value for every tracked (state, action).

    For each state in the module-level ``states_track`` mapping, the state is
    encoded with ``env.state_trans``, run through ``agent.model`` once, and the
    predicted Q-value of each tracked action is appended to that action's
    history list.

    Relies on the module-level ``env``, ``agent`` and ``states_track`` objects.

    Raises:
        ValueError: if a tracked action is not present in ``env.action_space``
            (raised by ``list.index``).
    """
    print("saving states...")
    for state, tracked_actions in states_track.items():
        if not tracked_actions:
            # Nothing to record for this state; skip the forward pass.
            continue
        # The encoding and the prediction depend only on the state, so they
        # are computed once per state rather than once per tracked action.
        state_encod = np.reshape(env.state_trans(state), [1, agent.state_size])
        prediction = agent.model.predict(state_encod)
        for action, history in tracked_actions.items():
            action_index = env.action_space.index(action)
            history.append(prediction[0][action_index])
# Helper that pickles an object to "<name>.pkl"
def save_obj(obj, name):
    """Serialise ``obj`` with pickle into the file ``name + '.pkl'``.

    Args:
        obj: Any picklable object.
        name: Destination path without the ``.pkl`` extension.
    """
    destination = name + '.pkl'
    with open(destination, 'wb') as sink:
        writer = pickle.Pickler(sink, pickle.HIGHEST_PROTOCOL)
        writer.dump(obj)
If you are using this framework, you need to fill in the following to complete the code block below:
- State and Action Size
- Hyperparameters
- Create a neural-network model in function 'build_model()'
- Define epsilon-greedy strategy in function 'get_action()'
- Complete the function 'append_sample()'. This function appends the recent experience tuple <state, action, reward, new-state> to the memory
- Complete the 'train_model()' function with following logic:
- If the memory size is greater than mini-batch size, you randomly sample experiences from memory as per the mini-batch size and do the following:
- Initialise your input and output batch for training the model
- Calculate the target Q value for each sample: $r + \gamma \max_{a'} Q(s', a')$
- Get Q(s', a) values from the last trained model
- Update the input batch as your encoded state and output batch as your Q-values
- Then fit your DQN model using the updated input and output batch.
- If the memory size is greater than mini-batch size, you randomly sample experiences from memory as per the mini-batch size and do the following:
We chose to train our model once per episode (on a large mini-batch) instead of after every step, to make better use of parallelization.
# Problem dimensions. The encoded state vector is m + t + d wide and there are
# m * (m - 1) + 1 actions.
# NOTE(review): presumably m = number of locations, t = hours per day and
# d = days per week -- confirm against Env.py.
m = 5
t = 24
d = 7


class DQNAgent:
    """Deep Q-Network agent with an experience-replay buffer.

    The agent owns a single Keras model that maps an encoded state (a vector
    of length ``m + t + d``) to one Q-value per action. It reads the
    module-level ``env`` object for the currently available requests and for
    state encoding.
    """

    def __init__(self, state_size):
        """Set the hyperparameters, the replay memory and the network.

        Args:
            state_size: Accepted for interface compatibility but not used;
                the network input width is always ``m + t + d``.
        """
        # Define size of state and action
        self.state_size = m + t + d
        self.action_size = m * (m - 1) + 1
        # [0, 0] plus every ordered pair [i, j] with i != j.
        self.action_space = [[i, j] for i in range(m) for j in range(m) if i != j or i == 0]

        # These are hyper parameters for the DQN
        self.discount_factor = 0.95
        self.learning_rate = 0.01
        # epsilon = min + (max - min) * exp(-decay * episode), see get_action()
        self.epsilon_max = 1.0
        self.epsilon_decay = 0.0009
        self.epsilon_min = 0.00000001
        self.batch_size = 2048 * 3

        # create replay memory using deque (oldest samples drop out when full)
        self.memory = deque(maxlen=2048 * 64)

        # create the Q-network
        self.model = self.build_model()

    # approximate Q function using Neural Network
    def build_model(self):
        """Build and compile the Q-network.

        Returns:
            A compiled Keras ``Sequential`` model: two hidden ReLU layers of
            32 units and a linear output layer with one unit per action,
            trained with MSE loss and the Adam optimizer.
        """
        model = Sequential()
        model.add(Dense(32, input_dim=self.state_size, activation='relu'))
        model.add(Dense(32, activation='relu'))
        model.add(Dense(self.action_size, activation='linear'))
        model.compile(loss='mse', optimizer=Adam(learning_rate=self.learning_rate))
        # summary is a method; the bare attribute access used before did nothing.
        model.summary()
        return model

    def get_action(self, state, episode):
        """Choose an action for ``state`` with an epsilon-greedy policy.

        Args:
            state: Current environment state, passed to ``env.requests`` and
                ``env.state_trans``.
            episode: Episode index; epsilon decays exponentially with it.

        Returns:
            A tuple ``(action, epsilon)`` with the chosen action and the
            exploration rate used for this decision.
        """
        poss_actions_index, poss_actions = env.requests(state)
        epsilon = self.epsilon_min + (self.epsilon_max - self.epsilon_min) * np.exp(-self.epsilon_decay * episode)

        if np.random.rand() <= epsilon:
            # Exploration: pick one of the currently possible actions at random.
            # NOTE(review): this looks the action up in self.action_space,
            # which assumes the indices returned by env.requests follow the
            # same ordering as this agent's action list -- confirm in Env.py.
            action_index = np.random.choice(poss_actions_index)
            action = self.action_space[action_index]
        else:
            # Exploitation: the possible action with the highest predicted Q-value.
            state_encod = np.reshape(env.state_trans(state), [1, self.state_size])
            q_value = self.model.predict(state_encod)
            q_value = q_value[0][poss_actions_index]
            action = poss_actions[np.argmax(q_value)]
        return action, epsilon

    # save sample <s,a,r,s'> to the replay memory
    def append_sample(self, state, action, reward, next_state, terminal_state):
        """Store one transition, including its terminal flag, in the replay memory."""
        self.memory.append((state, action, reward, next_state, terminal_state))

    @staticmethod
    def _bellman_targets(current_q, next_q, actions, rewards, terminal_states, discount_factor):
        """Write the Q-learning targets for the taken actions into ``current_q``.

        For sample ``i`` the entry ``current_q[i, actions[i]]`` becomes
        ``rewards[i]`` if the transition was terminal, otherwise
        ``rewards[i] + discount_factor * max(next_q[i])``. All other entries
        are left untouched. ``current_q`` is modified in place and returned.
        """
        rewards = np.asarray(rewards, dtype=float)
        done = np.asarray(terminal_states, dtype=bool)
        bootstrapped = rewards + discount_factor * np.amax(next_q, axis=1)
        rows = np.arange(len(actions))
        current_q[rows, actions] = np.where(done, rewards, bootstrapped)
        return current_q

    # pick samples randomly from replay memory (with batch_size) and train the network
    def train_model(self):
        """Run one training step on a random mini-batch from the replay memory.

        Does nothing (returns ``None``) until the memory holds at least
        ``batch_size`` samples.
        """
        if len(self.memory) < self.batch_size:
            return
        print('Training...')

        # Sample batch from the memory
        mini_batch = random.sample(self.memory, self.batch_size)
        states = np.zeros((self.batch_size, self.state_size))
        next_states = np.zeros((self.batch_size, self.state_size))
        actions, rewards, terminal_states = [], [], []

        for i, (state, action, reward, next_state, terminal_state) in enumerate(mini_batch):
            actions.append(self.action_space.index(list(action)))
            rewards.append(reward)
            terminal_states.append(terminal_state)
            states[i] = env.state_trans(state)
            next_states[i] = env.state_trans(next_state)

        # Q(s, .) and Q(s', .) both come from the same (only) network.
        target = self.model.predict(states)
        target_val = self.model.predict(next_states)

        # get your target Q-value on the basis of terminal state
        target = self._bellman_targets(
            target, target_val, actions, rewards, terminal_states, self.discount_factor
        )

        self.model.fit(states, target, batch_size=self.batch_size, epochs=1, verbose=0)

    def save(self, name):
        """Write the network weights to the file ``name``."""
        self.model.save_weights(name)

    def load(self, name):
        """Load network weights from the file ``name``."""
        self.model.load_weights(name)
# Make sure the output directory for the pickled checkpoints exists
# (exist_ok avoids the check-then-create race of exists() + mkdir()).
os.makedirs("saved_pickle_files", exist_ok=True)

# Initialising the environment
env = CabDriver()
# get size of state and action from environment
state_size = len(env.state_space)
action_space = env.action_space
Time_matrix = np.load("TM.npy")
state_space = env.state_space
start_episode = 0

# agent needs to be initialised outside the loop since the DQN
# network will be initialised along with the agent
agent = DQNAgent(state_size)

# To resume an interrupted run, load the saved weights and set the episode
# index to restart from:
# agent.load('./cab_driver.h5')
# start_episode = 2400 # Index of the episode to restart training from

# tracking average reward per episode = total rewards in an episode/ total steps in an episode
avg_reward = []

# tracking total rewards per episode
total_reward = []

initialise_states_for_tracking()

Episodes = 20000
for episode in range(start_episode, Episodes):
    # tracking total rewards, step count
    tot_reward = 0
    step_count = 0
    state = env.reset()
    terminal_state = False
    # Refresh the module-level alias (it is not read inside this loop).
    state_space = env.state_space

    # Play one full episode, storing every transition in the replay memory.
    while not terminal_state:
        action, epsilon = agent.get_action(state, episode)
        reward = env.reward_func(state, action, Time_matrix)
        next_state, terminal_state = env.next_state_func(state, action, Time_matrix)
        # save the sample <s, a, r, s'> to the replay memory
        agent.append_sample(state, action, reward, next_state, terminal_state)
        tot_reward += reward
        state = next_state
        step_count += 1

    # The loop above exits exactly when the episode is terminal, so the
    # rewards are recorded and reported once per episode.
    avg_reward.append(tot_reward / step_count)
    total_reward.append(tot_reward)
    print("episode:", episode," no of steps:",step_count, " score:", tot_reward, " avg score:", round(tot_reward/step_count,4),
          " memorylength:", len(agent.memory), " epsilon:", epsilon)

    # Every 50th episode: record the tracked Q-values and, except at
    # episode 0, checkpoint the rewards, the tracked states and the weights.
    if episode % 50 == 0:
        save_tracking_states()
        if episode != 0:
            Rewardname = "saved_pickle_files/Rewards"+str(episode)
            Statesname = "saved_pickle_files/States_tracked"+str(episode)
            save_obj(total_reward,Rewardname)
            save_obj(states_track,Statesname)
            agent.save("./cab_driver.h5")

    #Train the model every episode
    agent.train_model()
episode: 0 no of steps: 127 score: -257.0 avg score: -2.0236 memorylength: 127 epsilon: 1.0
saving states...
episode: 1 no of steps: 149 score: -446.0 avg score: -2.9933 memorylength: 276 epsilon: 0.9991004048875233
episode: 2 no of steps: 141 score: -400.0 avg score: -2.8369 memorylength: 417 epsilon: 0.9982016190464211
episode: 3 no of steps: 140 score: -256.0 avg score: -1.8286 memorylength: 557 epsilon: 0.9973036417486767
episode: 4 no of steps: 137 score: -351.0 avg score: -2.562 memorylength: 694 epsilon: 0.9964064722669286
episode: 5 no of steps: 174 score: -208.0 avg score: -1.1954 memorylength: 868 epsilon: 0.9955101098744694
episode: 6 no of steps: 131 score: -220.0 avg score: -1.6794 memorylength: 999 epsilon: 0.9946145538452457
episode: 7 no of steps: 131 score: -320.0 avg score: -2.4427 memorylength: 1130 epsilon: 0.9937198034538567
episode: 8 no of steps: 142 score: -412.0 avg score: -2.9014 memorylength: 1272 epsilon: 0.9928258579755548
episode: 9 no of steps: 129 score: -219.0 avg score: -1.6977 memorylength: 1401 epsilon: 0.9919327166862439
episode: 10 no of steps: 136 score: -253.0 avg score: -1.8603 memorylength: 1537 epsilon: 0.9910403788624799
episode: 11 no of steps: 155 score: -86.0 avg score: -0.5548 memorylength: 1692 epsilon: 0.9901488437814687
episode: 12 no of steps: 170 score: -221.0 avg score: -1.3 memorylength: 1862 epsilon: 0.9892581107210671
episode: 13 no of steps: 128 score: -252.0 avg score: -1.9688 memorylength: 1990 epsilon: 0.988368178959781
episode: 14 no of steps: 155 score: -198.0 avg score: -1.2774 memorylength: 2145 epsilon: 0.987479047776766
episode: 15 no of steps: 145 score: -544.0 avg score: -3.7517 memorylength: 2290 epsilon: 0.9865907164518255
episode: 16 no of steps: 146 score: -237.0 avg score: -1.6233 memorylength: 2436 epsilon: 0.9857031842654111
episode: 17 no of steps: 164 score: -130.0 avg score: -0.7927 memorylength: 2600 epsilon: 0.9848164504986219
episode: 18 no of steps: 124 score: -57.0 avg score: -0.4597 memorylength: 2724 epsilon: 0.9839305144332032
episode: 19 no of steps: 128 score: 104.0 avg score: 0.8125 memorylength: 2852 epsilon: 0.983045375351547
episode: 20 no of steps: 138 score: -100.0 avg score: -0.7246 memorylength: 2990 epsilon: 0.9821610325366904
episode: 21 no of steps: 152 score: -230.0 avg score: -1.5132 memorylength: 3142 epsilon: 0.9812774852723157
episode: 22 no of steps: 136 score: -267.0 avg score: -1.9632 memorylength: 3278 epsilon: 0.9803947328427498
episode: 23 no of steps: 129 score: -88.0 avg score: -0.6822 memorylength: 3407 epsilon: 0.9795127745329629
episode: 24 no of steps: 140 score: -189.0 avg score: -1.35 memorylength: 3547 epsilon: 0.9786316096285689
episode: 25 no of steps: 151 score: -294.0 avg score: -1.947 memorylength: 3698 epsilon: 0.9777512374158239
episode: 26 no of steps: 149 score: -302.0 avg score: -2.0268 memorylength: 3847 epsilon: 0.9768716571816268
episode: 27 no of steps: 133 score: -162.0 avg score: -1.218 memorylength: 3980 epsilon: 0.9759928682135173
episode: 28 no of steps: 130 score: -208.0 avg score: -1.6 memorylength: 4110 epsilon: 0.9751148697996762
episode: 29 no of steps: 148 score: -245.0 avg score: -1.6554 memorylength: 4258 epsilon: 0.9742376612289249
episode: 30 no of steps: 123 score: -271.0 avg score: -2.2033 memorylength: 4381 epsilon: 0.9733612417907244
episode: 31 no of steps: 135 score: -137.0 avg score: -1.0148 memorylength: 4516 epsilon: 0.9724856107751748
episode: 32 no of steps: 142 score: -415.0 avg score: -2.9225 memorylength: 4658 epsilon: 0.9716107674730151
episode: 33 no of steps: 157 score: -291.0 avg score: -1.8535 memorylength: 4815 epsilon: 0.970736711175622
episode: 34 no of steps: 152 score: -396.0 avg score: -2.6053 memorylength: 4967 epsilon: 0.9698634411750099
episode: 35 no of steps: 153 score: -91.0 avg score: -0.5948 memorylength: 5120 epsilon: 0.9689909567638301
episode: 36 no of steps: 134 score: -196.0 avg score: -1.4627 memorylength: 5254 epsilon: 0.9681192572353702
episode: 37 no of steps: 154 score: -399.0 avg score: -2.5909 memorylength: 5408 epsilon: 0.9672483418835535
episode: 38 no of steps: 145 score: -518.0 avg score: -3.5724 memorylength: 5553 epsilon: 0.9663782100029384
episode: 39 no of steps: 164 score: -396.0 avg score: -2.4146 memorylength: 5717 epsilon: 0.9655088608887183
episode: 40 no of steps: 133 score: -95.0 avg score: -0.7143 memorylength: 5850 epsilon: 0.9646402938367201
episode: 41 no of steps: 135 score: -374.0 avg score: -2.7704 memorylength: 5985 epsilon: 0.9637725081434045
episode: 42 no of steps: 140 score: -196.0 avg score: -1.4 memorylength: 6125 epsilon: 0.9629055031058652
episode: 43 no of steps: 147 score: -493.0 avg score: -3.3537 memorylength: 6272 epsilon: 0.962039278021828
Training...
episode: 44 no of steps: 144 score: -388.0 avg score: -2.6944 memorylength: 6416 epsilon: 0.9611738321896504
Training...
episode: 45 no of steps: 147 score: -288.0 avg score: -1.9592 memorylength: 6563 epsilon: 0.9603091649083214
Training...
episode: 46 no of steps: 157 score: -500.0 avg score: -3.1847 memorylength: 6720 epsilon: 0.9594452754774603
Training...
episode: 47 no of steps: 146 score: -199.0 avg score: -1.363 memorylength: 6866 epsilon: 0.9585821631973167
Training...
episode: 48 no of steps: 155 score: -196.0 avg score: -1.2645 memorylength: 7021 epsilon: 0.9577198273687696
Training...
episode: 49 no of steps: 143 score: -352.0 avg score: -2.4615 memorylength: 7164 epsilon: 0.956858267293327
Training...
episode: 50 no of steps: 128 score: -133.0 avg score: -1.0391 memorylength: 7292 epsilon: 0.9559974822731252
saving states...
Training...
episode: 51 no of steps: 144 score: -180.0 avg score: -1.25 memorylength: 7436 epsilon: 0.955137471610928
Training...
episode: 52 no of steps: 143 score: -206.0 avg score: -1.4406 memorylength: 7579 epsilon: 0.9542782346101271
Training...
episode: 53 no of steps: 133 score: -77.0 avg score: -0.5789 memorylength: 7712 epsilon: 0.9534197705747401
Training...
episode: 54 no of steps: 134 score: -454.0 avg score: -3.3881 memorylength: 7846 epsilon: 0.9525620788094115
Training...
episode: 55 no of steps: 137 score: -262.0 avg score: -1.9124 memorylength: 7983 epsilon: 0.9517051586194106
Training...
episode: 56 no of steps: 124 score: -316.0 avg score: -2.5484 memorylength: 8107 epsilon: 0.9508490093106322
Training...
episode: 57 no of steps: 149 score: 75.0 avg score: 0.5034 memorylength: 8256 epsilon: 0.9499936301895952
Training...
episode: 58 no of steps: 126 score: -303.0 avg score: -2.4048 memorylength: 8382 epsilon: 0.9491390205634425
Training...
episode: 59 no of steps: 144 score: 63.0 avg score: 0.4375 memorylength: 8526 epsilon: 0.9482851797399402
Training...
episode: 60 no of steps: 139 score: 15.0 avg score: 0.1079 memorylength: 8665 epsilon: 0.9474321070274773
Training...
episode: 61 no of steps: 137 score: -450.0 avg score: -3.2847 memorylength: 8802 epsilon: 0.9465798017350647
Training...
episode: 62 no of steps: 124 score: -321.0 avg score: -2.5887 memorylength: 8926 epsilon: 0.9457282631723353
Training...
episode: 63 no of steps: 143 score: -152.0 avg score: -1.0629 memorylength: 9069 epsilon: 0.9448774906495425
Training...
episode: 64 no of steps: 138 score: -536.0 avg score: -3.8841 memorylength: 9207 epsilon: 0.9440274834775608
Training...
episode: 65 no of steps: 140 score: -288.0 avg score: -2.0571 memorylength: 9347 epsilon: 0.9431782409678842
Training...
episode: 66 no of steps: 128 score: -316.0 avg score: -2.4688 memorylength: 9475 epsilon: 0.9423297624326262
Training...
episode: 67 no of steps: 143 score: -1.0 avg score: -0.007 memorylength: 9618 epsilon: 0.9414820471845194
Training...
episode: 68 no of steps: 151 score: -248.0 avg score: -1.6424 memorylength: 9769 epsilon: 0.940635094536914
Training...
episode: 69 no of steps: 156 score: -322.0 avg score: -2.0641 memorylength: 9925 epsilon: 0.9397889038037786
Training...
episode: 70 no of steps: 154 score: -33.0 avg score: -0.2143 memorylength: 10079 epsilon: 0.9389434742996985
Training...
episode: 71 no of steps: 131 score: -446.0 avg score: -3.4046 memorylength: 10210 epsilon: 0.9380988053398759
Training...
episode: 72 no of steps: 138 score: -337.0 avg score: -2.442 memorylength: 10348 epsilon: 0.9372548962401288
Training...
episode: 73 no of steps: 128 score: -378.0 avg score: -2.9531 memorylength: 10476 epsilon: 0.9364117463168907
Training...
episode: 74 no of steps: 157 score: 78.0 avg score: 0.4968 memorylength: 10633 epsilon: 0.9355693548872103
Training...
episode: 75 no of steps: 130 score: -65.0 avg score: -0.5 memorylength: 10763 epsilon: 0.9347277212687503
Training...
episode: 76 no of steps: 139 score: -203.0 avg score: -1.4604 memorylength: 10902 epsilon: 0.9338868447797877
Training...
episode: 77 no of steps: 152 score: 84.0 avg score: 0.5526 memorylength: 11054 epsilon: 0.9330467247392122
Training...
episode: 78 no of steps: 149 score: 87.0 avg score: 0.5839 memorylength: 11203 epsilon: 0.9322073604665266
Training...
episode: 79 no of steps: 141 score: -382.0 avg score: -2.7092 memorylength: 11344 epsilon: 0.931368751281846
Training...
episode: 80 no of steps: 140 score: -179.0 avg score: -1.2786 memorylength: 11484 epsilon: 0.9305308965058968
Training...
episode: 81 no of steps: 140 score: -190.0 avg score: -1.3571 memorylength: 11624 epsilon: 0.9296937954600164
Training...
episode: 82 no of steps: 127 score: -288.0 avg score: -2.2677 memorylength: 11751 epsilon: 0.9288574474661532
Training...
episode: 83 no of steps: 136 score: 195.0 avg score: 1.4338 memorylength: 11887 epsilon: 0.9280218518468649
Training...
episode: 84 no of steps: 152 score: -414.0 avg score: -2.7237 memorylength: 12039 epsilon: 0.9271870079253194
Training...
episode: 85 no of steps: 131 score: -330.0 avg score: -2.5191 memorylength: 12170 epsilon: 0.926352915025293
Training...
episode: 86 no of steps: 150 score: 238.0 avg score: 1.5867 memorylength: 12320 epsilon: 0.9255195724711702
Training...
episode: 87 no of steps: 132 score: -150.0 avg score: -1.1364 memorylength: 12452 epsilon: 0.9246869795879437
Training...
episode: 88 no of steps: 138 score: -446.0 avg score: -3.2319 memorylength: 12590 epsilon: 0.923855135701213
Training...
episode: 89 no of steps: 163 score: -281.0 avg score: -1.7239 memorylength: 12753 epsilon: 0.9230240401371846
Training...
episode: 90 no of steps: 123 score: -327.0 avg score: -2.6585 memorylength: 12876 epsilon: 0.9221936922226711
Training...
episode: 91 no of steps: 147 score: -197.0 avg score: -1.3401 memorylength: 13023 epsilon: 0.9213640912850907
Training...
episode: 92 no of steps: 149 score: 70.0 avg score: 0.4698 memorylength: 13172 epsilon: 0.9205352366524665
Training...
episode: 93 no of steps: 146 score: 151.0 avg score: 1.0342 memorylength: 13318 epsilon: 0.9197071276534262
Training...
episode: 94 no of steps: 143 score: -360.0 avg score: -2.5175 memorylength: 13461 epsilon: 0.9188797636172015
Training...
episode: 95 no of steps: 154 score: -73.0 avg score: -0.474 memorylength: 13615 epsilon: 0.9180531438736275
Training...
episode: 96 no of steps: 172 score: -63.0 avg score: -0.3663 memorylength: 13787 epsilon: 0.917227267753142
Training...
episode: 97 no of steps: 151 score: -299.0 avg score: -1.9801 memorylength: 13938 epsilon: 0.9164021345867855
Training...
episode: 98 no of steps: 156 score: -439.0 avg score: -2.8141 memorylength: 14094 epsilon: 0.9155777437062002
Training...
episode: 99 no of steps: 157 score: -289.0 avg score: -1.8408 memorylength: 14251 epsilon: 0.9147540944436291
Training...
episode: 100 no of steps: 154 score: -448.0 avg score: -2.9091 memorylength: 14405 epsilon: 0.9139311861319164
saving states...
Training...
episode: 101 no of steps: 135 score: 111.0 avg score: 0.8222 memorylength: 14540 epsilon: 0.9131090181045063
Training...
episode: 102 no of steps: 140 score: -88.0 avg score: -0.6286 memorylength: 14680 epsilon: 0.9122875896954428
Training...
episode: 103 no of steps: 139 score: -165.0 avg score: -1.1871 memorylength: 14819 epsilon: 0.9114669002393686
Training...
episode: 104 no of steps: 140 score: -315.0 avg score: -2.25 memorylength: 14959 epsilon: 0.9106469490715253
Training...
episode: 105 no of steps: 156 score: -410.0 avg score: -2.6282 memorylength: 15115 epsilon: 0.9098277355277526
Training...
episode: 106 no of steps: 137 score: -279.0 avg score: -2.0365 memorylength: 15252 epsilon: 0.9090092589444873
Training...
episode: 107 no of steps: 143 score: -514.0 avg score: -3.5944 memorylength: 15395 epsilon: 0.9081915186587634
Training...
episode: 108 no of steps: 146 score: -136.0 avg score: -0.9315 memorylength: 15541 epsilon: 0.907374514008211
Training...
episode: 109 no of steps: 139 score: 21.0 avg score: 0.1511 memorylength: 15680 epsilon: 0.9065582443310565
Training...
episode: 110 no of steps: 125 score: 33.0 avg score: 0.264 memorylength: 15805 epsilon: 0.9057427089661214
Training...
episode: 111 no of steps: 153 score: -420.0 avg score: -2.7451 memorylength: 15958 epsilon: 0.904927907252822
Training...
episode: 112 no of steps: 137 score: -482.0 avg score: -3.5182 memorylength: 16095 epsilon: 0.9041138385311689
Training...
episode: 113 no of steps: 140 score: -234.0 avg score: -1.6714 memorylength: 16235 epsilon: 0.9033005021417663
Training...
episode: 114 no of steps: 133 score: -291.0 avg score: -2.188 memorylength: 16368 epsilon: 0.9024878974258117
Training...
episode: 115 no of steps: 160 score: -677.0 avg score: -4.2312 memorylength: 16528 epsilon: 0.9016760237250953
Training...
episode: 116 no of steps: 130 score: 46.0 avg score: 0.3538 memorylength: 16658 epsilon: 0.9008648803819992
Training...
episode: 117 no of steps: 140 score: -118.0 avg score: -0.8429 memorylength: 16798 epsilon: 0.9000544667394974
Training...
episode: 118 no of steps: 139 score: -106.0 avg score: -0.7626 memorylength: 16937 epsilon: 0.8992447821411548
Training...
episode: 119 no of steps: 157 score: -273.0 avg score: -1.7389 memorylength: 17094 epsilon: 0.8984358259311269
Training...
episode: 120 no of steps: 145 score: -223.0 avg score: -1.5379 memorylength: 17239 epsilon: 0.8976275974541589
Training...
episode: 121 no of steps: 146 score: -487.0 avg score: -3.3356 memorylength: 17385 epsilon: 0.8968200960555859
Training...
episode: 122 no of steps: 153 score: 22.0 avg score: 0.1438 memorylength: 17538 epsilon: 0.8960133210813316
Training...
episode: 123 no of steps: 144 score: -88.0 avg score: -0.6111 memorylength: 17682 epsilon: 0.8952072718779083
Training...
episode: 124 no of steps: 149 score: -281.0 avg score: -1.8859 memorylength: 17831 epsilon: 0.894401947792416
Training...
episode: 125 no of steps: 148 score: -342.0 avg score: -2.3108 memorylength: 17979 epsilon: 0.8935973481725422
Training...
episode: 126 no of steps: 144 score: -189.0 avg score: -1.3125 memorylength: 18123 epsilon: 0.8927934723665613
Training...
episode: 127 no of steps: 141 score: -191.0 avg score: -1.3546 memorylength: 18264 epsilon: 0.8919903197233335
Training...
episode: 128 no of steps: 136 score: -271.0 avg score: -1.9926 memorylength: 18400 epsilon: 0.8911878895923055
Training...
episode: 129 no of steps: 145 score: -333.0 avg score: -2.2966 memorylength: 18545 epsilon: 0.8903861813235088
Training...
episode: 130 no of steps: 145 score: -181.0 avg score: -1.2483 memorylength: 18690 epsilon: 0.8895851942675594
Training...
episode: 131 no of steps: 133 score: -306.0 avg score: -2.3008 memorylength: 18823 epsilon: 0.8887849277756579
Training...
episode: 132 no of steps: 144 score: -155.0 avg score: -1.0764 memorylength: 18967 epsilon: 0.8879853811995885
Training...
episode: 133 no of steps: 123 score: -138.0 avg score: -1.122 memorylength: 19090 epsilon: 0.8871865538917182
Training...
episode: 134 no of steps: 133 score: -52.0 avg score: -0.391 memorylength: 19223 epsilon: 0.886388445204997
Training...
episode: 135 no of steps: 134 score: -231.0 avg score: -1.7239 memorylength: 19357 epsilon: 0.8855910544929568
Training...
episode: 136 no of steps: 128 score: -63.0 avg score: -0.4922 memorylength: 19485 epsilon: 0.8847943811097111
Training...
episode: 137 no of steps: 150 score: -438.0 avg score: -2.92 memorylength: 19635 epsilon: 0.8839984244099544
Training...
episode: 138 no of steps: 143 score: -179.0 avg score: -1.2517 memorylength: 19778 epsilon: 0.8832031837489616
Training...
episode: 139 no of steps: 130 score: -351.0 avg score: -2.7 memorylength: 19908 epsilon: 0.8824086584825879
Training...
episode: 140 no of steps: 149 score: -45.0 avg score: -0.302 memorylength: 20057 epsilon: 0.8816148479672676
Training...
episode: 141 no of steps: 137 score: -186.0 avg score: -1.3577 memorylength: 20194 epsilon: 0.8808217515600143
Training...
episode: 142 no of steps: 128 score: 118.0 avg score: 0.9219 memorylength: 20322 epsilon: 0.8800293686184198
Training...
episode: 143 no of steps: 118 score: -96.0 avg score: -0.8136 memorylength: 20440 epsilon: 0.879237698500654
Training...
episode: 144 no of steps: 136 score: -475.0 avg score: -3.4926 memorylength: 20576 epsilon: 0.8784467405654639
Training...
episode: 145 no of steps: 138 score: -103.0 avg score: -0.7464 memorylength: 20714 epsilon: 0.8776564941721736
Training...
episode: 146 no of steps: 141 score: -34.0 avg score: -0.2411 memorylength: 20855 epsilon: 0.8768669586806835
Training...
episode: 147 no of steps: 138 score: -338.0 avg score: -2.4493 memorylength: 20993 epsilon: 0.8760781334514698
Training...
episode: 148 no of steps: 162 score: 15.0 avg score: 0.0926 memorylength: 21155 epsilon: 0.8752900178455839
Training...
episode: 149 no of steps: 149 score: 6.0 avg score: 0.0403 memorylength: 21304 epsilon: 0.8745026112246522
Training...
episode: 150 no of steps: 126 score: -319.0 avg score: -2.5317 memorylength: 21430 epsilon: 0.8737159129508754
saving states...
Training...
episode: 151 no of steps: 133 score: -126.0 avg score: -0.9474 memorylength: 21563 epsilon: 0.8729299223870276
Training...
episode: 152 no of steps: 134 score: -189.0 avg score: -1.4104 memorylength: 21697 epsilon: 0.8721446388964567
Training...
episode: 153 no of steps: 128 score: -301.0 avg score: -2.3516 memorylength: 21825 epsilon: 0.8713600618430829
Training...
episode: 154 no of steps: 126 score: -311.0 avg score: -2.4683 memorylength: 21951 epsilon: 0.8705761905913987
Training...
episode: 155 no of steps: 141 score: -269.0 avg score: -1.9078 memorylength: 22092 epsilon: 0.8697930245064683
Training...
episode: 156 no of steps: 128 score: -231.0 avg score: -1.8047 memorylength: 22220 epsilon: 0.8690105629539273
Training...
episode: 157 no of steps: 136 score: -284.0 avg score: -2.0882 memorylength: 22356 epsilon: 0.8682288052999816
Training...
episode: 158 no of steps: 149 score: -132.0 avg score: -0.8859 memorylength: 22505 epsilon: 0.8674477509114077
Training...
episode: 159 no of steps: 147 score: -289.0 avg score: -1.966 memorylength: 22652 epsilon: 0.8666673991555514
Training...
episode: 160 no of steps: 156 score: -270.0 avg score: -1.7308 memorylength: 22808 epsilon: 0.8658877494003275
Training...
episode: 161 no of steps: 144 score: -99.0 avg score: -0.6875 memorylength: 22952 epsilon: 0.8651088010142199
Training...
episode: 162 no of steps: 139 score: 57.0 avg score: 0.4101 memorylength: 23091 epsilon: 0.8643305533662805
Training...
episode: 163 no of steps: 139 score: 115.0 avg score: 0.8273 memorylength: 23230 epsilon: 0.8635530058261284
Training...
episode: 164 no of steps: 151 score: -5.0 avg score: -0.0331 memorylength: 23381 epsilon: 0.8627761577639501
Training...
episode: 165 no of steps: 145 score: -293.0 avg score: -2.0207 memorylength: 23526 epsilon: 0.8620000085504986
Training...
episode: 166 no of steps: 130 score: 21.0 avg score: 0.1615 memorylength: 23656 epsilon: 0.8612245575570932
Training...
episode: 167 no of steps: 140 score: -155.0 avg score: -1.1071 memorylength: 23796 epsilon: 0.8604498041556182
Training...
episode: 168 no of steps: 125 score: -185.0 avg score: -1.48 memorylength: 23921 epsilon: 0.8596757477185237
Training...
episode: 169 no of steps: 147 score: 193.0 avg score: 1.3129 memorylength: 24068 epsilon: 0.8589023876188238
Training...
episode: 170 no of steps: 134 score: -56.0 avg score: -0.4179 memorylength: 24202 epsilon: 0.8581297232300966
Training...
episode: 171 no of steps: 138 score: -145.0 avg score: -1.0507 memorylength: 24340 epsilon: 0.8573577539264841
Training...
episode: 172 no of steps: 131 score: -424.0 avg score: -3.2366 memorylength: 24471 epsilon: 0.856586479082691
Training...
episode: 173 no of steps: 141 score: -83.0 avg score: -0.5887 memorylength: 24612 epsilon: 0.8558158980739847
Training...
episode: 174 no of steps: 132 score: -415.0 avg score: -3.1439 memorylength: 24744 epsilon: 0.8550460102761945
Training...
episode: 175 no of steps: 140 score: -196.0 avg score: -1.4 memorylength: 24884 epsilon: 0.8542768150657114
Training...
episode: 176 no of steps: 137 score: -20.0 avg score: -0.146 memorylength: 25021 epsilon: 0.8535083118194869
Training...
episode: 177 no of steps: 127 score: -86.0 avg score: -0.6772 memorylength: 25148 epsilon: 0.8527404999150338
Training...
episode: 178 no of steps: 149 score: -423.0 avg score: -2.8389 memorylength: 25297 epsilon: 0.851973378730424
Training...
episode: 179 no of steps: 158 score: -123.0 avg score: -0.7785 memorylength: 25455 epsilon: 0.8512069476442895
Training...
episode: 180 no of steps: 142 score: -186.0 avg score: -1.3099 memorylength: 25597 epsilon: 0.850441206035821
Training...
episode: 181 no of steps: 141 score: -77.0 avg score: -0.5461 memorylength: 25738 epsilon: 0.8496761532847678
Training...
episode: 182 no of steps: 143 score: -555.0 avg score: -3.8811 memorylength: 25881 epsilon: 0.848911788771437
Training...
episode: 183 no of steps: 141 score: -353.0 avg score: -2.5035 memorylength: 26022 epsilon: 0.8481481118766936
Training...
episode: 184 no of steps: 130 score: -200.0 avg score: -1.5385 memorylength: 26152 epsilon: 0.847385121981959
Training...
episode: 185 no of steps: 128 score: 49.0 avg score: 0.3828 memorylength: 26280 epsilon: 0.8466228184692115
Training...
episode: 186 no of steps: 149 score: -113.0 avg score: -0.7584 memorylength: 26429 epsilon: 0.8458612007209851
Training...
episode: 187 no of steps: 146 score: -153.0 avg score: -1.0479 memorylength: 26575 epsilon: 0.8451002681203694
Training...
episode: 188 no of steps: 134 score: 129.0 avg score: 0.9627 memorylength: 26709 epsilon: 0.844340020051009
Training...
episode: 189 no of steps: 133 score: -185.0 avg score: -1.391 memorylength: 26842 epsilon: 0.843580455897103
Training...
episode: 190 no of steps: 136 score: -489.0 avg score: -3.5956 memorylength: 26978 epsilon: 0.8428215750434042
Training...
episode: 191 no of steps: 133 score: -309.0 avg score: -2.3233 memorylength: 27111 epsilon: 0.8420633768752193
Training...
episode: 192 no of steps: 147 score: -468.0 avg score: -3.1837 memorylength: 27258 epsilon: 0.8413058607784074
Training...
episode: 193 no of steps: 145 score: -170.0 avg score: -1.1724 memorylength: 27403 epsilon: 0.8405490261393808
Training...
episode: 194 no of steps: 145 score: -118.0 avg score: -0.8138 memorylength: 27548 epsilon: 0.839792872345103
Training...
episode: 195 no of steps: 136 score: -34.0 avg score: -0.25 memorylength: 27684 epsilon: 0.8390373987830898
Training...
episode: 196 no of steps: 124 score: -143.0 avg score: -1.1532 memorylength: 27808 epsilon: 0.8382826048414074
Training...
episode: 197 no of steps: 125 score: -288.0 avg score: -2.304 memorylength: 27933 epsilon: 0.8375284899086727
Training...
episode: 198 no of steps: 122 score: 88.0 avg score: 0.7213 memorylength: 28055 epsilon: 0.8367750533740523
Training...
episode: 199 no of steps: 124 score: -455.0 avg score: -3.6694 memorylength: 28179 epsilon: 0.8360222946272631
Training...
episode: 200 no of steps: 126 score: 178.0 avg score: 1.4127 memorylength: 28305 epsilon: 0.8352702130585699
saving states...
Training...
episode: 201 no of steps: 154 score: -231.0 avg score: -1.5 memorylength: 28459 epsilon: 0.834518808058787
Training...
episode: 202 no of steps: 145 score: -128.0 avg score: -0.8828 memorylength: 28604 epsilon: 0.8337680790192761
Training...
episode: 203 no of steps: 144 score: -216.0 avg score: -1.5 memorylength: 28748 epsilon: 0.8330180253319466
Training...
episode: 204 no of steps: 134 score: -307.0 avg score: -2.291 memorylength: 28882 epsilon: 0.8322686463892551
Training...
episode: 205 no of steps: 144 score: -277.0 avg score: -1.9236 memorylength: 29026 epsilon: 0.8315199415842047
Training...
episode: 206 no of steps: 137 score: -171.0 avg score: -1.2482 memorylength: 29163 epsilon: 0.8307719103103441
Training...
episode: 207 no of steps: 130 score: -28.0 avg score: -0.2154 memorylength: 29293 epsilon: 0.8300245519617685
Training...
episode: 208 no of steps: 131 score: -513.0 avg score: -3.916 memorylength: 29424 epsilon: 0.829277865933117
Training...
episode: 209 no of steps: 140 score: -442.0 avg score: -3.1571 memorylength: 29564 epsilon: 0.8285318516195743
Training...
episode: 210 no of steps: 119 score: -251.0 avg score: -2.1092 memorylength: 29683 epsilon: 0.8277865084168686
Training...
episode: 211 no of steps: 147 score: -402.0 avg score: -2.7347 memorylength: 29830 epsilon: 0.8270418357212719
Training...
episode: 212 no of steps: 147 score: 110.0 avg score: 0.7483 memorylength: 29977 epsilon: 0.8262978329295991
Training...
episode: 213 no of steps: 116 score: 13.0 avg score: 0.1121 memorylength: 30093 epsilon: 0.8255544994392082
Training...
episode: 214 no of steps: 131 score: -306.0 avg score: -2.3359 memorylength: 30224 epsilon: 0.8248118346479988
Training...
episode: 215 no of steps: 125 score: -122.0 avg score: -0.976 memorylength: 30349 epsilon: 0.8240698379544125
Training...
episode: 216 no of steps: 152 score: -374.0 avg score: -2.4605 memorylength: 30501 epsilon: 0.8233285087574318
Training...
episode: 217 no of steps: 150 score: -212.0 avg score: -1.4133 memorylength: 30651 epsilon: 0.8225878464565802
Training...
episode: 218 no of steps: 133 score: -311.0 avg score: -2.3383 memorylength: 30784 epsilon: 0.8218478504519211
Training...
episode: 219 no of steps: 121 score: -36.0 avg score: -0.2975 memorylength: 30905 epsilon: 0.8211085201440578
Training...
episode: 220 no of steps: 138 score: 206.0 avg score: 1.4928 memorylength: 31043 epsilon: 0.8203698549341325
Training...
episode: 221 no of steps: 140 score: 150.0 avg score: 1.0714 memorylength: 31183 epsilon: 0.8196318542238266
Training...
episode: 222 no of steps: 150 score: -354.0 avg score: -2.36 memorylength: 31333 epsilon: 0.8188945174153591
Training...
episode: 223 no of steps: 135 score: -246.0 avg score: -1.8222 memorylength: 31468 epsilon: 0.8181578439114875
Training...
episode: 224 no of steps: 150 score: 0.0 avg score: 0.0 memorylength: 31618 epsilon: 0.8174218331155061
Training...
episode: 225 no of steps: 127 score: -256.0 avg score: -2.0157 memorylength: 31745 epsilon: 0.816686484431246
Training...
episode: 226 no of steps: 145 score: -248.0 avg score: -1.7103 memorylength: 31890 epsilon: 0.815951797263075
Training...
episode: 227 no of steps: 152 score: -116.0 avg score: -0.7632 memorylength: 32042 epsilon: 0.8152177710158962
Training...
episode: 228 no of steps: 139 score: -70.0 avg score: -0.5036 memorylength: 32181 epsilon: 0.8144844050951485
Training...
episode: 229 no of steps: 143 score: 80.0 avg score: 0.5594 memorylength: 32324 epsilon: 0.8137516989068052
Training...
episode: 230 no of steps: 144 score: -362.0 avg score: -2.5139 memorylength: 32468 epsilon: 0.8130196518573746
Training...
episode: 231 no of steps: 137 score: -313.0 avg score: -2.2847 memorylength: 32605 epsilon: 0.8122882633538981
Training...
episode: 232 no of steps: 143 score: -284.0 avg score: -1.986 memorylength: 32748 epsilon: 0.8115575328039515
Training...
episode: 233 no of steps: 138 score: -191.0 avg score: -1.3841 memorylength: 32886 epsilon: 0.8108274596156426
Training...
episode: 234 no of steps: 154 score: -573.0 avg score: -3.7208 memorylength: 33040 epsilon: 0.8100980431976122
Training...
episode: 235 no of steps: 137 score: -123.0 avg score: -0.8978 memorylength: 33177 epsilon: 0.8093692829590331
Training...
episode: 236 no of steps: 138 score: 22.0 avg score: 0.1594 memorylength: 33315 epsilon: 0.8086411783096092
Training...
episode: 237 no of steps: 141 score: -68.0 avg score: -0.4823 memorylength: 33456 epsilon: 0.8079137286595759
Training...
episode: 238 no of steps: 148 score: -469.0 avg score: -3.1689 memorylength: 33604 epsilon: 0.8071869334196989
Training...
episode: 239 no of steps: 133 score: -121.0 avg score: -0.9098 memorylength: 33737 epsilon: 0.806460792001274
Training...
episode: 240 no of steps: 146 score: -504.0 avg score: -3.4521 memorylength: 33883 epsilon: 0.8057353038161267
Training...
episode: 241 no of steps: 122 score: -309.0 avg score: -2.5328 memorylength: 34005 epsilon: 0.8050104682766114
Training...
episode: 242 no of steps: 122 score: -72.0 avg score: -0.5902 memorylength: 34127 epsilon: 0.8042862847956113
Training...
episode: 243 no of steps: 141 score: -148.0 avg score: -1.0496 memorylength: 34268 epsilon: 0.8035627527865377
Training...
episode: 244 no of steps: 132 score: -411.0 avg score: -3.1136 memorylength: 34400 epsilon: 0.8028398716633297
Training...
episode: 245 no of steps: 171 score: 27.0 avg score: 0.1579 memorylength: 34571 epsilon: 0.8021176408404536
Training...
episode: 246 no of steps: 139 score: -266.0 avg score: -1.9137 memorylength: 34710 epsilon: 0.8013960597329023
Training...
episode: 247 no of steps: 164 score: 45.0 avg score: 0.2744 memorylength: 34874 epsilon: 0.8006751277561951
Training...
episode: 248 no of steps: 141 score: -23.0 avg score: -0.1631 memorylength: 35015 epsilon: 0.7999548443263771
Training...
episode: 249 no of steps: 157 score: -369.0 avg score: -2.3503 memorylength: 35172 epsilon: 0.7992352088600185
Training...
episode: 250 no of steps: 161 score: -64.0 avg score: -0.3975 memorylength: 35333 epsilon: 0.7985162207742149
saving states...
Training...
episode: 251 no of steps: 144 score: -219.0 avg score: -1.5208 memorylength: 35477 epsilon: 0.7977978794865855
Training...
episode: 252 no of steps: 129 score: -301.0 avg score: -2.3333 memorylength: 35606 epsilon: 0.7970801844152741
Training...
episode: 253 no of steps: 138 score: -162.0 avg score: -1.1739 memorylength: 35744 epsilon: 0.7963631349789475
Training...
episode: 254 no of steps: 145 score: -208.0 avg score: -1.4345 memorylength: 35889 epsilon: 0.7956467305967957
Training...
episode: 255 no of steps: 140 score: -449.0 avg score: -3.2071 memorylength: 36029 epsilon: 0.7949309706885311
Training...
episode: 256 no of steps: 156 score: -239.0 avg score: -1.5321 memorylength: 36185 epsilon: 0.7942158546743882
Training...
episode: 257 no of steps: 149 score: -27.0 avg score: -0.1812 memorylength: 36334 epsilon: 0.7935013819751228
Training...
episode: 258 no of steps: 138 score: 2.0 avg score: 0.0145 memorylength: 36472 epsilon: 0.7927875520120121
Training...
episode: 259 no of steps: 140 score: -82.0 avg score: -0.5857 memorylength: 36612 epsilon: 0.7920743642068538
Training...
episode: 260 no of steps: 144 score: -216.0 avg score: -1.5 memorylength: 36756 epsilon: 0.7913618179819657
Training...
episode: 261 no of steps: 133 score: -271.0 avg score: -2.0376 memorylength: 36889 epsilon: 0.7906499127601854
Training...
episode: 262 no of steps: 146 score: -88.0 avg score: -0.6027 memorylength: 37035 epsilon: 0.7899386479648695
Training...
episode: 263 no of steps: 130 score: -135.0 avg score: -1.0385 memorylength: 37165 epsilon: 0.7892280230198935
Training...
episode: 264 no of steps: 139 score: -68.0 avg score: -0.4892 memorylength: 37304 epsilon: 0.7885180373496512
Training...
episode: 265 no of steps: 143 score: -333.0 avg score: -2.3287 memorylength: 37447 epsilon: 0.7878086903790542
Training...
episode: 266 no of steps: 135 score: -28.0 avg score: -0.2074 memorylength: 37582 epsilon: 0.7870999815335313
Training...
episode: 267 no of steps: 138 score: 34.0 avg score: 0.2464 memorylength: 37720 epsilon: 0.7863919102390287
Training...
episode: 268 no of steps: 129 score: -59.0 avg score: -0.4574 memorylength: 37849 epsilon: 0.785684475922008
Training...
episode: 269 no of steps: 133 score: -37.0 avg score: -0.2782 memorylength: 37982 epsilon: 0.7849776780094476
Training...
episode: 270 no of steps: 151 score: -421.0 avg score: -2.7881 memorylength: 38133 epsilon: 0.7842715159288414
Training...
episode: 271 no of steps: 151 score: -245.0 avg score: -1.6225 memorylength: 38284 epsilon: 0.7835659891081977
Training...
episode: 272 no of steps: 140 score: -369.0 avg score: -2.6357 memorylength: 38424 epsilon: 0.78286109697604
Training...
episode: 273 no of steps: 128 score: -262.0 avg score: -2.0469 memorylength: 38552 epsilon: 0.7821568389614056
Training...
episode: 274 no of steps: 135 score: -288.0 avg score: -2.1333 memorylength: 38687 epsilon: 0.7814532144938454
Training...
episode: 275 no of steps: 139 score: -47.0 avg score: -0.3381 memorylength: 38826 epsilon: 0.7807502230034236
Training...
episode: 276 no of steps: 149 score: -81.0 avg score: -0.5436 memorylength: 38975 epsilon: 0.7800478639207169
Training...
episode: 277 no of steps: 140 score: -98.0 avg score: -0.7 memorylength: 39115 epsilon: 0.7793461366768145
Training...
episode: 278 no of steps: 135 score: -184.0 avg score: -1.363 memorylength: 39250 epsilon: 0.7786450407033176
Training...
episode: 279 no of steps: 140 score: 68.0 avg score: 0.4857 memorylength: 39390 epsilon: 0.7779445754323379
Training...
episode: 280 no of steps: 133 score: -128.0 avg score: -0.9624 memorylength: 39523 epsilon: 0.7772447402964987
Training...
episode: 281 no of steps: 132 score: -181.0 avg score: -1.3712 memorylength: 39655 epsilon: 0.7765455347289337
Training...
episode: 282 no of steps: 148 score: -252.0 avg score: -1.7027 memorylength: 39803 epsilon: 0.7758469581632861
Training...
episode: 283 no of steps: 131 score: -172.0 avg score: -1.313 memorylength: 39934 epsilon: 0.775149010033709
Training...
episode: 284 no of steps: 147 score: -110.0 avg score: -0.7483 memorylength: 40081 epsilon: 0.7744516897748642
Training...
episode: 285 no of steps: 145 score: -140.0 avg score: -0.9655 memorylength: 40226 epsilon: 0.7737549968219225
Training...
episode: 286 no of steps: 140 score: -35.0 avg score: -0.25 memorylength: 40366 epsilon: 0.7730589306105623
Training...
episode: 287 no of steps: 139 score: 4.0 avg score: 0.0288 memorylength: 40505 epsilon: 0.7723634905769701
Training...
episode: 288 no of steps: 132 score: -222.0 avg score: -1.6818 memorylength: 40637 epsilon: 0.7716686761578395
Training...
episode: 289 no of steps: 137 score: -144.0 avg score: -1.0511 memorylength: 40774 epsilon: 0.7709744867903705
Training...
episode: 290 no of steps: 149 score: -254.0 avg score: -1.7047 memorylength: 40923 epsilon: 0.7702809219122699
Training...
episode: 291 no of steps: 130 score: -325.0 avg score: -2.5 memorylength: 41053 epsilon: 0.7695879809617502
Training...
episode: 292 no of steps: 144 score: -189.0 avg score: -1.3125 memorylength: 41197 epsilon: 0.7688956633775289
Training...
episode: 293 no of steps: 137 score: 332.0 avg score: 2.4234 memorylength: 41334 epsilon: 0.768203968598829
Training...
episode: 294 no of steps: 140 score: -297.0 avg score: -2.1214 memorylength: 41474 epsilon: 0.7675128960653774
Training...
episode: 295 no of steps: 133 score: -97.0 avg score: -0.7293 memorylength: 41607 epsilon: 0.7668224452174056
Training...
episode: 296 no of steps: 131 score: -199.0 avg score: -1.5191 memorylength: 41738 epsilon: 0.7661326154956484
Training...
episode: 297 no of steps: 137 score: -473.0 avg score: -3.4526 memorylength: 41875 epsilon: 0.7654434063413432
Training...
episode: 298 no of steps: 136 score: -258.0 avg score: -1.8971 memorylength: 42011 epsilon: 0.7647548171962312
Training...
episode: 299 no of steps: 131 score: -198.0 avg score: -1.5115 memorylength: 42142 epsilon: 0.7640668475025545
Training...
episode: 300 no of steps: 135 score: -131.0 avg score: -0.9704 memorylength: 42277 epsilon: 0.7633794967030583
saving states...
Training...
episode: 301 no of steps: 139 score: 12.0 avg score: 0.0863 memorylength: 42416 epsilon: 0.7626927642409879
Training...
episode: 302 no of steps: 137 score: -115.0 avg score: -0.8394 memorylength: 42553 epsilon: 0.7620066495600902
Training...
episode: 303 no of steps: 140 score: 27.0 avg score: 0.1929 memorylength: 42693 epsilon: 0.7613211521046122
Training...
episode: 304 no of steps: 141 score: 212.0 avg score: 1.5035 memorylength: 42834 epsilon: 0.7606362713193008
Training...
episode: 305 no of steps: 128 score: -335.0 avg score: -2.6172 memorylength: 42962 epsilon: 0.7599520066494028
Training...
episode: 306 no of steps: 147 score: -173.0 avg score: -1.1769 memorylength: 43109 epsilon: 0.7592683575406636
Training...
episode: 307 no of steps: 141 score: 114.0 avg score: 0.8085 memorylength: 43250 epsilon: 0.7585853234393273
Training...
episode: 308 no of steps: 136 score: -68.0 avg score: -0.5 memorylength: 43386 epsilon: 0.7579029037921364
Training...
episode: 309 no of steps: 148 score: -227.0 avg score: -1.5338 memorylength: 43534 epsilon: 0.7572210980463311
Training...
episode: 310 no of steps: 124 score: -91.0 avg score: -0.7339 memorylength: 43658 epsilon: 0.7565399056496483
Training...
episode: 311 no of steps: 132 score: 51.0 avg score: 0.3864 memorylength: 43790 epsilon: 0.7558593260503225
Training...
episode: 312 no of steps: 134 score: 53.0 avg score: 0.3955 memorylength: 43924 epsilon: 0.755179358697084
Training...
episode: 313 no of steps: 137 score: -154.0 avg score: -1.1241 memorylength: 44061 epsilon: 0.7545000030391591
Training...
episode: 314 no of steps: 147 score: -72.0 avg score: -0.4898 memorylength: 44208 epsilon: 0.7538212585262699
Training...
episode: 315 no of steps: 138 score: -115.0 avg score: -0.8333 memorylength: 44346 epsilon: 0.7531431246086333
Training...
episode: 316 no of steps: 144 score: 286.0 avg score: 1.9861 memorylength: 44490 epsilon: 0.7524656007369607
Training...
episode: 317 no of steps: 141 score: -93.0 avg score: -0.6596 memorylength: 44631 epsilon: 0.7517886863624577
Training...
episode: 318 no of steps: 155 score: 35.0 avg score: 0.2258 memorylength: 44786 epsilon: 0.7511123809368235
Training...
episode: 319 no of steps: 132 score: -176.0 avg score: -1.3333 memorylength: 44918 epsilon: 0.750436683912251
Training...
episode: 320 no of steps: 151 score: -234.0 avg score: -1.5497 memorylength: 45069 epsilon: 0.7497615947414253
Training...
episode: 321 no of steps: 144 score: -95.0 avg score: -0.6597 memorylength: 45213 epsilon: 0.7490871128775244
Training...
episode: 322 no of steps: 148 score: 211.0 avg score: 1.4257 memorylength: 45361 epsilon: 0.7484132377742176
Training...
episode: 323 no of steps: 130 score: 103.0 avg score: 0.7923 memorylength: 45491 epsilon: 0.7477399688856664
Training...
episode: 324 no of steps: 139 score: -385.0 avg score: -2.7698 memorylength: 45630 epsilon: 0.7470673056665227
Training...
episode: 325 no of steps: 149 score: -45.0 avg score: -0.302 memorylength: 45779 epsilon: 0.7463952475719293
Training...
episode: 326 no of steps: 126 score: -117.0 avg score: -0.9286 memorylength: 45905 epsilon: 0.7457237940575192
Training...
episode: 327 no of steps: 137 score: -351.0 avg score: -2.562 memorylength: 46042 epsilon: 0.7450529445794148
Training...
episode: 328 no of steps: 123 score: -133.0 avg score: -1.0813 memorylength: 46165 epsilon: 0.7443826985942283
Training...
episode: 329 no of steps: 129 score: -224.0 avg score: -1.7364 memorylength: 46294 epsilon: 0.7437130555590602
Training...
episode: 330 no of steps: 167 score: 236.0 avg score: 1.4132 memorylength: 46461 epsilon: 0.7430440149314997
Training...
episode: 331 no of steps: 130 score: -411.0 avg score: -3.1615 memorylength: 46591 epsilon: 0.7423755761696239
Training...
episode: 332 no of steps: 128 score: -371.0 avg score: -2.8984 memorylength: 46719 epsilon: 0.7417077387319971
Training...
episode: 333 no of steps: 138 score: -138.0 avg score: -1.0 memorylength: 46857 epsilon: 0.7410405020776712
Training...
episode: 334 no of steps: 148 score: -538.0 avg score: -3.6351 memorylength: 47005 epsilon: 0.7403738656661846
Training...
episode: 335 no of steps: 121 score: -387.0 avg score: -3.1983 memorylength: 47126 epsilon: 0.7397078289575613
Training...
episode: 336 no of steps: 129 score: -19.0 avg score: -0.1473 memorylength: 47255 epsilon: 0.7390423914123119
Training...
episode: 337 no of steps: 139 score: -246.0 avg score: -1.7698 memorylength: 47394 epsilon: 0.7383775524914318
Training...
episode: 338 no of steps: 142 score: -116.0 avg score: -0.8169 memorylength: 47536 epsilon: 0.7377133116564015
Training...
episode: 339 no of steps: 119 score: -126.0 avg score: -1.0588 memorylength: 47655 epsilon: 0.737049668369186
Training...
episode: 340 no of steps: 149 score: 13.0 avg score: 0.0872 memorylength: 47804 epsilon: 0.7363866220922339
Training...
episode: 341 no of steps: 136 score: -110.0 avg score: -0.8088 memorylength: 47940 epsilon: 0.735724172288478
Training...
episode: 342 no of steps: 140 score: -149.0 avg score: -1.0643 memorylength: 48080 epsilon: 0.7350623184213336
Training...
episode: 343 no of steps: 129 score: -170.0 avg score: -1.3178 memorylength: 48209 epsilon: 0.7344010599546994
Training...
episode: 344 no of steps: 143 score: -133.0 avg score: -0.9301 memorylength: 48352 epsilon: 0.7337403963529557
Training...
episode: 345 no of steps: 134 score: 0.0 avg score: 0.0 memorylength: 48486 epsilon: 0.7330803270809652
Training...
episode: 346 no of steps: 140 score: -236.0 avg score: -1.6857 memorylength: 48626 epsilon: 0.7324208516040714
Training...
episode: 347 no of steps: 142 score: -115.0 avg score: -0.8099 memorylength: 48768 epsilon: 0.7317619693880996
Training...
episode: 348 no of steps: 140 score: 18.0 avg score: 0.1286 memorylength: 48908 epsilon: 0.7311036798993548
Training...
episode: 349 no of steps: 127 score: -176.0 avg score: -1.3858 memorylength: 49035 epsilon: 0.7304459826046226
Training...
episode: 350 no of steps: 131 score: -134.0 avg score: -1.0229 memorylength: 49166 epsilon: 0.7297888769711681
saving states...
Training...
episode: 351 no of steps: 129 score: -159.0 avg score: -1.2326 memorylength: 49295 epsilon: 0.7291323624667357
Training...
episode: 352 no of steps: 133 score: -198.0 avg score: -1.4887 memorylength: 49428 epsilon: 0.7284764385595488
Training...
episode: 353 no of steps: 132 score: -101.0 avg score: -0.7652 memorylength: 49560 epsilon: 0.7278211047183089
Training...
episode: 354 no of steps: 148 score: 156.0 avg score: 1.0541 memorylength: 49708 epsilon: 0.7271663604121953
Training...
episode: 355 no of steps: 154 score: -250.0 avg score: -1.6234 memorylength: 49862 epsilon: 0.7265122051108653
Training...
episode: 356 no of steps: 136 score: -36.0 avg score: -0.2647 memorylength: 49998 epsilon: 0.7258586382844532
Training...
episode: 357 no of steps: 138 score: 170.0 avg score: 1.2319 memorylength: 50136 epsilon: 0.7252056594035697
Training...
episode: 358 no of steps: 150 score: -285.0 avg score: -1.9 memorylength: 50286 epsilon: 0.7245532679393019
Training...
episode: 359 no of steps: 148 score: -250.0 avg score: -1.6892 memorylength: 50434 epsilon: 0.7239014633632126
Training...
episode: 360 no of steps: 138 score: -113.0 avg score: -0.8188 memorylength: 50572 epsilon: 0.7232502451473399
Training...
episode: 361 no of steps: 139 score: -408.0 avg score: -2.9353 memorylength: 50711 epsilon: 0.7225996127641975
Training...
episode: 362 no of steps: 137 score: 74.0 avg score: 0.5401 memorylength: 50848 epsilon: 0.7219495656867727
Training...
episode: 363 no of steps: 144 score: -271.0 avg score: -1.8819 memorylength: 50992 epsilon: 0.7213001033885276
Training...
episode: 364 no of steps: 140 score: -351.0 avg score: -2.5071 memorylength: 51132 epsilon: 0.7206512253433974
Training...
episode: 365 no of steps: 149 score: -486.0 avg score: -3.2617 memorylength: 51281 epsilon: 0.7200029310257912
Training...
episode: 366 no of steps: 137 score: -124.0 avg score: -0.9051 memorylength: 51418 epsilon: 0.7193552199105904
Training...
episode: 367 no of steps: 143 score: -132.0 avg score: -0.9231 memorylength: 51561 epsilon: 0.7187080914731488
Training...
episode: 368 no of steps: 149 score: -271.0 avg score: -1.8188 memorylength: 51710 epsilon: 0.7180615451892927
Training...
episode: 369 no of steps: 152 score: -106.0 avg score: -0.6974 memorylength: 51862 epsilon: 0.7174155805353191
Training...
episode: 370 no of steps: 142 score: 17.0 avg score: 0.1197 memorylength: 52004 epsilon: 0.716770196987997
Training...
episode: 371 no of steps: 144 score: -91.0 avg score: -0.6319 memorylength: 52148 epsilon: 0.7161253940245657
Training...
episode: 372 no of steps: 135 score: -83.0 avg score: -0.6148 memorylength: 52283 epsilon: 0.7154811711227343
Training...
episode: 373 no of steps: 146 score: 42.0 avg score: 0.2877 memorylength: 52429 epsilon: 0.7148375277606827
Training...
episode: 374 no of steps: 131 score: -54.0 avg score: -0.4122 memorylength: 52560 epsilon: 0.7141944634170596
Training...
episode: 375 no of steps: 127 score: -164.0 avg score: -1.2913 memorylength: 52687 epsilon: 0.7135519775709829
Training...
episode: 376 no of steps: 124 score: -280.0 avg score: -2.2581 memorylength: 52811 epsilon: 0.7129100697020386
Training...
episode: 377 no of steps: 150 score: -158.0 avg score: -1.0533 memorylength: 52961 epsilon: 0.7122687392902819
Training...
episode: 378 no of steps: 145 score: -125.0 avg score: -0.8621 memorylength: 53106 epsilon: 0.7116279858162348
Training...
episode: 379 no of steps: 155 score: -233.0 avg score: -1.5032 memorylength: 53261 epsilon: 0.7109878087608871
Training...
episode: 380 no of steps: 158 score: 12.0 avg score: 0.0759 memorylength: 53419 epsilon: 0.7103482076056952
Training...
episode: 381 no of steps: 139 score: -149.0 avg score: -1.0719 memorylength: 53558 epsilon: 0.7097091818325822
Training...
episode: 382 no of steps: 150 score: -181.0 avg score: -1.2067 memorylength: 53708 epsilon: 0.7090707309239372
Training...
episode: 383 no of steps: 118 score: -154.0 avg score: -1.3051 memorylength: 53826 epsilon: 0.7084328543626149
Training...
episode: 384 no of steps: 145 score: -59.0 avg score: -0.4069 memorylength: 53971 epsilon: 0.7077955516319353
Training...
episode: 385 no of steps: 154 score: -393.0 avg score: -2.5519 memorylength: 54125 epsilon: 0.7071588222156832
Training...
episode: 386 no of steps: 140 score: -271.0 avg score: -1.9357 memorylength: 54265 epsilon: 0.7065226655981075
Training...
episode: 387 no of steps: 138 score: -369.0 avg score: -2.6739 memorylength: 54403 epsilon: 0.7058870812639215
Training...
episode: 388 no of steps: 153 score: 12.0 avg score: 0.0784 memorylength: 54556 epsilon: 0.7052520686983019
Training...
episode: 389 no of steps: 127 score: 115.0 avg score: 0.9055 memorylength: 54683 epsilon: 0.7046176273868884
Training...
episode: 390 no of steps: 136 score: 132.0 avg score: 0.9706 memorylength: 54819 epsilon: 0.7039837568157834
Training...
episode: 391 no of steps: 134 score: -28.0 avg score: -0.209 memorylength: 54953 epsilon: 0.7033504564715519
Training...
episode: 392 no of steps: 157 score: -19.0 avg score: -0.121 memorylength: 55110 epsilon: 0.7027177258412204
Training...
episode: 393 no of steps: 141 score: -239.0 avg score: -1.695 memorylength: 55251 epsilon: 0.7020855644122772
Training...
episode: 394 no of steps: 136 score: -333.0 avg score: -2.4485 memorylength: 55387 epsilon: 0.7014539716726715
Training...
episode: 395 no of steps: 134 score: -9.0 avg score: -0.0672 memorylength: 55521 epsilon: 0.7008229471108132
Training...
episode: 396 no of steps: 133 score: -78.0 avg score: -0.5865 memorylength: 55654 epsilon: 0.7001924902155721
Training...
episode: 397 no of steps: 135 score: -50.0 avg score: -0.3704 memorylength: 55789 epsilon: 0.6995626004762784
Training...
episode: 398 no of steps: 133 score: -11.0 avg score: -0.0827 memorylength: 55922 epsilon: 0.6989332773827212
Training...
episode: 399 no of steps: 133 score: -234.0 avg score: -1.7594 memorylength: 56055 epsilon: 0.6983045204251486
Training...
episode: 400 no of steps: 143 score: -14.0 avg score: -0.0979 memorylength: 56198 epsilon: 0.6976763290942678
saving states...
Training...
episode: 401 no of steps: 152 score: -150.0 avg score: -0.9868 memorylength: 56350 epsilon: 0.6970487028812435
Training...
episode: 402 no of steps: 124 score: -176.0 avg score: -1.4194 memorylength: 56474 epsilon: 0.6964216412776987
Training...
episode: 403 no of steps: 146 score: -128.0 avg score: -0.8767 memorylength: 56620 epsilon: 0.6957951437757133
Training...
episode: 404 no of steps: 130 score: -145.0 avg score: -1.1154 memorylength: 56750 epsilon: 0.6951692098678243
Training...
episode: 405 no of steps: 134 score: -127.0 avg score: -0.9478 memorylength: 56884 epsilon: 0.694543839047025
Training...
episode: 406 no of steps: 109 score: -205.0 avg score: -1.8807 memorylength: 56993 epsilon: 0.6939190308067654
Training...
episode: 407 no of steps: 129 score: -3.0 avg score: -0.0233 memorylength: 57122 epsilon: 0.6932947846409505
Training...
episode: 408 no of steps: 140 score: -423.0 avg score: -3.0214 memorylength: 57262 epsilon: 0.6926711000439412
Training...
episode: 409 no of steps: 142 score: -57.0 avg score: -0.4014 memorylength: 57404 epsilon: 0.6920479765105524
Training...
episode: 410 no of steps: 132 score: -137.0 avg score: -1.0379 memorylength: 57536 epsilon: 0.6914254135360544
Training...
episode: 411 no of steps: 130 score: -189.0 avg score: -1.4538 memorylength: 57666 epsilon: 0.6908034106161711
Training...
episode: 412 no of steps: 139 score: -347.0 avg score: -2.4964 memorylength: 57805 epsilon: 0.6901819672470801
Training...
episode: 413 no of steps: 126 score: -217.0 avg score: -1.7222 memorylength: 57931 epsilon: 0.6895610829254122
Training...
episode: 414 no of steps: 148 score: -195.0 avg score: -1.3176 memorylength: 58079 epsilon: 0.688940757148251
Training...
episode: 415 no of steps: 131 score: 88.0 avg score: 0.6718 memorylength: 58210 epsilon: 0.6883209894131327
Training...
episode: 416 no of steps: 126 score: -183.0 avg score: -1.4524 memorylength: 58336 epsilon: 0.6877017792180453
Training...
episode: 417 no of steps: 134 score: -63.0 avg score: -0.4701 memorylength: 58470 epsilon: 0.6870831260614287
Training...
episode: 418 no of steps: 133 score: -18.0 avg score: -0.1353 memorylength: 58603 epsilon: 0.6864650294421736
Training...
episode: 419 no of steps: 127 score: -243.0 avg score: -1.9134 memorylength: 58730 epsilon: 0.6858474888596218
Training...
episode: 420 no of steps: 150 score: -432.0 avg score: -2.88 memorylength: 58880 epsilon: 0.6852305038135653
Training...
episode: 421 no of steps: 126 score: 81.0 avg score: 0.6429 memorylength: 59006 epsilon: 0.6846140738042463
Training...
episode: 422 no of steps: 155 score: 17.0 avg score: 0.1097 memorylength: 59161 epsilon: 0.6839981983323564
Training...
episode: 423 no of steps: 131 score: -63.0 avg score: -0.4809 memorylength: 59292 epsilon: 0.6833828768990365
Training...
episode: 424 no of steps: 137 score: 18.0 avg score: 0.1314 memorylength: 59429 epsilon: 0.6827681090058761
Training...
episode: 425 no of steps: 144 score: -129.0 avg score: -0.8958 memorylength: 59573 epsilon: 0.6821538941549133
Training...
episode: 426 no of steps: 135 score: -180.0 avg score: -1.3333 memorylength: 59708 epsilon: 0.6815402318486339
Training...
episode: 427 no of steps: 132 score: -153.0 avg score: -1.1591 memorylength: 59840 epsilon: 0.6809271215899715
Training...
episode: 428 no of steps: 150 score: -34.0 avg score: -0.2267 memorylength: 59990 epsilon: 0.6803145628823066
Training...
episode: 429 no of steps: 118 score: -195.0 avg score: -1.6525 memorylength: 60108 epsilon: 0.6797025552294668
Training...
episode: 430 no of steps: 147 score: -29.0 avg score: -0.1973 memorylength: 60255 epsilon: 0.6790910981357259
Training...
episode: 431 no of steps: 131 score: -276.0 avg score: -2.1069 memorylength: 60386 epsilon: 0.6784801911058034
Training...
episode: 432 no of steps: 143 score: -111.0 avg score: -0.7762 memorylength: 60529 epsilon: 0.6778698336448647
Training...
episode: 433 no of steps: 142 score: -351.0 avg score: -2.4718 memorylength: 60671 epsilon: 0.6772600252585202
Training...
episode: 434 no of steps: 134 score: -117.0 avg score: -0.8731 memorylength: 60805 epsilon: 0.6766507654528252
Training...
episode: 435 no of steps: 135 score: 264.0 avg score: 1.9556 memorylength: 60940 epsilon: 0.6760420537342791
Training...
episode: 436 no of steps: 130 score: -247.0 avg score: -1.9 memorylength: 61070 epsilon: 0.6754338896098253
Training...
episode: 437 no of steps: 133 score: 29.0 avg score: 0.218 memorylength: 61203 epsilon: 0.6748262725868509
Training...
episode: 438 no of steps: 133 score: 171.0 avg score: 1.2857 memorylength: 61336 epsilon: 0.6742192021731862
Training...
episode: 439 no of steps: 144 score: -45.0 avg score: -0.3125 memorylength: 61480 epsilon: 0.6736126778771039
Training...
episode: 440 no of steps: 128 score: 2.0 avg score: 0.0156 memorylength: 61608 epsilon: 0.6730066992073196
Training...
episode: 441 no of steps: 135 score: -392.0 avg score: -2.9037 memorylength: 61743 epsilon: 0.6724012656729901
Training...
episode: 442 no of steps: 144 score: -201.0 avg score: -1.3958 memorylength: 61887 epsilon: 0.6717963767837146
Training...
episode: 443 no of steps: 138 score: -253.0 avg score: -1.8333 memorylength: 62025 epsilon: 0.6711920320495329
Training...
episode: 444 no of steps: 140 score: -198.0 avg score: -1.4143 memorylength: 62165 epsilon: 0.6705882309809258
Training...
episode: 445 no of steps: 143 score: -104.0 avg score: -0.7273 memorylength: 62308 epsilon: 0.6699849730888142
Training...
episode: 446 no of steps: 141 score: 197.0 avg score: 1.3972 memorylength: 62449 epsilon: 0.6693822578845595
Training...
episode: 447 no of steps: 152 score: 47.0 avg score: 0.3092 memorylength: 62601 epsilon: 0.6687800848799622
Training...
episode: 448 no of steps: 134 score: 63.0 avg score: 0.4701 memorylength: 62735 epsilon: 0.668178453587262
Training...
episode: 449 no of steps: 139 score: -115.0 avg score: -0.8273 memorylength: 62874 epsilon: 0.6675773635191378
Training...
episode: 450 no of steps: 133 score: -165.0 avg score: -1.2406 memorylength: 63007 epsilon: 0.6669768141887062
saving states...
Training...
episode: 451 no of steps: 130 score: -92.0 avg score: -0.7077 memorylength: 63137 epsilon: 0.6663768051095227
Training...
episode: 452 no of steps: 136 score: -208.0 avg score: -1.5294 memorylength: 63273 epsilon: 0.6657773357955796
Training...
episode: 453 no of steps: 130 score: 162.0 avg score: 1.2462 memorylength: 63403 epsilon: 0.6651784057613068
Training...
episode: 454 no of steps: 123 score: -129.0 avg score: -1.0488 memorylength: 63526 epsilon: 0.6645800145215709
Training...
episode: 455 no of steps: 130 score: -119.0 avg score: -0.9154 memorylength: 63656 epsilon: 0.663982161591675
Training...
episode: 456 no of steps: 127 score: -404.0 avg score: -3.1811 memorylength: 63783 epsilon: 0.6633848464873582
Training...
episode: 457 no of steps: 133 score: 255.0 avg score: 1.9173 memorylength: 63916 epsilon: 0.6627880687247952
Training...
episode: 458 no of steps: 123 score: -163.0 avg score: -1.3252 memorylength: 64039 epsilon: 0.6621918278205962
Training...
episode: 459 no of steps: 128 score: -86.0 avg score: -0.6719 memorylength: 64167 epsilon: 0.6615961232918056
Training...
episode: 460 no of steps: 140 score: -168.0 avg score: -1.2 memorylength: 64307 epsilon: 0.661000954655903
Training...
episode: 461 no of steps: 140 score: 103.0 avg score: 0.7357 memorylength: 64447 epsilon: 0.6604063214308017
Training...
episode: 462 no of steps: 132 score: 46.0 avg score: 0.3485 memorylength: 64579 epsilon: 0.6598122231348488
Training...
episode: 463 no of steps: 135 score: 74.0 avg score: 0.5481 memorylength: 64714 epsilon: 0.6592186592868245
Training...
episode: 464 no of steps: 147 score: -144.0 avg score: -0.9796 memorylength: 64861 epsilon: 0.6586256294059424
Training...
episode: 465 no of steps: 130 score: -9.0 avg score: -0.0692 memorylength: 64991 epsilon: 0.658033133011848
Training...
episode: 466 no of steps: 131 score: 196.0 avg score: 1.4962 memorylength: 65122 epsilon: 0.657441169624619
Training...
episode: 467 no of steps: 129 score: -42.0 avg score: -0.3256 memorylength: 65251 epsilon: 0.6568497387647653
Training...
episode: 468 no of steps: 146 score: 21.0 avg score: 0.1438 memorylength: 65397 epsilon: 0.656258839953228
Training...
episode: 469 no of steps: 133 score: -252.0 avg score: -1.8947 memorylength: 65530 epsilon: 0.6556684727113786
Training...
episode: 470 no of steps: 131 score: 3.0 avg score: 0.0229 memorylength: 65661 epsilon: 0.65507863656102
Training...
episode: 471 no of steps: 139 score: -20.0 avg score: -0.1439 memorylength: 65800 epsilon: 0.6544893310243847
Training...
episode: 472 no of steps: 125 score: -180.0 avg score: -1.44 memorylength: 65925 epsilon: 0.6539005556241352
Training...
episode: 473 no of steps: 135 score: -404.0 avg score: -2.9926 memorylength: 66060 epsilon: 0.6533123098833634
Training...
episode: 474 no of steps: 131 score: -83.0 avg score: -0.6336 memorylength: 66191 epsilon: 0.6527245933255902
Training...
episode: 475 no of steps: 144 score: -209.0 avg score: -1.4514 memorylength: 66335 epsilon: 0.6521374054747652
Training...
episode: 476 no of steps: 141 score: -74.0 avg score: -0.5248 memorylength: 66476 epsilon: 0.6515507458552663
Training...
episode: 477 no of steps: 142 score: -15.0 avg score: -0.1056 memorylength: 66618 epsilon: 0.6509646139918989
Training...
episode: 478 no of steps: 132 score: 148.0 avg score: 1.1212 memorylength: 66750 epsilon: 0.6503790094098965
Training...
episode: 479 no of steps: 146 score: 54.0 avg score: 0.3699 memorylength: 66896 epsilon: 0.649793931634919
Training...
episode: 480 no of steps: 132 score: -127.0 avg score: -0.9621 memorylength: 67028 epsilon: 0.6492093801930537
Training...
episode: 481 no of steps: 131 score: 104.0 avg score: 0.7939 memorylength: 67159 epsilon: 0.6486253546108136
Training...
episode: 482 no of steps: 134 score: -108.0 avg score: -0.806 memorylength: 67293 epsilon: 0.6480418544151383
Training...
episode: 483 no of steps: 149 score: -41.0 avg score: -0.2752 memorylength: 67442 epsilon: 0.6474588791333923
Training...
episode: 484 no of steps: 123 score: 234.0 avg score: 1.9024 memorylength: 67565 epsilon: 0.6468764282933656
Training...
episode: 485 no of steps: 118 score: -54.0 avg score: -0.4576 memorylength: 67683 epsilon: 0.6462945014232733
Training...
episode: 486 no of steps: 132 score: -153.0 avg score: -1.1591 memorylength: 67815 epsilon: 0.6457130980517541
Training...
episode: 487 no of steps: 132 score: 49.0 avg score: 0.3712 memorylength: 67947 epsilon: 0.6451322177078718
Training...
episode: 488 no of steps: 136 score: -74.0 avg score: -0.5441 memorylength: 68083 epsilon: 0.6445518599211129
Training...
episode: 489 no of steps: 123 score: 301.0 avg score: 2.4472 memorylength: 68206 epsilon: 0.6439720242213877
Training...
episode: 490 no of steps: 138 score: 135.0 avg score: 0.9783 memorylength: 68344 epsilon: 0.6433927101390292
Training...
episode: 491 no of steps: 129 score: -136.0 avg score: -1.0543 memorylength: 68473 epsilon: 0.642813917204793
Training...
episode: 492 no of steps: 129 score: -227.0 avg score: -1.7597 memorylength: 68602 epsilon: 0.6422356449498567
Training...
episode: 493 no of steps: 132 score: -119.0 avg score: -0.9015 memorylength: 68734 epsilon: 0.64165789290582
Training...
episode: 494 no of steps: 134 score: -65.0 avg score: -0.4851 memorylength: 68868 epsilon: 0.6410806606047035
Training...
episode: 495 no of steps: 149 score: -21.0 avg score: -0.1409 memorylength: 69017 epsilon: 0.6405039475789488
Training...
episode: 496 no of steps: 134 score: 183.0 avg score: 1.3657 memorylength: 69151 epsilon: 0.6399277533614188
Training...
episode: 497 no of steps: 138 score: 183.0 avg score: 1.3261 memorylength: 69289 epsilon: 0.6393520774853958
Training...
episode: 498 no of steps: 140 score: 45.0 avg score: 0.3214 memorylength: 69429 epsilon: 0.6387769194845825
Training...
episode: 499 no of steps: 139 score: 224.0 avg score: 1.6115 memorylength: 69568 epsilon: 0.6382022788931008
Training...
episode: 500 no of steps: 137 score: -147.0 avg score: -1.073 memorylength: 69705 epsilon: 0.6376281552454919
saving states...
Training...
episode: 501 no of steps: 123 score: -47.0 avg score: -0.3821 memorylength: 69828 epsilon: 0.6370545480767154
Training...
episode: 502 no of steps: 128 score: -153.0 avg score: -1.1953 memorylength: 69956 epsilon: 0.6364814569221494
Training...
episode: 503 no of steps: 112 score: -132.0 avg score: -1.1786 memorylength: 70068 epsilon: 0.6359088813175904
Training...
episode: 504 no of steps: 146 score: -27.0 avg score: -0.1849 memorylength: 70214 epsilon: 0.6353368207992519
Training...
episode: 505 no of steps: 142 score: 144.0 avg score: 1.0141 memorylength: 70356 epsilon: 0.6347652749037649
Training...
episode: 506 no of steps: 127 score: 67.0 avg score: 0.5276 memorylength: 70483 epsilon: 0.6341942431681772
Training...
episode: 507 no of steps: 143 score: -161.0 avg score: -1.1259 memorylength: 70626 epsilon: 0.633623725129953
Training...
episode: 508 no of steps: 151 score: -298.0 avg score: -1.9735 memorylength: 70777 epsilon: 0.6330537203269727
Training...
episode: 509 no of steps: 152 score: -171.0 avg score: -1.125 memorylength: 70929 epsilon: 0.6324842282975324
Training...
episode: 510 no of steps: 148 score: 153.0 avg score: 1.0338 memorylength: 71077 epsilon: 0.6319152485803434
Training...
episode: 511 no of steps: 141 score: -54.0 avg score: -0.383 memorylength: 71218 epsilon: 0.6313467807145324
Training...
episode: 512 no of steps: 151 score: -217.0 avg score: -1.4371 memorylength: 71369 epsilon: 0.63077882423964
Training...
episode: 513 no of steps: 153 score: -5.0 avg score: -0.0327 memorylength: 71522 epsilon: 0.6302113786956217
Training...
episode: 514 no of steps: 139 score: 12.0 avg score: 0.0863 memorylength: 71661 epsilon: 0.6296444436228466
Training...
episode: 515 no of steps: 132 score: 26.0 avg score: 0.197 memorylength: 71793 epsilon: 0.629078018562097
Training...
episode: 516 no of steps: 145 score: -255.0 avg score: -1.7586 memorylength: 71938 epsilon: 0.6285121030545688
Training...
episode: 517 no of steps: 155 score: 76.0 avg score: 0.4903 memorylength: 72093 epsilon: 0.6279466966418704
Training...
episode: 518 no of steps: 141 score: -540.0 avg score: -3.8298 memorylength: 72234 epsilon: 0.6273817988660224
Training...
episode: 519 no of steps: 130 score: -5.0 avg score: -0.0385 memorylength: 72364 epsilon: 0.6268174092694577
Training...
episode: 520 no of steps: 142 score: 22.0 avg score: 0.1549 memorylength: 72506 epsilon: 0.6262535273950207
Training...
episode: 521 no of steps: 134 score: 138.0 avg score: 1.0299 memorylength: 72640 epsilon: 0.6256901527859671
Training...
episode: 522 no of steps: 144 score: -53.0 avg score: -0.3681 memorylength: 72784 epsilon: 0.6251272849859633
Training...
episode: 523 no of steps: 137 score: -150.0 avg score: -1.0949 memorylength: 72921 epsilon: 0.6245649235390864
Training...
episode: 524 no of steps: 130 score: -117.0 avg score: -0.9 memorylength: 73051 epsilon: 0.6240030679898236
Training...
episode: 525 no of steps: 147 score: 485.0 avg score: 3.2993 memorylength: 73198 epsilon: 0.623441717883072
Training...
episode: 526 no of steps: 123 score: -24.0 avg score: -0.1951 memorylength: 73321 epsilon: 0.6228808727641378
Training...
episode: 527 no of steps: 139 score: 85.0 avg score: 0.6115 memorylength: 73460 epsilon: 0.6223205321787365
Training...
episode: 528 no of steps: 141 score: 229.0 avg score: 1.6241 memorylength: 73601 epsilon: 0.6217606956729921
Training...
episode: 529 no of steps: 141 score: -87.0 avg score: -0.617 memorylength: 73742 epsilon: 0.6212013627934373
Training...
episode: 530 no of steps: 147 score: -48.0 avg score: -0.3265 memorylength: 73889 epsilon: 0.620642533087012
Training...
episode: 531 no of steps: 122 score: -14.0 avg score: -0.1148 memorylength: 74011 epsilon: 0.6200842061010645
Training...
episode: 532 no of steps: 141 score: 25.0 avg score: 0.1773 memorylength: 74152 epsilon: 0.6195263813833496
Training...
episode: 533 no of steps: 155 score: -102.0 avg score: -0.6581 memorylength: 74307 epsilon: 0.6189690584820295
Training...
episode: 534 no of steps: 142 score: 62.0 avg score: 0.4366 memorylength: 74449 epsilon: 0.6184122369456726
Training...
episode: 535 no of steps: 124 score: -20.0 avg score: -0.1613 memorylength: 74573 epsilon: 0.6178559163232532
Training...
episode: 536 no of steps: 127 score: 40.0 avg score: 0.315 memorylength: 74700 epsilon: 0.6173000961641516
Training...
episode: 537 no of steps: 147 score: -134.0 avg score: -0.9116 memorylength: 74847 epsilon: 0.6167447760181537
Training...
episode: 538 no of steps: 137 score: -41.0 avg score: -0.2993 memorylength: 74984 epsilon: 0.6161899554354501
Training...
episode: 539 no of steps: 140 score: -221.0 avg score: -1.5786 memorylength: 75124 epsilon: 0.6156356339666358
Training...
episode: 540 no of steps: 144 score: 58.0 avg score: 0.4028 memorylength: 75268 epsilon: 0.6150818111627107
Training...
episode: 541 no of steps: 144 score: 120.0 avg score: 0.8333 memorylength: 75412 epsilon: 0.6145284865750781
Training...
episode: 542 no of steps: 139 score: -153.0 avg score: -1.1007 memorylength: 75551 epsilon: 0.613975659755545
Training...
episode: 543 no of steps: 129 score: -37.0 avg score: -0.2868 memorylength: 75680 epsilon: 0.6134233302563219
Training...
episode: 544 no of steps: 137 score: 131.0 avg score: 0.9562 memorylength: 75817 epsilon: 0.6128714976300218
Training...
episode: 545 no of steps: 130 score: 40.0 avg score: 0.3077 memorylength: 75947 epsilon: 0.6123201614296602
Training...
episode: 546 no of steps: 129 score: -119.0 avg score: -0.9225 memorylength: 76076 epsilon: 0.6117693212086546
Training...
episode: 547 no of steps: 134 score: -122.0 avg score: -0.9104 memorylength: 76210 epsilon: 0.6112189765208246
Training...
episode: 548 no of steps: 147 score: -2.0 avg score: -0.0136 memorylength: 76357 epsilon: 0.6106691269203909
Training...
episode: 549 no of steps: 133 score: 4.0 avg score: 0.0301 memorylength: 76490 epsilon: 0.6101197719619753
Training...
episode: 550 no of steps: 138 score: -117.0 avg score: -0.8478 memorylength: 76628 epsilon: 0.6095709112006003
saving states...
Training...
episode: 551 no of steps: 130 score: 147.0 avg score: 1.1308 memorylength: 76758 epsilon: 0.6090225441916884
Training...
episode: 552 no of steps: 150 score: 31.0 avg score: 0.2067 memorylength: 76908 epsilon: 0.6084746704910627
Training...
episode: 553 no of steps: 137 score: 33.0 avg score: 0.2409 memorylength: 77045 epsilon: 0.6079272896549452
Training...
episode: 554 no of steps: 134 score: 192.0 avg score: 1.4328 memorylength: 77179 epsilon: 0.6073804012399575
Training...
episode: 555 no of steps: 143 score: -91.0 avg score: -0.6364 memorylength: 77322 epsilon: 0.6068340048031199
Training...
episode: 556 no of steps: 132 score: -162.0 avg score: -1.2273 memorylength: 77454 epsilon: 0.6062880999018513
Training...
episode: 557 no of steps: 133 score: -77.0 avg score: -0.5789 memorylength: 77587 epsilon: 0.6057426860939685
Training...
episode: 558 no of steps: 154 score: -222.0 avg score: -1.4416 memorylength: 77741 epsilon: 0.6051977629376866
Training...
episode: 559 no of steps: 134 score: -134.0 avg score: -1.0 memorylength: 77875 epsilon: 0.6046533299916176
Training...
episode: 560 no of steps: 134 score: 193.0 avg score: 1.4403 memorylength: 78009 epsilon: 0.6041093868147709
Training...
episode: 561 no of steps: 131 score: 39.0 avg score: 0.2977 memorylength: 78140 epsilon: 0.6035659329665525
Training...
episode: 562 no of steps: 146 score: -173.0 avg score: -1.1849 memorylength: 78286 epsilon: 0.6030229680067646
Training...
episode: 563 no of steps: 130 score: 172.0 avg score: 1.3231 memorylength: 78416 epsilon: 0.6024804914956057
Training...
episode: 564 no of steps: 140 score: 139.0 avg score: 0.9929 memorylength: 78556 epsilon: 0.6019385029936698
Training...
episode: 565 no of steps: 146 score: -221.0 avg score: -1.5137 memorylength: 78702 epsilon: 0.601397002061946
Training...
episode: 566 no of steps: 126 score: 192.0 avg score: 1.5238 memorylength: 78828 epsilon: 0.6008559882618187
Training...
episode: 567 no of steps: 138 score: 99.0 avg score: 0.7174 memorylength: 78966 epsilon: 0.6003154611550667
Training...
episode: 568 no of steps: 140 score: -7.0 avg score: -0.05 memorylength: 79106 epsilon: 0.599775420303863
Training...
episode: 569 no of steps: 148 score: 15.0 avg score: 0.1014 memorylength: 79254 epsilon: 0.5992358652707743
Training...
episode: 570 no of steps: 134 score: 127.0 avg score: 0.9478 memorylength: 79388 epsilon: 0.5986967956187613
Training...
episode: 571 no of steps: 138 score: -305.0 avg score: -2.2101 memorylength: 79526 epsilon: 0.5981582109111773
Training...
episode: 572 no of steps: 150 score: 432.0 avg score: 2.88 memorylength: 79676 epsilon: 0.5976201107117687
Training...
episode: 573 no of steps: 135 score: 269.0 avg score: 1.9926 memorylength: 79811 epsilon: 0.5970824945846744
Training...
episode: 574 no of steps: 144 score: 302.0 avg score: 2.0972 memorylength: 79955 epsilon: 0.5965453620944253
Training...
episode: 575 no of steps: 130 score: -118.0 avg score: -0.9077 memorylength: 80085 epsilon: 0.5960087128059439
Training...
episode: 576 no of steps: 129 score: 109.0 avg score: 0.845 memorylength: 80214 epsilon: 0.5954725462845444
Training...
episode: 577 no of steps: 137 score: 153.0 avg score: 1.1168 memorylength: 80351 epsilon: 0.5949368620959319
Training...
episode: 578 no of steps: 133 score: -88.0 avg score: -0.6617 memorylength: 80484 epsilon: 0.5944016598062021
Training...
episode: 579 no of steps: 131 score: 284.0 avg score: 2.1679 memorylength: 80615 epsilon: 0.5938669389818412
Training...
episode: 580 no of steps: 145 score: 87.0 avg score: 0.6 memorylength: 80760 epsilon: 0.5933326991897251
Training...
episode: 581 no of steps: 141 score: 295.0 avg score: 2.0922 memorylength: 80901 epsilon: 0.5927989399971196
Training...
episode: 582 no of steps: 132 score: 9.0 avg score: 0.0682 memorylength: 81033 epsilon: 0.5922656609716802
Training...
episode: 583 no of steps: 122 score: -68.0 avg score: -0.5574 memorylength: 81155 epsilon: 0.5917328616814502
Training...
episode: 584 no of steps: 141 score: 97.0 avg score: 0.6879 memorylength: 81296 epsilon: 0.5912005416948625
Training...
episode: 585 no of steps: 135 score: -82.0 avg score: -0.6074 memorylength: 81431 epsilon: 0.5906687005807376
Training...
episode: 586 no of steps: 117 score: -297.0 avg score: -2.5385 memorylength: 81548 epsilon: 0.5901373379082846
Training...
episode: 587 no of steps: 141 score: -62.0 avg score: -0.4397 memorylength: 81689 epsilon: 0.5896064532470994
Training...
episode: 588 no of steps: 129 score: -102.0 avg score: -0.7907 memorylength: 81818 epsilon: 0.5890760461671655
Training...
episode: 589 no of steps: 143 score: -258.0 avg score: -1.8042 memorylength: 81961 epsilon: 0.588546116238853
Training...
episode: 590 no of steps: 140 score: -303.0 avg score: -2.1643 memorylength: 82101 epsilon: 0.5880166630329189
Training...
episode: 591 no of steps: 140 score: -433.0 avg score: -3.0929 memorylength: 82241 epsilon: 0.5874876861205057
Training...
episode: 592 no of steps: 125 score: -36.0 avg score: -0.288 memorylength: 82366 epsilon: 0.5869591850731425
Training...
episode: 593 no of steps: 138 score: 166.0 avg score: 1.2029 memorylength: 82504 epsilon: 0.5864311594627429
Training...
episode: 594 no of steps: 144 score: 17.0 avg score: 0.1181 memorylength: 82648 epsilon: 0.5859036088616068
Training...
episode: 595 no of steps: 135 score: -149.0 avg score: -1.1037 memorylength: 82783 epsilon: 0.5853765328424174
Training...
episode: 596 no of steps: 139 score: -50.0 avg score: -0.3597 memorylength: 82922 epsilon: 0.5848499309782438
Training...
episode: 597 no of steps: 129 score: 44.0 avg score: 0.3411 memorylength: 83051 epsilon: 0.5843238028425382
Training...
episode: 598 no of steps: 126 score: 89.0 avg score: 0.7063 memorylength: 83177 epsilon: 0.5837981480091365
Training...
episode: 599 no of steps: 152 score: 184.0 avg score: 1.2105 memorylength: 83329 epsilon: 0.5832729660522588
Training...
episode: 600 no of steps: 118 score: -214.0 avg score: -1.8136 memorylength: 83447 epsilon: 0.5827482565465071
saving states...
Training...
episode: 601 no of steps: 129 score: -213.0 avg score: -1.6512 memorylength: 83576 epsilon: 0.5822240190668673
Training...
episode: 602 no of steps: 136 score: -222.0 avg score: -1.6324 memorylength: 83712 epsilon: 0.5817002531887063
Training...
episode: 603 no of steps: 129 score: -64.0 avg score: -0.4961 memorylength: 83841 epsilon: 0.5811769584877743
Training...
episode: 604 no of steps: 126 score: 126.0 avg score: 1.0 memorylength: 83967 epsilon: 0.5806541345402023
Training...
episode: 605 no of steps: 142 score: 9.0 avg score: 0.0634 memorylength: 84109 epsilon: 0.5801317809225031
Training...
episode: 606 no of steps: 131 score: -216.0 avg score: -1.6489 memorylength: 84240 epsilon: 0.5796098972115699
Training...
episode: 607 no of steps: 131 score: 26.0 avg score: 0.1985 memorylength: 84371 epsilon: 0.579088482984677
Training...
episode: 608 no of steps: 145 score: 119.0 avg score: 0.8207 memorylength: 84516 epsilon: 0.5785675378194789
Training...
episode: 609 no of steps: 145 score: -150.0 avg score: -1.0345 memorylength: 84661 epsilon: 0.5780470612940101
Training...
episode: 610 no of steps: 128 score: -161.0 avg score: -1.2578 memorylength: 84789 epsilon: 0.5775270529866843
Training...
episode: 611 no of steps: 145 score: 116.0 avg score: 0.8 memorylength: 84934 epsilon: 0.577007512476295
Training...
episode: 612 no of steps: 135 score: 80.0 avg score: 0.5926 memorylength: 85069 epsilon: 0.5764884393420141
Training...
episode: 613 no of steps: 131 score: -251.0 avg score: -1.916 memorylength: 85200 epsilon: 0.5759698331633927
Training...
episode: 614 no of steps: 119 score: -207.0 avg score: -1.7395 memorylength: 85319 epsilon: 0.5754516935203593
Training...
episode: 615 no of steps: 125 score: -155.0 avg score: -1.24 memorylength: 85444 epsilon: 0.5749340199932211
Training...
episode: 616 no of steps: 145 score: 241.0 avg score: 1.6621 memorylength: 85589 epsilon: 0.5744168121626625
Training...
episode: 617 no of steps: 129 score: 56.0 avg score: 0.4341 memorylength: 85718 epsilon: 0.573900069609745
Training...
episode: 618 no of steps: 119 score: 103.0 avg score: 0.8655 memorylength: 85837 epsilon: 0.5733837919159072
Training...
episode: 619 no of steps: 142 score: 81.0 avg score: 0.5704 memorylength: 85979 epsilon: 0.5728679786629641
Training...
episode: 620 no of steps: 133 score: -117.0 avg score: -0.8797 memorylength: 86112 epsilon: 0.572352629433107
Training...
episode: 621 no of steps: 117 score: -4.0 avg score: -0.0342 memorylength: 86229 epsilon: 0.571837743808903
Training...
episode: 622 no of steps: 120 score: -35.0 avg score: -0.2917 memorylength: 86349 epsilon: 0.5713233213732944
Training...
episode: 623 no of steps: 141 score: 98.0 avg score: 0.695 memorylength: 86490 epsilon: 0.5708093617095995
Training...
episode: 624 no of steps: 125 score: -186.0 avg score: -1.488 memorylength: 86615 epsilon: 0.5702958644015105
Training...
episode: 625 no of steps: 139 score: -177.0 avg score: -1.2734 memorylength: 86754 epsilon: 0.5697828290330947
Training...
episode: 626 no of steps: 129 score: -105.0 avg score: -0.814 memorylength: 86883 epsilon: 0.5692702551887937
Training...
episode: 627 no of steps: 140 score: -86.0 avg score: -0.6143 memorylength: 87023 epsilon: 0.5687581424534223
Training...
episode: 628 no of steps: 147 score: 412.0 avg score: 2.8027 memorylength: 87170 epsilon: 0.5682464904121692
Training...
episode: 629 no of steps: 127 score: 88.0 avg score: 0.6929 memorylength: 87297 epsilon: 0.5677352986505966
Training...
episode: 630 no of steps: 134 score: 11.0 avg score: 0.0821 memorylength: 87431 epsilon: 0.5672245667546385
Training...
episode: 631 no of steps: 129 score: 78.0 avg score: 0.6047 memorylength: 87560 epsilon: 0.5667142943106025
Training...
episode: 632 no of steps: 140 score: -5.0 avg score: -0.0357 memorylength: 87700 epsilon: 0.5662044809051678
Training...
episode: 633 no of steps: 140 score: 44.0 avg score: 0.3143 memorylength: 87840 epsilon: 0.5656951261253855
Training...
episode: 634 no of steps: 122 score: -9.0 avg score: -0.0738 memorylength: 87962 epsilon: 0.5651862295586783
Training...
episode: 635 no of steps: 127 score: 103.0 avg score: 0.811 memorylength: 88089 epsilon: 0.5646777907928396
Training...
episode: 636 no of steps: 122 score: -47.0 avg score: -0.3852 memorylength: 88211 epsilon: 0.5641698094160343
Training...
episode: 637 no of steps: 133 score: 535.0 avg score: 4.0226 memorylength: 88344 epsilon: 0.5636622850167975
Training...
episode: 638 no of steps: 129 score: -176.0 avg score: -1.3643 memorylength: 88473 epsilon: 0.5631552171840344
Training...
episode: 639 no of steps: 135 score: 264.0 avg score: 1.9556 memorylength: 88608 epsilon: 0.5626486055070196
Training...
episode: 640 no of steps: 125 score: -10.0 avg score: -0.08 memorylength: 88733 epsilon: 0.562142449575398
Training...
episode: 641 no of steps: 126 score: -168.0 avg score: -1.3333 memorylength: 88859 epsilon: 0.5616367489791833
Training...
episode: 642 no of steps: 108 score: 45.0 avg score: 0.4167 memorylength: 88967 epsilon: 0.5611315033087578
Training...
episode: 643 no of steps: 137 score: -116.0 avg score: -0.8467 memorylength: 89104 epsilon: 0.5606267121548725
Training...
episode: 644 no of steps: 134 score: -185.0 avg score: -1.3806 memorylength: 89238 epsilon: 0.5601223751086467
Training...
episode: 645 no of steps: 134 score: 191.0 avg score: 1.4254 memorylength: 89372 epsilon: 0.5596184917615673
Training...
episode: 646 no of steps: 152 score: 323.0 avg score: 2.125 memorylength: 89524 epsilon: 0.5591150617054885
Training...
episode: 647 no of steps: 138 score: 40.0 avg score: 0.2899 memorylength: 89662 epsilon: 0.5586120845326324
Training...
episode: 648 no of steps: 147 score: -218.0 avg score: -1.483 memorylength: 89809 epsilon: 0.5581095598355871
Training...
episode: 649 no of steps: 133 score: -24.0 avg score: -0.1805 memorylength: 89942 epsilon: 0.5576074872073078
Training...
episode: 650 no of steps: 125 score: -49.0 avg score: -0.392 memorylength: 90067 epsilon: 0.5571058662411154
saving states...
Training...
episode: 651 no of steps: 147 score: -225.0 avg score: -1.5306 memorylength: 90214 epsilon: 0.556604696530697
Training...
episode: 652 no of steps: 132 score: -195.0 avg score: -1.4773 memorylength: 90346 epsilon: 0.5561039776701051
Training...
episode: 653 no of steps: 130 score: 58.0 avg score: 0.4462 memorylength: 90476 epsilon: 0.5556037092537575
Training...
episode: 654 no of steps: 149 score: -117.0 avg score: -0.7852 memorylength: 90625 epsilon: 0.5551038908764366
Training...
episode: 655 no of steps: 116 score: -165.0 avg score: -1.4224 memorylength: 90741 epsilon: 0.5546045221332897
Training...
episode: 656 no of steps: 130 score: -340.0 avg score: -2.6154 memorylength: 90871 epsilon: 0.5541056026198278
Training...
episode: 657 no of steps: 133 score: 279.0 avg score: 2.0977 memorylength: 91004 epsilon: 0.5536071319319263
Training...
episode: 658 no of steps: 142 score: -29.0 avg score: -0.2042 memorylength: 91146 epsilon: 0.5531091096658239
Training...
episode: 659 no of steps: 126 score: 444.0 avg score: 3.5238 memorylength: 91272 epsilon: 0.5526115354181224
Training...
episode: 660 no of steps: 148 score: -45.0 avg score: -0.3041 memorylength: 91420 epsilon: 0.5521144087857865
Training...
episode: 661 no of steps: 146 score: 279.0 avg score: 1.911 memorylength: 91566 epsilon: 0.5516177293661441
Training...
episode: 662 no of steps: 127 score: 23.0 avg score: 0.1811 memorylength: 91693 epsilon: 0.5511214967568845
Training...
episode: 663 no of steps: 138 score: 16.0 avg score: 0.1159 memorylength: 91831 epsilon: 0.5506257105560591
Training...
episode: 664 no of steps: 132 score: -161.0 avg score: -1.2197 memorylength: 91963 epsilon: 0.5501303703620815
Training...
episode: 665 no of steps: 136 score: -72.0 avg score: -0.5294 memorylength: 92099 epsilon: 0.5496354757737257
Training...
episode: 666 no of steps: 132 score: -255.0 avg score: -1.9318 memorylength: 92231 epsilon: 0.5491410263901274
Training...
episode: 667 no of steps: 133 score: 38.0 avg score: 0.2857 memorylength: 92364 epsilon: 0.5486470218107823
Training...
episode: 668 no of steps: 136 score: 173.0 avg score: 1.2721 memorylength: 92500 epsilon: 0.5481534616355468
Training...
episode: 669 no of steps: 148 score: 20.0 avg score: 0.1351 memorylength: 92648 epsilon: 0.547660345464637
Training...
episode: 670 no of steps: 140 score: 387.0 avg score: 2.7643 memorylength: 92788 epsilon: 0.5471676728986289
Training...
episode: 671 no of steps: 134 score: 324.0 avg score: 2.4179 memorylength: 92922 epsilon: 0.5466754435384578
Training...
episode: 672 no of steps: 143 score: -86.0 avg score: -0.6014 memorylength: 93065 epsilon: 0.5461836569854175
Training...
episode: 673 no of steps: 131 score: 245.0 avg score: 1.8702 memorylength: 93196 epsilon: 0.5456923128411613
Training...
episode: 674 no of steps: 126 score: -27.0 avg score: -0.2143 memorylength: 93322 epsilon: 0.5452014107077002
Training...
episode: 675 no of steps: 133 score: 202.0 avg score: 1.5188 memorylength: 93455 epsilon: 0.5447109501874036
Training...
episode: 676 no of steps: 115 score: 120.0 avg score: 1.0435 memorylength: 93570 epsilon: 0.5442209308829982
Training...
episode: 677 no of steps: 136 score: -263.0 avg score: -1.9338 memorylength: 93706 epsilon: 0.5437313523975684
Training...
episode: 678 no of steps: 122 score: -352.0 avg score: -2.8852 memorylength: 93828 epsilon: 0.5432422143345558
Training...
episode: 679 no of steps: 131 score: -158.0 avg score: -1.2061 memorylength: 93959 epsilon: 0.5427535162977583
Training...
episode: 680 no of steps: 126 score: -6.0 avg score: -0.0476 memorylength: 94085 epsilon: 0.5422652578913307
Training...
episode: 681 no of steps: 139 score: 251.0 avg score: 1.8058 memorylength: 94224 epsilon: 0.5417774387197835
Training...
episode: 682 no of steps: 129 score: 12.0 avg score: 0.093 memorylength: 94353 epsilon: 0.5412900583879832
Training...
episode: 683 no of steps: 133 score: 120.0 avg score: 0.9023 memorylength: 94486 epsilon: 0.5408031165011516
Training...
episode: 684 no of steps: 123 score: 198.0 avg score: 1.6098 memorylength: 94609 epsilon: 0.5403166126648659
Training...
episode: 685 no of steps: 139 score: 148.0 avg score: 1.0647 memorylength: 94748 epsilon: 0.5398305464850579
Training...
episode: 686 no of steps: 125 score: 259.0 avg score: 2.072 memorylength: 94873 epsilon: 0.5393449175680141
Training...
episode: 687 no of steps: 130 score: -108.0 avg score: -0.8308 memorylength: 95003 epsilon: 0.5388597255203748
Training...
episode: 688 no of steps: 139 score: 52.0 avg score: 0.3741 memorylength: 95142 epsilon: 0.5383749699491345
Training...
episode: 689 no of steps: 145 score: 110.0 avg score: 0.7586 memorylength: 95287 epsilon: 0.5378906504616412
Training...
episode: 690 no of steps: 120 score: -158.0 avg score: -1.3167 memorylength: 95407 epsilon: 0.5374067666655961
Training...
episode: 691 no of steps: 137 score: 16.0 avg score: 0.1168 memorylength: 95544 epsilon: 0.5369233181690531
Training...
episode: 692 no of steps: 123 score: -15.0 avg score: -0.122 memorylength: 95667 epsilon: 0.5364403045804194
Training...
episode: 693 no of steps: 146 score: 337.0 avg score: 2.3082 memorylength: 95813 epsilon: 0.5359577255084534
Training...
episode: 694 no of steps: 137 score: -163.0 avg score: -1.1898 memorylength: 95950 epsilon: 0.5354755805622665
Training...
episode: 695 no of steps: 108 score: 277.0 avg score: 2.5648 memorylength: 96058 epsilon: 0.5349938693513208
Training...
episode: 696 no of steps: 144 score: 63.0 avg score: 0.4375 memorylength: 96202 epsilon: 0.5345125914854305
Training...
episode: 697 no of steps: 137 score: 136.0 avg score: 0.9927 memorylength: 96339 epsilon: 0.5340317465747605
Training...
episode: 698 no of steps: 135 score: 270.0 avg score: 2.0 memorylength: 96474 epsilon: 0.5335513342298263
Training...
episode: 699 no of steps: 125 score: 17.0 avg score: 0.136 memorylength: 96599 epsilon: 0.5330713540614938
Training...
episode: 700 no of steps: 133 score: 153.0 avg score: 1.1504 memorylength: 96732 epsilon: 0.5325918056809792
saving states...
Training...
episode: 701 no of steps: 131 score: 73.0 avg score: 0.5573 memorylength: 96863 epsilon: 0.5321126886998482
Training...
episode: 702 no of steps: 138 score: 207.0 avg score: 1.5 memorylength: 97001 epsilon: 0.531634002730016
Training...
episode: 703 no of steps: 143 score: 70.0 avg score: 0.4895 memorylength: 97144 epsilon: 0.5311557473837472
Training...
episode: 704 no of steps: 134 score: 100.0 avg score: 0.7463 memorylength: 97278 epsilon: 0.5306779222736545
Training...
episode: 705 no of steps: 142 score: -8.0 avg score: -0.0563 memorylength: 97420 epsilon: 0.5302005270126998
Training...
episode: 706 no of steps: 140 score: -89.0 avg score: -0.6357 memorylength: 97560 epsilon: 0.529723561214193
Training...
episode: 707 no of steps: 123 score: -241.0 avg score: -1.9593 memorylength: 97683 epsilon: 0.5292470244917914
Training...
episode: 708 no of steps: 135 score: 36.0 avg score: 0.2667 memorylength: 97818 epsilon: 0.5287709164595007
Training...
episode: 709 no of steps: 140 score: -243.0 avg score: -1.7357 memorylength: 97958 epsilon: 0.528295236731673
Training...
episode: 710 no of steps: 123 score: -249.0 avg score: -2.0244 memorylength: 98081 epsilon: 0.5278199849230079
Training...
episode: 711 no of steps: 118 score: 373.0 avg score: 3.161 memorylength: 98199 epsilon: 0.5273451606485513
Training...
episode: 712 no of steps: 136 score: -135.0 avg score: -0.9926 memorylength: 98335 epsilon: 0.5268707635236957
Training...
episode: 713 no of steps: 144 score: 53.0 avg score: 0.3681 memorylength: 98479 epsilon: 0.5263967931641791
Training...
episode: 714 no of steps: 124 score: 164.0 avg score: 1.3226 memorylength: 98603 epsilon: 0.5259232491860857
Training...
episode: 715 no of steps: 137 score: 76.0 avg score: 0.5547 memorylength: 98740 epsilon: 0.5254501312058448
Training...
episode: 716 no of steps: 134 score: -227.0 avg score: -1.694 memorylength: 98874 epsilon: 0.5249774388402307
Training...
episode: 717 no of steps: 143 score: 225.0 avg score: 1.5734 memorylength: 99017 epsilon: 0.5245051717063628
Training...
episode: 718 no of steps: 142 score: 71.0 avg score: 0.5 memorylength: 99159 epsilon: 0.5240333294217046
Training...
episode: 719 no of steps: 135 score: 278.0 avg score: 2.0593 memorylength: 99294 epsilon: 0.5235619116040637
Training...
episode: 720 no of steps: 137 score: -32.0 avg score: -0.2336 memorylength: 99431 epsilon: 0.5230909178715917
Training...
episode: 721 no of steps: 133 score: 75.0 avg score: 0.5639 memorylength: 99564 epsilon: 0.5226203478427837
Training...
episode: 722 no of steps: 121 score: 44.0 avg score: 0.3636 memorylength: 99685 epsilon: 0.5221502011364779
Training...
episode: 723 no of steps: 133 score: -97.0 avg score: -0.7293 memorylength: 99818 epsilon: 0.5216804773718555
Training...
episode: 724 no of steps: 148 score: -7.0 avg score: -0.0473 memorylength: 99966 epsilon: 0.5212111761684403
Training...
episode: 725 no of steps: 129 score: -5.0 avg score: -0.0388 memorylength: 100095 epsilon: 0.5207422971460981
Training...
episode: 726 no of steps: 132 score: -9.0 avg score: -0.0682 memorylength: 100227 epsilon: 0.520273839925037
Training...
episode: 727 no of steps: 155 score: 210.0 avg score: 1.3548 memorylength: 100382 epsilon: 0.5198058041258065
Training...
episode: 728 no of steps: 123 score: 76.0 avg score: 0.6179 memorylength: 100505 epsilon: 0.5193381893692977
Training...
episode: 729 no of steps: 154 score: 225.0 avg score: 1.461 memorylength: 100659 epsilon: 0.5188709952767425
Training...
episode: 730 no of steps: 120 score: 162.0 avg score: 1.35 memorylength: 100779 epsilon: 0.5184042214697138
Training...
episode: 731 no of steps: 135 score: -312.0 avg score: -2.3111 memorylength: 100914 epsilon: 0.5179378675701248
Training...
episode: 732 no of steps: 142 score: -15.0 avg score: -0.1056 memorylength: 101056 epsilon: 0.5174719332002288
Training...
episode: 733 no of steps: 140 score: 188.0 avg score: 1.3429 memorylength: 101196 epsilon: 0.5170064179826187
Training...
episode: 734 no of steps: 144 score: 117.0 avg score: 0.8125 memorylength: 101340 epsilon: 0.5165413215402275
Training...
episode: 735 no of steps: 149 score: 493.0 avg score: 3.3087 memorylength: 101489 epsilon: 0.5160766434963268
Training...
episode: 736 no of steps: 137 score: -249.0 avg score: -1.8175 memorylength: 101626 epsilon: 0.5156123834745273
Training...
episode: 737 no of steps: 127 score: -118.0 avg score: -0.9291 memorylength: 101753 epsilon: 0.5151485410987788
Training...
episode: 738 no of steps: 125 score: 31.0 avg score: 0.248 memorylength: 101878 epsilon: 0.5146851159933685
Training...
episode: 739 no of steps: 144 score: -254.0 avg score: -1.7639 memorylength: 102022 epsilon: 0.5142221077829222
Training...
episode: 740 no of steps: 140 score: 196.0 avg score: 1.4 memorylength: 102162 epsilon: 0.5137595160924032
Training...
episode: 741 no of steps: 114 score: -387.0 avg score: -3.3947 memorylength: 102276 epsilon: 0.5132973405471124
Training...
episode: 742 no of steps: 142 score: 26.0 avg score: 0.1831 memorylength: 102418 epsilon: 0.5128355807726873
Training...
episode: 743 no of steps: 133 score: 223.0 avg score: 1.6767 memorylength: 102551 epsilon: 0.5123742363951025
Training...
episode: 744 no of steps: 143 score: 374.0 avg score: 2.6154 memorylength: 102694 epsilon: 0.5119133070406692
Training...
episode: 745 no of steps: 153 score: 27.0 avg score: 0.1765 memorylength: 102847 epsilon: 0.5114527923360344
Training...
episode: 746 no of steps: 137 score: 372.0 avg score: 2.7153 memorylength: 102984 epsilon: 0.5109926919081812
Training...
episode: 747 no of steps: 137 score: 94.0 avg score: 0.6861 memorylength: 103121 epsilon: 0.5105330053844284
Training...
episode: 748 no of steps: 134 score: 54.0 avg score: 0.403 memorylength: 103255 epsilon: 0.5100737323924297
Training...
episode: 749 no of steps: 129 score: 67.0 avg score: 0.5194 memorylength: 103384 epsilon: 0.509614872560174
Training...
episode: 750 no of steps: 128 score: 310.0 avg score: 2.4219 memorylength: 103512 epsilon: 0.509156425515985
saving states...
Training...
episode: 751 no of steps: 141 score: 189.0 avg score: 1.3404 memorylength: 103653 epsilon: 0.5086983908885203
Training...
episode: 752 no of steps: 132 score: 63.0 avg score: 0.4773 memorylength: 103785 epsilon: 0.508240768306772
Training...
episode: 753 no of steps: 132 score: -95.0 avg score: -0.7197 memorylength: 103917 epsilon: 0.5077835574000655
Training...
episode: 754 no of steps: 142 score: 84.0 avg score: 0.5915 memorylength: 104059 epsilon: 0.5073267577980604
Training...
episode: 755 no of steps: 137 score: 53.0 avg score: 0.3869 memorylength: 104196 epsilon: 0.5068703691307487
Training...
episode: 756 no of steps: 114 score: 72.0 avg score: 0.6316 memorylength: 104310 epsilon: 0.5064143910284555
Training...
episode: 757 no of steps: 127 score: -56.0 avg score: -0.4409 memorylength: 104437 epsilon: 0.5059588231218387
Training...
episode: 758 no of steps: 139 score: -147.0 avg score: -1.0576 memorylength: 104576 epsilon: 0.5055036650418883
Training...
episode: 759 no of steps: 141 score: 251.0 avg score: 1.7801 memorylength: 104717 epsilon: 0.505048916419926
Training...
episode: 760 no of steps: 145 score: 216.0 avg score: 1.4897 memorylength: 104862 epsilon: 0.5045945768876055
Training...
episode: 761 no of steps: 142 score: 183.0 avg score: 1.2887 memorylength: 105004 epsilon: 0.5041406460769119
Training...
episode: 762 no of steps: 133 score: 81.0 avg score: 0.609 memorylength: 105137 epsilon: 0.5036871236201609
Training...
episode: 763 no of steps: 137 score: -7.0 avg score: -0.0511 memorylength: 105274 epsilon: 0.5032340091499995
Training...
episode: 764 no of steps: 129 score: -198.0 avg score: -1.5349 memorylength: 105403 epsilon: 0.5027813022994051
Training...
episode: 765 no of steps: 152 score: -54.0 avg score: -0.3553 memorylength: 105555 epsilon: 0.5023290027016847
Training...
episode: 766 no of steps: 130 score: 210.0 avg score: 1.6154 memorylength: 105685 epsilon: 0.5018771099904761
Training...
episode: 767 no of steps: 141 score: 200.0 avg score: 1.4184 memorylength: 105826 epsilon: 0.5014256237997458
Training...
episode: 768 no of steps: 127 score: 92.0 avg score: 0.7244 memorylength: 105953 epsilon: 0.50097454376379
Training...
episode: 769 no of steps: 125 score: 416.0 avg score: 3.328 memorylength: 106078 epsilon: 0.5005238695172342
Training...
episode: 770 no of steps: 132 score: 137.0 avg score: 1.0379 memorylength: 106210 epsilon: 0.5000736006950318
Training...
episode: 771 no of steps: 135 score: 124.0 avg score: 0.9185 memorylength: 106345 epsilon: 0.4996237369324651
Training...
episode: 772 no of steps: 126 score: -218.0 avg score: -1.7302 memorylength: 106471 epsilon: 0.4991742778651447
Training...
episode: 773 no of steps: 135 score: -8.0 avg score: -0.0593 memorylength: 106606 epsilon: 0.49872522312900847
Training...
episode: 774 no of steps: 134 score: -38.0 avg score: -0.2836 memorylength: 106740 epsilon: 0.4982765723603222
Training...
episode: 775 no of steps: 137 score: 384.0 avg score: 2.8029 memorylength: 106877 epsilon: 0.4978283251956787
Training...
episode: 776 no of steps: 131 score: 328.0 avg score: 2.5038 memorylength: 107008 epsilon: 0.4973804812719977
Training...
episode: 777 no of steps: 154 score: 466.0 avg score: 3.026 memorylength: 107162 epsilon: 0.4969330402265256
Training...
episode: 778 no of steps: 144 score: 35.0 avg score: 0.2431 memorylength: 107306 epsilon: 0.49648600169683527
Training...
episode: 779 no of steps: 128 score: 13.0 avg score: 0.1016 memorylength: 107434 epsilon: 0.49603936532082527
Training...
episode: 780 no of steps: 130 score: 303.0 avg score: 2.3308 memorylength: 107564 epsilon: 0.4955931307367202
Training...
episode: 781 no of steps: 142 score: -86.0 avg score: -0.6056 memorylength: 107706 epsilon: 0.49514729758307
Training...
episode: 782 no of steps: 140 score: 120.0 avg score: 0.8571 memorylength: 107846 epsilon: 0.4947018654987499
Training...
episode: 783 no of steps: 124 score: -22.0 avg score: -0.1774 memorylength: 107970 epsilon: 0.49425683412295973
Training...
episode: 784 no of steps: 139 score: 10.0 avg score: 0.0719 memorylength: 108109 epsilon: 0.4938122030952241
Training...
episode: 785 no of steps: 138 score: 207.0 avg score: 1.5 memorylength: 108247 epsilon: 0.49336797205539196
Training...
episode: 786 no of steps: 136 score: 459.0 avg score: 3.375 memorylength: 108383 epsilon: 0.49292414064363593
Training...
episode: 787 no of steps: 124 score: -54.0 avg score: -0.4355 memorylength: 108507 epsilon: 0.49248070850045284
Training...
episode: 788 no of steps: 129 score: -9.0 avg score: -0.0698 memorylength: 108636 epsilon: 0.4920376752666624
Training...
episode: 789 no of steps: 134 score: 324.0 avg score: 2.4179 memorylength: 108770 epsilon: 0.4915950405834077
Training...
episode: 790 no of steps: 127 score: -135.0 avg score: -1.063 memorylength: 108897 epsilon: 0.49115280409215467
Training...
episode: 791 no of steps: 131 score: -185.0 avg score: -1.4122 memorylength: 109028 epsilon: 0.49071096543469167
Training...
episode: 792 no of steps: 149 score: 129.0 avg score: 0.8658 memorylength: 109177 epsilon: 0.4902695242531294
Training...
episode: 793 no of steps: 124 score: 350.0 avg score: 2.8226 memorylength: 109301 epsilon: 0.48982848018990055
Training...
episode: 794 no of steps: 129 score: 101.0 avg score: 0.7829 memorylength: 109430 epsilon: 0.4893878328877593
Training...
episode: 795 no of steps: 118 score: -129.0 avg score: -1.0932 memorylength: 109548 epsilon: 0.48894758198978133
Training...
episode: 796 no of steps: 132 score: 184.0 avg score: 1.3939 memorylength: 109680 epsilon: 0.48850772713936347
Training...
episode: 797 no of steps: 122 score: 95.0 avg score: 0.7787 memorylength: 109802 epsilon: 0.4880682679802231
Training...
episode: 798 no of steps: 125 score: 135.0 avg score: 1.08 memorylength: 109927 epsilon: 0.48762920415639843
Training...
episode: 799 no of steps: 119 score: -14.0 avg score: -0.1176 memorylength: 110046 epsilon: 0.4871905353122477
Training...
episode: 800 no of steps: 139 score: 72.0 avg score: 0.518 memorylength: 110185 epsilon: 0.48675226109244907
saving states...
Training...
episode: 801 no of steps: 142 score: -136.0 avg score: -0.9577 memorylength: 110327 epsilon: 0.4863143811420005
Training...
episode: 802 no of steps: 144 score: 348.0 avg score: 2.4167 memorylength: 110471 epsilon: 0.48587689510621906
Training...
episode: 803 no of steps: 124 score: -124.0 avg score: -1.0 memorylength: 110595 epsilon: 0.48543980263074116
Training...
episode: 804 no of steps: 132 score: -3.0 avg score: -0.0227 memorylength: 110727 epsilon: 0.48500310336152186
Training...
episode: 805 no of steps: 135 score: -106.0 avg score: -0.7852 memorylength: 110862 epsilon: 0.4845667969448347
Training...
episode: 806 no of steps: 142 score: -315.0 avg score: -2.2183 memorylength: 111004 epsilon: 0.4841308830272715
Training...
episode: 807 no of steps: 151 score: 234.0 avg score: 1.5497 memorylength: 111155 epsilon: 0.4836953612557418
Training...
episode: 808 no of steps: 142 score: 125.0 avg score: 0.8803 memorylength: 111297 epsilon: 0.48326023127747314
Training...
episode: 809 no of steps: 139 score: 126.0 avg score: 0.9065 memorylength: 111436 epsilon: 0.4828254927400101
Training...
episode: 810 no of steps: 144 score: 13.0 avg score: 0.0903 memorylength: 111580 epsilon: 0.48239114529121446
Training...
episode: 811 no of steps: 145 score: 496.0 avg score: 3.4207 memorylength: 111725 epsilon: 0.48195718857926484
Training...
episode: 812 no of steps: 150 score: 21.0 avg score: 0.14 memorylength: 111875 epsilon: 0.4815236222526562
Training...
episode: 813 no of steps: 131 score: 187.0 avg score: 1.4275 memorylength: 112006 epsilon: 0.4810904459601998
Training...
episode: 814 no of steps: 126 score: -7.0 avg score: -0.0556 memorylength: 112132 epsilon: 0.48065765935102284
Training...
episode: 815 no of steps: 139 score: 27.0 avg score: 0.1942 memorylength: 112271 epsilon: 0.4802252620745682
Training...
episode: 816 no of steps: 136 score: 140.0 avg score: 1.0294 memorylength: 112407 epsilon: 0.47979325378059395
Training...
episode: 817 no of steps: 129 score: -72.0 avg score: -0.5581 memorylength: 112536 epsilon: 0.4793616341191733
Training...
episode: 818 no of steps: 132 score: 138.0 avg score: 1.0455 memorylength: 112668 epsilon: 0.47893040274069454
Training...
episode: 819 no of steps: 144 score: 38.0 avg score: 0.2639 memorylength: 112812 epsilon: 0.47849955929586
Training...
episode: 820 no of steps: 137 score: 156.0 avg score: 1.1387 memorylength: 112949 epsilon: 0.4780691034356866
Training...
episode: 821 no of steps: 136 score: -91.0 avg score: -0.6691 memorylength: 113085 epsilon: 0.47763903481150494
Training...
episode: 822 no of steps: 144 score: 36.0 avg score: 0.25 memorylength: 113229 epsilon: 0.4772093530749596
Training...
episode: 823 no of steps: 144 score: 182.0 avg score: 1.2639 memorylength: 113373 epsilon: 0.47678005787800815
Training...
episode: 824 no of steps: 135 score: 371.0 avg score: 2.7481 memorylength: 113508 epsilon: 0.4763511488729216
Training...
episode: 825 no of steps: 139 score: 26.0 avg score: 0.1871 memorylength: 113647 epsilon: 0.4759226257122836
Training...
episode: 826 no of steps: 146 score: -235.0 avg score: -1.6096 memorylength: 113793 epsilon: 0.47549448804899036
Training...
episode: 827 no of steps: 136 score: -101.0 avg score: -0.7426 memorylength: 113929 epsilon: 0.4750667355362503
Training...
episode: 828 no of steps: 127 score: -388.0 avg score: -3.0551 memorylength: 114056 epsilon: 0.4746393678275838
Training...
episode: 829 no of steps: 139 score: 168.0 avg score: 1.2086 memorylength: 114195 epsilon: 0.47421238457682324
Training...
episode: 830 no of steps: 118 score: -210.0 avg score: -1.7797 memorylength: 114313 epsilon: 0.47378578543811195
Training...
episode: 831 no of steps: 128 score: -57.0 avg score: -0.4453 memorylength: 114441 epsilon: 0.4733595700659047
Training...
episode: 832 no of steps: 116 score: 90.0 avg score: 0.7759 memorylength: 114557 epsilon: 0.4729337381149669
Training...
episode: 833 no of steps: 137 score: -23.0 avg score: -0.1679 memorylength: 114694 epsilon: 0.4725082892403748
Training...
episode: 834 no of steps: 135 score: 503.0 avg score: 3.7259 memorylength: 114829 epsilon: 0.47208322309751477
Training...
episode: 835 no of steps: 122 score: 274.0 avg score: 2.2459 memorylength: 114951 epsilon: 0.4716585393420831
Training...
episode: 836 no of steps: 125 score: -77.0 avg score: -0.616 memorylength: 115076 epsilon: 0.471234237630086
Training...
episode: 837 no of steps: 137 score: 30.0 avg score: 0.219 memorylength: 115213 epsilon: 0.47081031761783904
Training...
episode: 838 no of steps: 121 score: 163.0 avg score: 1.3471 memorylength: 115334 epsilon: 0.47038677896196696
Training...
episode: 839 no of steps: 142 score: 592.0 avg score: 4.169 memorylength: 115476 epsilon: 0.46996362131940345
Training...
episode: 840 no of steps: 146 score: 282.0 avg score: 1.9315 memorylength: 115622 epsilon: 0.46954084434739085
Training...
episode: 841 no of steps: 142 score: 429.0 avg score: 3.0211 memorylength: 115764 epsilon: 0.4691184477034797
Training...
episode: 842 no of steps: 136 score: 81.0 avg score: 0.5956 memorylength: 115900 epsilon: 0.4686964310455288
Training...
episode: 843 no of steps: 142 score: 108.0 avg score: 0.7606 memorylength: 116042 epsilon: 0.4682747940317046
Training...
episode: 844 no of steps: 132 score: 156.0 avg score: 1.1818 memorylength: 116174 epsilon: 0.467853536320481
Training...
episode: 845 no of steps: 151 score: 206.0 avg score: 1.3642 memorylength: 116325 epsilon: 0.4674326575706393
Training...
episode: 846 no of steps: 143 score: 169.0 avg score: 1.1818 memorylength: 116468 epsilon: 0.4670121574412677
Training...
episode: 847 no of steps: 127 score: 210.0 avg score: 1.6535 memorylength: 116595 epsilon: 0.46659203559176105
Training...
episode: 848 no of steps: 140 score: 200.0 avg score: 1.4286 memorylength: 116735 epsilon: 0.4661722916818206
Training...
episode: 849 no of steps: 146 score: 85.0 avg score: 0.5822 memorylength: 116881 epsilon: 0.46575292537145385
Training...
episode: 850 no of steps: 139 score: 238.0 avg score: 1.7122 memorylength: 117020 epsilon: 0.4653339363209741
saving states...
Training...
episode: 851 no of steps: 138 score: 93.0 avg score: 0.6739 memorylength: 117158 epsilon: 0.46491532419099996
Training...
episode: 852 no of steps: 153 score: 75.0 avg score: 0.4902 memorylength: 117311 epsilon: 0.46449708864245587
Training...
episode: 853 no of steps: 141 score: 153.0 avg score: 1.0851 memorylength: 117452 epsilon: 0.4640792293365708
Training...
episode: 854 no of steps: 140 score: 369.0 avg score: 2.6357 memorylength: 117592 epsilon: 0.4636617459348788
Training...
episode: 855 no of steps: 125 score: -93.0 avg score: -0.744 memorylength: 117717 epsilon: 0.4632446380992182
Training...
episode: 856 no of steps: 124 score: 93.0 avg score: 0.75 memorylength: 117841 epsilon: 0.4628279054917317
Training...
episode: 857 no of steps: 120 score: 207.0 avg score: 1.725 memorylength: 117961 epsilon: 0.4624115477748659
Training...
episode: 858 no of steps: 124 score: -44.0 avg score: -0.3548 memorylength: 118085 epsilon: 0.4619955646113709
Training...
episode: 859 no of steps: 140 score: 418.0 avg score: 2.9857 memorylength: 118225 epsilon: 0.4615799556643005
Training...
episode: 860 no of steps: 139 score: -137.0 avg score: -0.9856 memorylength: 118364 epsilon: 0.46116472059701125
Training...
episode: 861 no of steps: 155 score: 126.0 avg score: 0.8129 memorylength: 118519 epsilon: 0.46074985907316285
Training...
episode: 862 no of steps: 143 score: 46.0 avg score: 0.3217 memorylength: 118662 epsilon: 0.4603353707567174
Training...
episode: 863 no of steps: 133 score: 135.0 avg score: 1.015 memorylength: 118795 epsilon: 0.4599212553119393
Training...
episode: 864 no of steps: 121 score: 98.0 avg score: 0.8099 memorylength: 118916 epsilon: 0.459507512403395
Training...
episode: 865 no of steps: 157 score: 720.0 avg score: 4.586 memorylength: 119073 epsilon: 0.4590941416959528
Training...
episode: 866 no of steps: 115 score: 228.0 avg score: 1.9826 memorylength: 119188 epsilon: 0.45868114285478245
Training...
episode: 867 no of steps: 134 score: -349.0 avg score: -2.6045 memorylength: 119322 epsilon: 0.4582685155453547
Training...
episode: 868 no of steps: 139 score: 18.0 avg score: 0.1295 memorylength: 119461 epsilon: 0.4578562594334415
Training...
episode: 869 no of steps: 154 score: 60.0 avg score: 0.3896 memorylength: 119615 epsilon: 0.4574443741851154
Training...
episode: 870 no of steps: 140 score: 572.0 avg score: 4.0857 memorylength: 119755 epsilon: 0.4570328594667493
Training...
episode: 871 no of steps: 129 score: 336.0 avg score: 2.6047 memorylength: 119884 epsilon: 0.4566217149450163
Training...
episode: 872 no of steps: 139 score: 270.0 avg score: 1.9424 memorylength: 120023 epsilon: 0.45621094028688924
Training...
episode: 873 no of steps: 127 score: 333.0 avg score: 2.622 memorylength: 120150 epsilon: 0.45580053515964064
Training...
episode: 874 no of steps: 114 score: 184.0 avg score: 1.614 memorylength: 120264 epsilon: 0.45539049923084235
Training...
episode: 875 no of steps: 136 score: 344.0 avg score: 2.5294 memorylength: 120400 epsilon: 0.4549808321683652
Training...
episode: 876 no of steps: 149 score: 453.0 avg score: 3.0403 memorylength: 120549 epsilon: 0.45457153364037894
Training...
episode: 877 no of steps: 144 score: 154.0 avg score: 1.0694 memorylength: 120693 epsilon: 0.45416260331535163
Training...
episode: 878 no of steps: 135 score: 405.0 avg score: 3.0 memorylength: 120828 epsilon: 0.45375404086204973
Training...
episode: 879 no of steps: 139 score: 133.0 avg score: 0.9568 memorylength: 120967 epsilon: 0.4533458459495377
Training...
episode: 880 no of steps: 134 score: 102.0 avg score: 0.7612 memorylength: 121101 epsilon: 0.4529380182471776
Training...
episode: 881 no of steps: 132 score: 135.0 avg score: 1.0227 memorylength: 121233 epsilon: 0.4525305574246289
Training...
episode: 882 no of steps: 122 score: -45.0 avg score: -0.3689 memorylength: 121355 epsilon: 0.4521234631518483
Training...
episode: 883 no of steps: 128 score: -167.0 avg score: -1.3047 memorylength: 121483 epsilon: 0.45171673509908955
Training...
episode: 884 no of steps: 129 score: 21.0 avg score: 0.1628 memorylength: 121612 epsilon: 0.45131037293690274
Training...
episode: 885 no of steps: 123 score: 125.0 avg score: 1.0163 memorylength: 121735 epsilon: 0.45090437633613467
Training...
episode: 886 no of steps: 154 score: 206.0 avg score: 1.3377 memorylength: 121889 epsilon: 0.45049874496792797
Training...
episode: 887 no of steps: 144 score: -57.0 avg score: -0.3958 memorylength: 122033 epsilon: 0.4500934785037212
Training...
episode: 888 no of steps: 136 score: 798.0 avg score: 5.8676 memorylength: 122169 epsilon: 0.4496885766152485
Training...
episode: 889 no of steps: 138 score: 207.0 avg score: 1.5 memorylength: 122307 epsilon: 0.4492840389745394
Training...
episode: 890 no of steps: 139 score: 246.0 avg score: 1.7698 memorylength: 122446 epsilon: 0.4488798652539184
Training...
episode: 891 no of steps: 156 score: 477.0 avg score: 3.0577 memorylength: 122602 epsilon: 0.44847605512600464
Training...
episode: 892 no of steps: 118 score: 480.0 avg score: 4.0678 memorylength: 122720 epsilon: 0.44807260826371187
Training...
episode: 893 no of steps: 144 score: 234.0 avg score: 1.625 memorylength: 122864 epsilon: 0.44766952434024826
Training...
episode: 894 no of steps: 130 score: 108.0 avg score: 0.8308 memorylength: 122994 epsilon: 0.4472668030291157
Training...
episode: 895 no of steps: 152 score: 117.0 avg score: 0.7697 memorylength: 123146 epsilon: 0.44686444400411
Training...
episode: 896 no of steps: 133 score: 288.0 avg score: 2.1654 memorylength: 123279 epsilon: 0.44646244693932025
Training...
episode: 897 no of steps: 129 score: -46.0 avg score: -0.3566 memorylength: 123408 epsilon: 0.44606081150912885
Training...
episode: 898 no of steps: 120 score: -36.0 avg score: -0.3 memorylength: 123528 epsilon: 0.44565953738821107
Training...
episode: 899 no of steps: 136 score: 374.0 avg score: 2.75 memorylength: 123664 epsilon: 0.44525862425153484
Training...
episode: 900 no of steps: 123 score: -80.0 avg score: -0.6504 memorylength: 123787 epsilon: 0.4448580717743605
saving states...
Training...
episode: 901 no of steps: 141 score: 129.0 avg score: 0.9149 memorylength: 123928 epsilon: 0.4444578796322405
Training...
episode: 902 no of steps: 135 score: 256.0 avg score: 1.8963 memorylength: 124063 epsilon: 0.4440580475010191
Training...
episode: 903 no of steps: 128 score: 36.0 avg score: 0.2812 memorylength: 124191 epsilon: 0.44365857505683254
Training...
episode: 904 no of steps: 131 score: 97.0 avg score: 0.7405 memorylength: 124322 epsilon: 0.4432594619761078
Training...
episode: 905 no of steps: 131 score: 137.0 avg score: 1.0458 memorylength: 124453 epsilon: 0.4428607079355635
Training...
episode: 906 no of steps: 138 score: 103.0 avg score: 0.7464 memorylength: 124591 epsilon: 0.44246231261220864
Training...
episode: 907 no of steps: 140 score: 300.0 avg score: 2.1429 memorylength: 124731 epsilon: 0.4420642756833431
Training...
episode: 908 no of steps: 138 score: 344.0 avg score: 2.4928 memorylength: 124869 epsilon: 0.44166659682655707
Training...
episode: 909 no of steps: 121 score: 294.0 avg score: 2.4298 memorylength: 124990 epsilon: 0.4412692757197304
Training...
episode: 910 no of steps: 125 score: 143.0 avg score: 1.144 memorylength: 125115 epsilon: 0.44087231204103305
Training...
episode: 911 no of steps: 138 score: 409.0 avg score: 2.9638 memorylength: 125253 epsilon: 0.44047570546892456
Training...
episode: 912 no of steps: 133 score: 503.0 avg score: 3.782 memorylength: 125386 epsilon: 0.4400794556821534
Training...
episode: 913 no of steps: 136 score: 450.0 avg score: 3.3088 memorylength: 125522 epsilon: 0.43968356235975736
Training...
episode: 914 no of steps: 135 score: 228.0 avg score: 1.6889 memorylength: 125657 epsilon: 0.4392880251810627
Training...
episode: 915 no of steps: 130 score: 331.0 avg score: 2.5462 memorylength: 125787 epsilon: 0.43889284382568444
Training...
episode: 916 no of steps: 125 score: -33.0 avg score: -0.264 memorylength: 125912 epsilon: 0.4384980179735255
Training...
episode: 917 no of steps: 125 score: 99.0 avg score: 0.792 memorylength: 126037 epsilon: 0.43810354730477713
Training...
episode: 918 no of steps: 122 score: 256.0 avg score: 2.0984 memorylength: 126159 epsilon: 0.43770943149991776
Training...
episode: 919 no of steps: 131 score: 65.0 avg score: 0.4962 memorylength: 126290 epsilon: 0.43731567023971385
Training...
episode: 920 no of steps: 145 score: 116.0 avg score: 0.8 memorylength: 126435 epsilon: 0.4369222632052186
Training...
episode: 921 no of steps: 137 score: -224.0 avg score: -1.635 memorylength: 126572 epsilon: 0.4365292100777723
Training...
episode: 922 no of steps: 129 score: 63.0 avg score: 0.4884 memorylength: 126701 epsilon: 0.436136510539002
Training...
episode: 923 no of steps: 140 score: 179.0 avg score: 1.2786 memorylength: 126841 epsilon: 0.4357441642708209
Training...
episode: 924 no of steps: 150 score: 503.0 avg score: 3.3533 memorylength: 126991 epsilon: 0.43535217095542866
Training...
episode: 925 no of steps: 133 score: 175.0 avg score: 1.3158 memorylength: 127124 epsilon: 0.43496053027531056
Training...
episode: 926 no of steps: 136 score: 157.0 avg score: 1.1544 memorylength: 127260 epsilon: 0.4345692419132377
Training...
episode: 927 no of steps: 167 score: 589.0 avg score: 3.5269 memorylength: 127427 epsilon: 0.43417830555226644
Training...
episode: 928 no of steps: 131 score: -5.0 avg score: -0.0382 memorylength: 127558 epsilon: 0.4337877208757383
Training...
episode: 929 no of steps: 137 score: 290.0 avg score: 2.1168 memorylength: 127695 epsilon: 0.4333974875672797
Training...
episode: 930 no of steps: 129 score: -212.0 avg score: -1.6434 memorylength: 127824 epsilon: 0.4330076053108016
Training...
episode: 931 no of steps: 158 score: 403.0 avg score: 2.5506 memorylength: 127982 epsilon: 0.4326180737904994
Training...
episode: 932 no of steps: 132 score: 62.0 avg score: 0.4697 memorylength: 128114 epsilon: 0.43222889269085246
Training...
episode: 933 no of steps: 132 score: 690.0 avg score: 5.2273 memorylength: 128246 epsilon: 0.4318400616966242
Training...
episode: 934 no of steps: 143 score: 183.0 avg score: 1.2797 memorylength: 128389 epsilon: 0.4314515804928615
Training...
episode: 935 no of steps: 144 score: -106.0 avg score: -0.7361 memorylength: 128533 epsilon: 0.43106344876489433
Training...
episode: 936 no of steps: 125 score: 0.0 avg score: 0.0 memorylength: 128658 epsilon: 0.43067566619833625
Training...
episode: 937 no of steps: 128 score: 405.0 avg score: 3.1641 memorylength: 128786 epsilon: 0.4302882324790832
Training...
episode: 938 no of steps: 135 score: 319.0 avg score: 2.363 memorylength: 128921 epsilon: 0.42990114729331386
Training...
episode: 939 no of steps: 140 score: 345.0 avg score: 2.4643 memorylength: 129061 epsilon: 0.4295144103274892
Training...
episode: 940 no of steps: 148 score: 243.0 avg score: 1.6419 memorylength: 129209 epsilon: 0.42912802126835237
Training...
episode: 941 no of steps: 135 score: 332.0 avg score: 2.4593 memorylength: 129344 epsilon: 0.42874197980292805
Training...
episode: 942 no of steps: 131 score: 170.0 avg score: 1.2977 memorylength: 129475 epsilon: 0.42835628561852274
Training...
episode: 943 no of steps: 144 score: 295.0 avg score: 2.0486 memorylength: 129619 epsilon: 0.4279709384027241
Training...
episode: 944 no of steps: 123 score: 172.0 avg score: 1.3984 memorylength: 129742 epsilon: 0.42758593784340093
Training...
episode: 945 no of steps: 143 score: 367.0 avg score: 2.5664 memorylength: 129885 epsilon: 0.4272012836287027
Training...
episode: 946 no of steps: 125 score: 255.0 avg score: 2.04 memorylength: 130010 epsilon: 0.4268169754470594
Training...
episode: 947 no of steps: 136 score: 206.0 avg score: 1.5147 memorylength: 130146 epsilon: 0.4264330129871814
Training...
episode: 948 no of steps: 146 score: -152.0 avg score: -1.0411 memorylength: 130292 epsilon: 0.42604939593805924
Training...
episode: 949 no of steps: 130 score: 124.0 avg score: 0.9538 memorylength: 130422 epsilon: 0.4256661239889629
Training...
episode: 950 no of steps: 142 score: 148.0 avg score: 1.0423 memorylength: 130564 epsilon: 0.4252831968294422
saving states...
Training...
episode: 951 no of steps: 137 score: 332.0 avg score: 2.4234 memorylength: 130701 epsilon: 0.42490061414932606
Training...
episode: 952 no of steps: 134 score: 155.0 avg score: 1.1567 memorylength: 130835 epsilon: 0.4245183756387226
Training...
episode: 953 no of steps: 147 score: 3.0 avg score: 0.0204 memorylength: 130982 epsilon: 0.4241364809880184
Training...
episode: 954 no of steps: 137 score: 25.0 avg score: 0.1825 memorylength: 131072 epsilon: 0.42375492988787894
Training...
episode: 955 no of steps: 138 score: -64.0 avg score: -0.4638 memorylength: 131072 epsilon: 0.4233737220292478
Training...
episode: 956 no of steps: 139 score: 306.0 avg score: 2.2014 memorylength: 131072 epsilon: 0.4229928571033465
Training...
episode: 957 no of steps: 144 score: 287.0 avg score: 1.9931 memorylength: 131072 epsilon: 0.42261233480167454
Training...
episode: 958 no of steps: 136 score: 341.0 avg score: 2.5074 memorylength: 131072 epsilon: 0.42223215481600873
Training...
episode: 959 no of steps: 136 score: 279.0 avg score: 2.0515 memorylength: 131072 epsilon: 0.42185231683840324
Training...
episode: 960 no of steps: 138 score: 193.0 avg score: 1.3986 memorylength: 131072 epsilon: 0.42147282056118945
Training...
episode: 961 no of steps: 139 score: 198.0 avg score: 1.4245 memorylength: 131072 epsilon: 0.4210936656769752
Training...
episode: 962 no of steps: 137 score: 200.0 avg score: 1.4599 memorylength: 131072 epsilon: 0.4207148518786451
Training...
episode: 963 no of steps: 123 score: -3.0 avg score: -0.0244 memorylength: 131072 epsilon: 0.4203363788593599
Training...
episode: 964 no of steps: 138 score: 27.0 avg score: 0.1957 memorylength: 131072 epsilon: 0.41995824631255657
Training...
episode: 965 no of steps: 146 score: -107.0 avg score: -0.7329 memorylength: 131072 epsilon: 0.41958045393194754
Training...
episode: 966 no of steps: 133 score: -71.0 avg score: -0.5338 memorylength: 131072 epsilon: 0.41920300141152095
Training...
episode: 967 no of steps: 133 score: 88.0 avg score: 0.6617 memorylength: 131072 epsilon: 0.4188258884455404
Training...
episode: 968 no of steps: 133 score: 226.0 avg score: 1.6992 memorylength: 131072 epsilon: 0.41844911472854435
Training...
episode: 969 no of steps: 136 score: 115.0 avg score: 0.8456 memorylength: 131072 epsilon: 0.4180726799553459
Training...
episode: 970 no of steps: 133 score: -306.0 avg score: -2.3008 memorylength: 131072 epsilon: 0.41769658382103303
Training...
episode: 971 no of steps: 130 score: 249.0 avg score: 1.9154 memorylength: 131072 epsilon: 0.41732082602096776
Training...
episode: 972 no of steps: 139 score: 349.0 avg score: 2.5108 memorylength: 131072 epsilon: 0.4169454062507863
Training...
episode: 973 no of steps: 142 score: 523.0 avg score: 3.6831 memorylength: 131072 epsilon: 0.4165703242063986
Training...
episode: 974 no of steps: 141 score: 333.0 avg score: 2.3617 memorylength: 131072 epsilon: 0.41619557958398823
Training...
episode: 975 no of steps: 141 score: 192.0 avg score: 1.3617 memorylength: 131072 epsilon: 0.41582117208001196
Training...
episode: 976 no of steps: 138 score: 430.0 avg score: 3.1159 memorylength: 131072 epsilon: 0.4154471013911996
Training...
episode: 977 no of steps: 137 score: 358.0 avg score: 2.6131 memorylength: 131072 epsilon: 0.4150733672145541
Training...
episode: 978 no of steps: 134 score: 284.0 avg score: 2.1194 memorylength: 131072 epsilon: 0.41469996924735064
Training...
episode: 979 no of steps: 120 score: -94.0 avg score: -0.7833 memorylength: 131072 epsilon: 0.4143269071871368
Training...
episode: 980 no of steps: 140 score: -132.0 avg score: -0.9429 memorylength: 131072 epsilon: 0.41395418073173235
Training...
episode: 981 no of steps: 132 score: 81.0 avg score: 0.6136 memorylength: 131072 epsilon: 0.4135817895792288
Training...
episode: 982 no of steps: 139 score: 80.0 avg score: 0.5755 memorylength: 131072 epsilon: 0.41320973342798933
Training...
episode: 983 no of steps: 138 score: 82.0 avg score: 0.5942 memorylength: 131072 epsilon: 0.4128380119766485
Training...
episode: 984 no of steps: 131 score: 161.0 avg score: 1.229 memorylength: 131072 epsilon: 0.41246662492411174
Training...
episode: 985 no of steps: 156 score: 285.0 avg score: 1.8269 memorylength: 131072 epsilon: 0.41209557196955565
Training...
episode: 986 no of steps: 129 score: 273.0 avg score: 2.1163 memorylength: 131072 epsilon: 0.4117248528124273
Training...
episode: 987 no of steps: 145 score: 36.0 avg score: 0.2483 memorylength: 131072 epsilon: 0.41135446715244417
Training...
episode: 988 no of steps: 154 score: 244.0 avg score: 1.5844 memorylength: 131072 epsilon: 0.41098441468959374
Training...
episode: 989 no of steps: 133 score: 490.0 avg score: 3.6842 memorylength: 131072 epsilon: 0.4106146951241336
Training...
episode: 990 no of steps: 136 score: 424.0 avg score: 3.1176 memorylength: 131072 epsilon: 0.41024530815659094
Training...
episode: 991 no of steps: 149 score: 553.0 avg score: 3.7114 memorylength: 131072 epsilon: 0.4098762534877622
Training...
episode: 992 no of steps: 195 score: 136.0 avg score: 0.6974 memorylength: 131072 epsilon: 0.40950753081871305
Training...
episode: 993 no of steps: 200 score: 216.0 avg score: 1.08 memorylength: 131072 epsilon: 0.4091391398507782
Training...
episode: 994 no of steps: 165 score: -124.0 avg score: -0.7515 memorylength: 131072 epsilon: 0.40877108028556086
Training...
episode: 995 no of steps: 142 score: -108.0 avg score: -0.7606 memorylength: 131072 epsilon: 0.40840335182493276
Training...
episode: 996 no of steps: 125 score: 117.0 avg score: 0.936 memorylength: 131072 epsilon: 0.40803595417103394
Training...
episode: 997 no of steps: 125 score: 175.0 avg score: 1.4 memorylength: 131072 epsilon: 0.4076688870262722
Training...
episode: 998 no of steps: 115 score: 52.0 avg score: 0.4522 memorylength: 131072 epsilon: 0.4073021500933231
Training...
episode: 999 no of steps: 115 score: -24.0 avg score: -0.2087 memorylength: 131072 epsilon: 0.40693574307512975
Training...
episode: 1000 no of steps: 126 score: 138.0 avg score: 1.0952 memorylength: 131072 epsilon: 0.4065696656749025
saving states...
Training...
episode: 1001 no of steps: 132 score: -45.0 avg score: -0.3409 memorylength: 131072 epsilon: 0.40620391759611857
Training...
episode: 1002 no of steps: 164 score: 422.0 avg score: 2.5732 memorylength: 131072 epsilon: 0.4058384985425219
Training...
episode: 1003 no of steps: 136 score: 616.0 avg score: 4.5294 memorylength: 131072 epsilon: 0.4054734082181232
Training...
episode: 1004 no of steps: 134 score: 570.0 avg score: 4.2537 memorylength: 131072 epsilon: 0.4051086463271993
Training...
episode: 1005 no of steps: 142 score: 285.0 avg score: 2.007 memorylength: 131072 epsilon: 0.4047442125742929
Training...
episode: 1006 no of steps: 144 score: 400.0 avg score: 2.7778 memorylength: 131072 epsilon: 0.4043801066642127
Training...
episode: 1007 no of steps: 121 score: 168.0 avg score: 1.3884 memorylength: 131072 epsilon: 0.4040163283020329
Training...
episode: 1008 no of steps: 125 score: 371.0 avg score: 2.968 memorylength: 131072 epsilon: 0.40365287719309306
Training...
episode: 1009 no of steps: 127 score: 413.0 avg score: 3.252 memorylength: 131072 epsilon: 0.4032897530429977
Training...
episode: 1010 no of steps: 146 score: 638.0 avg score: 4.3699 memorylength: 131072 epsilon: 0.4029269555576162
Training...
episode: 1011 no of steps: 148 score: 424.0 avg score: 2.8649 memorylength: 131072 epsilon: 0.40256448444308274
Training...
episode: 1012 no of steps: 145 score: 601.0 avg score: 4.1448 memorylength: 131072 epsilon: 0.40220233940579553
Training...
episode: 1013 no of steps: 133 score: 389.0 avg score: 2.9248 memorylength: 131072 epsilon: 0.40184052015241717
Training...
episode: 1014 no of steps: 147 score: 86.0 avg score: 0.585 memorylength: 131072 epsilon: 0.4014790263898739
Training...
episode: 1015 no of steps: 150 score: 45.0 avg score: 0.3 memorylength: 131072 epsilon: 0.401117857825356
Training...
episode: 1016 no of steps: 144 score: 283.0 avg score: 1.9653 memorylength: 131072 epsilon: 0.40075701416631665
Training...
episode: 1017 no of steps: 143 score: 350.0 avg score: 2.4476 memorylength: 131072 epsilon: 0.4003964951204726
Training...
episode: 1018 no of steps: 160 score: 288.0 avg score: 1.8 memorylength: 131072 epsilon: 0.4000363003958034
Training...
episode: 1019 no of steps: 148 score: 397.0 avg score: 2.6824 memorylength: 131072 epsilon: 0.39967642970055134
Training...
episode: 1020 no of steps: 148 score: -27.0 avg score: -0.1824 memorylength: 131072 epsilon: 0.3993168827432211
Training...
episode: 1021 no of steps: 135 score: 312.0 avg score: 2.3111 memorylength: 131072 epsilon: 0.3989576592325796
Training...
episode: 1022 no of steps: 140 score: 198.0 avg score: 1.4143 memorylength: 131072 epsilon: 0.3985987588776558
Training...
episode: 1023 no of steps: 122 score: 425.0 avg score: 3.4836 memorylength: 131072 epsilon: 0.39824018138774026
Training...
episode: 1024 no of steps: 127 score: -81.0 avg score: -0.6378 memorylength: 131072 epsilon: 0.39788192647238546
Training...
episode: 1025 no of steps: 128 score: 62.0 avg score: 0.4844 memorylength: 131072 epsilon: 0.3975239938414047
Training...
episode: 1026 no of steps: 137 score: 288.0 avg score: 2.1022 memorylength: 131072 epsilon: 0.3971663832048726
Training...
episode: 1027 no of steps: 137 score: -137.0 avg score: -1.0 memorylength: 131072 epsilon: 0.39680909427312444
Training...
episode: 1028 no of steps: 128 score: 129.0 avg score: 1.0078 memorylength: 131072 epsilon: 0.39645212675675634
Training...
episode: 1029 no of steps: 131 score: -159.0 avg score: -1.2137 memorylength: 131072 epsilon: 0.39609548036662445
Training...
episode: 1030 no of steps: 131 score: -39.0 avg score: -0.2977 memorylength: 131072 epsilon: 0.3957391548138452
Training...
episode: 1031 no of steps: 159 score: -82.0 avg score: -0.5157 memorylength: 131072 epsilon: 0.3953831498097949
Training...
episode: 1032 no of steps: 140 score: 385.0 avg score: 2.75 memorylength: 131072 epsilon: 0.3950274650661095
Training...
episode: 1033 no of steps: 135 score: 300.0 avg score: 2.2222 memorylength: 131072 epsilon: 0.39467210029468425
Training...
episode: 1034 no of steps: 136 score: 592.0 avg score: 4.3529 memorylength: 131072 epsilon: 0.39431705520767374
Training...
episode: 1035 no of steps: 152 score: 121.0 avg score: 0.7961 memorylength: 131072 epsilon: 0.3939623295174914
Training...
episode: 1036 no of steps: 128 score: 301.0 avg score: 2.3516 memorylength: 131072 epsilon: 0.3936079229368094
Training...
episode: 1037 no of steps: 155 score: 382.0 avg score: 2.4645 memorylength: 131072 epsilon: 0.3932538351785584
Training...
episode: 1038 no of steps: 135 score: 382.0 avg score: 2.8296 memorylength: 131072 epsilon: 0.3929000659559273
Training...
episode: 1039 no of steps: 143 score: 207.0 avg score: 1.4476 memorylength: 131072 epsilon: 0.39254661498236304
Training...
episode: 1040 no of steps: 131 score: 254.0 avg score: 1.9389 memorylength: 131072 epsilon: 0.3921934819715702
Training...
episode: 1041 no of steps: 126 score: 126.0 avg score: 1.0 memorylength: 131072 epsilon: 0.3918406666375112
Training...
episode: 1042 no of steps: 129 score: 342.0 avg score: 2.6512 memorylength: 131072 epsilon: 0.39148816869440545
Training...
episode: 1043 no of steps: 143 score: 577.0 avg score: 4.035 memorylength: 131072 epsilon: 0.3911359878567296
Training...
episode: 1044 no of steps: 132 score: 211.0 avg score: 1.5985 memorylength: 131072 epsilon: 0.39078412383921723
Training...
episode: 1045 no of steps: 139 score: -158.0 avg score: -1.1367 memorylength: 131072 epsilon: 0.3904325763568585
Training...
episode: 1046 no of steps: 152 score: 326.0 avg score: 2.1447 memorylength: 131072 epsilon: 0.3900813451248998
Training...
episode: 1047 no of steps: 148 score: 300.0 avg score: 2.027 memorylength: 131072 epsilon: 0.3897304298588439
Training...
episode: 1048 no of steps: 153 score: 634.0 avg score: 4.1438 memorylength: 131072 epsilon: 0.3893798302744494
Training...
episode: 1049 no of steps: 149 score: 278.0 avg score: 1.8658 memorylength: 131072 epsilon: 0.3890295460877306
Training...
episode: 1050 no of steps: 150 score: 558.0 avg score: 3.72 memorylength: 131072 epsilon: 0.3886795770149573
saving states...
Training...
episode: 1051 no of steps: 150 score: 318.0 avg score: 2.12 memorylength: 131072 epsilon: 0.38832992277265455
Training...
episode: 1052 no of steps: 137 score: 45.0 avg score: 0.3285 memorylength: 131072 epsilon: 0.3879805830776023
Training...
episode: 1053 no of steps: 138 score: 247.0 avg score: 1.7899 memorylength: 131072 epsilon: 0.38763155764683555
Training...
episode: 1054 no of steps: 135 score: 720.0 avg score: 5.3333 memorylength: 131072 epsilon: 0.3872828461976435
Training...
episode: 1055 no of steps: 139 score: 394.0 avg score: 2.8345 memorylength: 131072 epsilon: 0.38693444844757
Training...
episode: 1056 no of steps: 139 score: -79.0 avg score: -0.5683 memorylength: 131072 epsilon: 0.3865863641144129
Training...
episode: 1057 no of steps: 128 score: 386.0 avg score: 3.0156 memorylength: 131072 epsilon: 0.38623859291622364
Training...
episode: 1058 no of steps: 140 score: 288.0 avg score: 2.0571 memorylength: 131072 epsilon: 0.3858911345713077
Training...
episode: 1059 no of steps: 138 score: -32.0 avg score: -0.2319 memorylength: 131072 epsilon: 0.3855439887982237
Training...
episode: 1060 no of steps: 130 score: 144.0 avg score: 1.1077 memorylength: 131072 epsilon: 0.3851971553157837
Training...
episode: 1061 no of steps: 144 score: 342.0 avg score: 2.375 memorylength: 131072 epsilon: 0.3848506338430524
Training...
episode: 1062 no of steps: 143 score: 396.0 avg score: 2.7692 memorylength: 131072 epsilon: 0.3845044240993475
Training...
episode: 1063 no of steps: 149 score: 711.0 avg score: 4.7718 memorylength: 131072 epsilon: 0.384158525804239
Training...
episode: 1064 no of steps: 150 score: 576.0 avg score: 3.84 memorylength: 131072 epsilon: 0.3838129386775493
Training...
episode: 1065 no of steps: 151 score: 458.0 avg score: 3.0331 memorylength: 131072 epsilon: 0.3834676624393529
Training...
episode: 1066 no of steps: 151 score: 570.0 avg score: 3.7748 memorylength: 131072 epsilon: 0.38312269680997585
Training...
episode: 1067 no of steps: 169 score: 272.0 avg score: 1.6095 memorylength: 131072 epsilon: 0.3827780415099961
Training...
episode: 1068 no of steps: 141 score: -46.0 avg score: -0.3262 memorylength: 131072 epsilon: 0.3824336962602428
Training...
episode: 1069 no of steps: 128 score: 447.0 avg score: 3.4922 memorylength: 131072 epsilon: 0.3820896607817963
Training...
episode: 1070 no of steps: 145 score: 557.0 avg score: 3.8414 memorylength: 131072 epsilon: 0.3817459347959878
Training...
episode: 1071 no of steps: 142 score: 624.0 avg score: 4.3944 memorylength: 131072 epsilon: 0.38140251802439923
Training...
episode: 1072 no of steps: 140 score: 325.0 avg score: 2.3214 memorylength: 131072 epsilon: 0.381059410188863
Training...
episode: 1073 no of steps: 128 score: 81.0 avg score: 0.6328 memorylength: 131072 epsilon: 0.3807166110114618
Training...
episode: 1074 no of steps: 139 score: 169.0 avg score: 1.2158 memorylength: 131072 epsilon: 0.38037412021452827
Training...
episode: 1075 no of steps: 142 score: -143.0 avg score: -1.007 memorylength: 131072 epsilon: 0.38003193752064474
Training...
episode: 1076 no of steps: 134 score: 153.0 avg score: 1.1418 memorylength: 131072 epsilon: 0.3796900626526434
Training...
episode: 1077 no of steps: 153 score: 189.0 avg score: 1.2353 memorylength: 131072 epsilon: 0.3793484953336053
Training...
episode: 1078 no of steps: 147 score: 6.0 avg score: 0.0408 memorylength: 131072 epsilon: 0.3790072352868612
Training...
episode: 1079 no of steps: 142 score: 36.0 avg score: 0.2535 memorylength: 131072 epsilon: 0.37866628223599025
Training...
episode: 1080 no of steps: 151 score: 147.0 avg score: 0.9735 memorylength: 131072 epsilon: 0.3783256359048205
Training...
episode: 1081 no of steps: 152 score: 78.0 avg score: 0.5132 memorylength: 131072 epsilon: 0.3779852960174284
Training...
episode: 1082 no of steps: 151 score: -25.0 avg score: -0.1656 memorylength: 131072 epsilon: 0.37764526229813866
Training...
episode: 1083 no of steps: 141 score: 79.0 avg score: 0.5603 memorylength: 131072 epsilon: 0.37730553447152393
Training...
episode: 1084 no of steps: 146 score: 173.0 avg score: 1.1849 memorylength: 131072 epsilon: 0.3769661122624047
Training...
episode: 1085 no of steps: 130 score: 74.0 avg score: 0.5692 memorylength: 131072 epsilon: 0.3766269953958489
Training...
episode: 1086 no of steps: 129 score: 400.0 avg score: 3.1008 memorylength: 131072 epsilon: 0.3762881835971718
Training...
episode: 1087 no of steps: 127 score: 568.0 avg score: 4.4724 memorylength: 131072 epsilon: 0.37594967659193596
Training...
episode: 1088 no of steps: 130 score: 551.0 avg score: 4.2385 memorylength: 131072 epsilon: 0.3756114741059506
Training...
episode: 1089 no of steps: 141 score: 305.0 avg score: 2.1631 memorylength: 131072 epsilon: 0.3752735758652716
Training...
episode: 1090 no of steps: 153 score: 33.0 avg score: 0.2157 memorylength: 131072 epsilon: 0.37493598159620156
Training...
episode: 1091 no of steps: 152 score: 412.0 avg score: 2.7105 memorylength: 131072 epsilon: 0.37459869102528903
Training...
episode: 1092 no of steps: 131 score: 535.0 avg score: 4.084 memorylength: 131072 epsilon: 0.37426170387932856
Training...
episode: 1093 no of steps: 155 score: 521.0 avg score: 3.3613 memorylength: 131072 epsilon: 0.37392501988536064
Training...
episode: 1094 no of steps: 149 score: 403.0 avg score: 2.7047 memorylength: 131072 epsilon: 0.37358863877067117
Training...
episode: 1095 no of steps: 144 score: 535.0 avg score: 3.7153 memorylength: 131072 epsilon: 0.3732525602627914
Training...
episode: 1096 no of steps: 141 score: 589.0 avg score: 4.1773 memorylength: 131072 epsilon: 0.37291678408949774
Training...
episode: 1097 no of steps: 152 score: 9.0 avg score: 0.0592 memorylength: 131072 epsilon: 0.3725813099788115
Training...
episode: 1098 no of steps: 128 score: 225.0 avg score: 1.7578 memorylength: 131072 epsilon: 0.3722461376589986
Training...
episode: 1099 no of steps: 127 score: 228.0 avg score: 1.7953 memorylength: 131072 epsilon: 0.3719112668585695
Training...
episode: 1100 no of steps: 145 score: 252.0 avg score: 1.7379 memorylength: 131072 epsilon: 0.3715766973062788
saving states...
Training...
episode: 1101 no of steps: 146 score: -69.0 avg score: -0.4726 memorylength: 131072 epsilon: 0.37124242873112506
Training...
episode: 1102 no of steps: 125 score: 99.0 avg score: 0.792 memorylength: 131072 epsilon: 0.37090846086235085
Training...
episode: 1103 no of steps: 138 score: 223.0 avg score: 1.6159 memorylength: 131072 epsilon: 0.37057479342944205
Training...
episode: 1104 no of steps: 122 score: 135.0 avg score: 1.1066 memorylength: 131072 epsilon: 0.3702414261621282
Training...
episode: 1105 no of steps: 133 score: 78.0 avg score: 0.5865 memorylength: 131072 epsilon: 0.3699083587903816
Training...
episode: 1106 no of steps: 129 score: 388.0 avg score: 3.0078 memorylength: 131072 epsilon: 0.36957559104441773
Training...
episode: 1107 no of steps: 144 score: 74.0 avg score: 0.5139 memorylength: 131072 epsilon: 0.3692431226546947
Training...
episode: 1108 no of steps: 129 score: 198.0 avg score: 1.5349 memorylength: 131072 epsilon: 0.3689109533519132
Training...
episode: 1109 no of steps: 131 score: 360.0 avg score: 2.7481 memorylength: 131072 epsilon: 0.36857908286701596
Training...
episode: 1110 no of steps: 131 score: 336.0 avg score: 2.5649 memorylength: 131072 epsilon: 0.36824751093118785
Training...
episode: 1111 no of steps: 131 score: 207.0 avg score: 1.5802 memorylength: 131072 epsilon: 0.36791623727585565
Training...
episode: 1112 no of steps: 136 score: 461.0 avg score: 3.3897 memorylength: 131072 epsilon: 0.3675852616326877
Training...
episode: 1113 no of steps: 143 score: 535.0 avg score: 3.7413 memorylength: 131072 epsilon: 0.3672545837335936
Training...
episode: 1114 no of steps: 139 score: 527.0 avg score: 3.7914 memorylength: 131072 epsilon: 0.3669242033107244
Training...
episode: 1115 no of steps: 131 score: 180.0 avg score: 1.374 memorylength: 131072 epsilon: 0.3665941200964717
Training...
episode: 1116 no of steps: 150 score: 292.0 avg score: 1.9467 memorylength: 131072 epsilon: 0.3662643338234683
Training...
episode: 1117 no of steps: 140 score: 323.0 avg score: 2.3071 memorylength: 131072 epsilon: 0.3659348442245872
Training...
episode: 1118 no of steps: 126 score: 82.0 avg score: 0.6508 memorylength: 131072 epsilon: 0.3656056510329419
Training...
episode: 1119 no of steps: 157 score: 47.0 avg score: 0.2994 memorylength: 131072 epsilon: 0.3652767539818858
Training...
episode: 1120 no of steps: 153 score: 243.0 avg score: 1.5882 memorylength: 131072 epsilon: 0.36494815280501225
Training...
episode: 1121 no of steps: 170 score: 279.0 avg score: 1.6412 memorylength: 131072 epsilon: 0.36461984723615437
Training...
episode: 1122 no of steps: 154 score: 261.0 avg score: 1.6948 memorylength: 131072 epsilon: 0.36429183700938456
Training...
episode: 1123 no of steps: 139 score: 543.0 avg score: 3.9065 memorylength: 131072 epsilon: 0.3639641218590145
Training...
episode: 1124 no of steps: 148 score: 126.0 avg score: 0.8514 memorylength: 131072 epsilon: 0.363636701519595
Training...
episode: 1125 no of steps: 143 score: 845.0 avg score: 5.9091 memorylength: 131072 epsilon: 0.36330957572591555
Training...
episode: 1126 no of steps: 135 score: 316.0 avg score: 2.3407 memorylength: 131072 epsilon: 0.36298274421300414
Training...
episode: 1127 no of steps: 143 score: 160.0 avg score: 1.1189 memorylength: 131072 epsilon: 0.36265620671612736
Training...
episode: 1128 no of steps: 133 score: 77.0 avg score: 0.5789 memorylength: 131072 epsilon: 0.3623299629707897
Training...
episode: 1129 no of steps: 139 score: 267.0 avg score: 1.9209 memorylength: 131072 epsilon: 0.3620040127127337
Training...
episode: 1130 no of steps: 139 score: 341.0 avg score: 2.4532 memorylength: 131072 epsilon: 0.3616783556779398
Training...
episode: 1131 no of steps: 127 score: 286.0 avg score: 2.252 memorylength: 131072 epsilon: 0.3613529916026256
Training...
episode: 1132 no of steps: 140 score: 21.0 avg score: 0.15 memorylength: 131072 epsilon: 0.3610279202232463
Training...
episode: 1133 no of steps: 133 score: 396.0 avg score: 2.9774 memorylength: 131072 epsilon: 0.36070314127649394
Training...
episode: 1134 no of steps: 130 score: 92.0 avg score: 0.7077 memorylength: 131072 epsilon: 0.36037865449929773
Training...
episode: 1135 no of steps: 134 score: 223.0 avg score: 1.6642 memorylength: 131072 epsilon: 0.3600544596288232
Training...
episode: 1136 no of steps: 137 score: 155.0 avg score: 1.1314 memorylength: 131072 epsilon: 0.3597305564024726
Training...
episode: 1137 no of steps: 141 score: 295.0 avg score: 2.0922 memorylength: 131072 epsilon: 0.3594069445578843
Training...
episode: 1138 no of steps: 137 score: 333.0 avg score: 2.4307 memorylength: 131072 epsilon: 0.3590836238329325
Training...
episode: 1139 no of steps: 152 score: 573.0 avg score: 3.7697 memorylength: 131072 epsilon: 0.3587605939657277
Training...
episode: 1140 no of steps: 147 score: 403.0 avg score: 2.7415 memorylength: 131072 epsilon: 0.35843785469461537
Training...
episode: 1141 no of steps: 132 score: 549.0 avg score: 4.1591 memorylength: 131072 epsilon: 0.35811540575817696
Training...
episode: 1142 no of steps: 139 score: 607.0 avg score: 4.3669 memorylength: 131072 epsilon: 0.35779324689522857
Training...
episode: 1143 no of steps: 141 score: 216.0 avg score: 1.5319 memorylength: 131072 epsilon: 0.35747137784482175
Training...
episode: 1144 no of steps: 136 score: 263.0 avg score: 1.9338 memorylength: 131072 epsilon: 0.3571497983462424
Training...
episode: 1145 no of steps: 141 score: 53.0 avg score: 0.3759 memorylength: 131072 epsilon: 0.3568285081390111
Training...
episode: 1146 no of steps: 149 score: -79.0 avg score: -0.5302 memorylength: 131072 epsilon: 0.3565075069628829
Training...
episode: 1147 no of steps: 149 score: 18.0 avg score: 0.1208 memorylength: 131072 epsilon: 0.3561867945578466
Training...
episode: 1148 no of steps: 160 score: 235.0 avg score: 1.4688 memorylength: 131072 epsilon: 0.35586637066412535
Training...
episode: 1149 no of steps: 152 score: 595.0 avg score: 3.9145 memorylength: 131072 epsilon: 0.35554623502217564
Training...
episode: 1150 no of steps: 159 score: 1117.0 avg score: 7.0252 memorylength: 131072 epsilon: 0.3552263873726877
saving states...
Training...
episode: 1151 no of steps: 171 score: 720.0 avg score: 4.2105 memorylength: 131072 epsilon: 0.3549068274565848
Training...
episode: 1152 no of steps: 150 score: 606.0 avg score: 4.04 memorylength: 131072 epsilon: 0.3545875550150235
Training...
episode: 1153 no of steps: 155 score: 708.0 avg score: 4.5677 memorylength: 131072 epsilon: 0.354268569789393
Training...
episode: 1154 no of steps: 134 score: 451.0 avg score: 3.3657 memorylength: 131072 epsilon: 0.3539498715213153
Training...
episode: 1155 no of steps: 130 score: 170.0 avg score: 1.3077 memorylength: 131072 epsilon: 0.35363145995264483
Training...
episode: 1156 no of steps: 135 score: 694.0 avg score: 5.1407 memorylength: 131072 epsilon: 0.3533133348254681
Training...
episode: 1157 no of steps: 128 score: 279.0 avg score: 2.1797 memorylength: 131072 epsilon: 0.3529954958821038
Training...
episode: 1158 no of steps: 131 score: 49.0 avg score: 0.374 memorylength: 131072 epsilon: 0.3526779428651024
Training...
episode: 1159 no of steps: 133 score: 34.0 avg score: 0.2556 memorylength: 131072 epsilon: 0.3523606755172459
Training...
episode: 1160 no of steps: 138 score: 127.0 avg score: 0.9203 memorylength: 131072 epsilon: 0.3520436935815477
Training...
episode: 1161 no of steps: 141 score: 3.0 avg score: 0.0213 memorylength: 131072 epsilon: 0.35172699680125247
Training...
episode: 1162 no of steps: 145 score: 391.0 avg score: 2.6966 memorylength: 131072 epsilon: 0.3514105849198358
Training...
episode: 1163 no of steps: 156 score: 445.0 avg score: 2.8526 memorylength: 131072 epsilon: 0.351094457681004
Training...
episode: 1164 no of steps: 145 score: 504.0 avg score: 3.4759 memorylength: 131072 epsilon: 0.35077861482869405
Training...
episode: 1165 no of steps: 144 score: 886.0 avg score: 6.1528 memorylength: 131072 epsilon: 0.3504630561070731
Training...
episode: 1166 no of steps: 112 score: 621.0 avg score: 5.5446 memorylength: 131072 epsilon: 0.3501477812605388
Training...
episode: 1167 no of steps: 122 score: 414.0 avg score: 3.3934 memorylength: 131072 epsilon: 0.34983279003371825
Training...
episode: 1168 no of steps: 123 score: 197.0 avg score: 1.6016 memorylength: 131072 epsilon: 0.34951808217146874
Training...
episode: 1169 no of steps: 127 score: 491.0 avg score: 3.8661 memorylength: 131072 epsilon: 0.3492036574188767
Training...
episode: 1170 no of steps: 140 score: 222.0 avg score: 1.5857 memorylength: 131072 epsilon: 0.34888951552125824
Training...
episode: 1171 no of steps: 143 score: 354.0 avg score: 2.4755 memorylength: 131072 epsilon: 0.34857565622415826
Training...
episode: 1172 no of steps: 149 score: 567.0 avg score: 3.8054 memorylength: 131072 epsilon: 0.3482620792733509
Training...
episode: 1173 no of steps: 137 score: 156.0 avg score: 1.1387 memorylength: 131072 epsilon: 0.3479487844148386
Training...
episode: 1174 no of steps: 151 score: -71.0 avg score: -0.4702 memorylength: 131072 epsilon: 0.34763577139485263
Training...
episode: 1175 no of steps: 164 score: 171.0 avg score: 1.0427 memorylength: 131072 epsilon: 0.34732303995985236
Training...
episode: 1176 no of steps: 157 score: 379.0 avg score: 2.414 memorylength: 131072 epsilon: 0.34701058985652533
Training...
episode: 1177 no of steps: 148 score: 250.0 avg score: 1.6892 memorylength: 131072 epsilon: 0.3466984208317871
Training...
episode: 1178 no of steps: 131 score: 107.0 avg score: 0.8168 memorylength: 131072 epsilon: 0.3463865326327804
Training...
episode: 1179 no of steps: 131 score: 351.0 avg score: 2.6794 memorylength: 131072 epsilon: 0.34607492500687614
Training...
episode: 1180 no of steps: 152 score: 387.0 avg score: 2.5461 memorylength: 131072 epsilon: 0.3457635977016718
Training...
episode: 1181 no of steps: 141 score: 387.0 avg score: 2.7447 memorylength: 131072 epsilon: 0.34545255046499257
Training...
episode: 1182 no of steps: 148 score: 424.0 avg score: 2.8649 memorylength: 131072 epsilon: 0.3451417830448899
Training...
episode: 1183 no of steps: 135 score: 544.0 avg score: 4.0296 memorylength: 131072 epsilon: 0.3448312951896423
Training...
episode: 1184 no of steps: 131 score: 412.0 avg score: 3.145 memorylength: 131072 epsilon: 0.34452108664775455
Training...
episode: 1185 no of steps: 137 score: 727.0 avg score: 5.3066 memorylength: 131072 epsilon: 0.3442111571679577
Training...
episode: 1186 no of steps: 132 score: 468.0 avg score: 3.5455 memorylength: 131072 epsilon: 0.3439015064992089
Training...
episode: 1187 no of steps: 135 score: 337.0 avg score: 2.4963 memorylength: 131072 epsilon: 0.3435921343906911
Training...
episode: 1188 no of steps: 142 score: 229.0 avg score: 1.6127 memorylength: 131072 epsilon: 0.3432830405918128
Training...
episode: 1189 no of steps: 145 score: 414.0 avg score: 2.8552 memorylength: 131072 epsilon: 0.34297422485220797
Training...
episode: 1190 no of steps: 143 score: 155.0 avg score: 1.0839 memorylength: 131072 epsilon: 0.34266568692173605
Training...
episode: 1191 no of steps: 147 score: 687.0 avg score: 4.6735 memorylength: 131072 epsilon: 0.3423574265504811
Training...
episode: 1192 no of steps: 167 score: 375.0 avg score: 2.2455 memorylength: 131072 epsilon: 0.3420494434887523
Training...
episode: 1193 no of steps: 137 score: 660.0 avg score: 4.8175 memorylength: 131072 epsilon: 0.34174173748708336
Training...
episode: 1194 no of steps: 145 score: 827.0 avg score: 5.7034 memorylength: 131072 epsilon: 0.34143430829623234
Training...
episode: 1195 no of steps: 155 score: 518.0 avg score: 3.3419 memorylength: 131072 epsilon: 0.34112715566718166
Training...
episode: 1196 no of steps: 143 score: 546.0 avg score: 3.8182 memorylength: 131072 epsilon: 0.3408202793511375
Training...
episode: 1197 no of steps: 128 score: 244.0 avg score: 1.9062 memorylength: 131072 epsilon: 0.3405136790995303
Training...
episode: 1198 no of steps: 144 score: 459.0 avg score: 3.1875 memorylength: 131072 epsilon: 0.3402073546640135
Training...
episode: 1199 no of steps: 135 score: 403.0 avg score: 2.9852 memorylength: 131072 epsilon: 0.3399013057964646
Training...
episode: 1200 no of steps: 126 score: 286.0 avg score: 2.2698 memorylength: 131072 epsilon: 0.3395955322489838
saving states...
Training...
episode: 1201 no of steps: 133 score: 116.0 avg score: 0.8722 memorylength: 131072 epsilon: 0.3392900337738947
Training...
episode: 1202 no of steps: 153 score: -95.0 avg score: -0.6209 memorylength: 131072 epsilon: 0.33898481012374343
Training...
episode: 1203 no of steps: 154 score: 494.0 avg score: 3.2078 memorylength: 131072 epsilon: 0.33867986105129866
Training...
episode: 1204 no of steps: 156 score: 444.0 avg score: 2.8462 memorylength: 131072 epsilon: 0.3383751863095519
Training...
episode: 1205 no of steps: 156 score: 303.0 avg score: 1.9423 memorylength: 131072 epsilon: 0.3380707856517163
Training...
episode: 1206 no of steps: 152 score: 486.0 avg score: 3.1974 memorylength: 131072 epsilon: 0.3377666588312276
Training...
episode: 1207 no of steps: 157 score: 606.0 avg score: 3.8599 memorylength: 131072 epsilon: 0.3374628056017428
Training...
episode: 1208 no of steps: 142 score: 882.0 avg score: 6.2113 memorylength: 131072 epsilon: 0.33715922571714096
Training...
episode: 1209 no of steps: 146 score: 1193.0 avg score: 8.1712 memorylength: 131072 epsilon: 0.3368559189315222
Training...
episode: 1210 no of steps: 127 score: 573.0 avg score: 4.5118 memorylength: 131072 epsilon: 0.3365528849992082
Training...
episode: 1211 no of steps: 133 score: 553.0 avg score: 4.1579 memorylength: 131072 epsilon: 0.3362501236747414
Training...
episode: 1212 no of steps: 139 score: 198.0 avg score: 1.4245 memorylength: 131072 epsilon: 0.3359476347128849
Training...
episode: 1213 no of steps: 136 score: 369.0 avg score: 2.7132 memorylength: 131072 epsilon: 0.3356454178686229
Training...
episode: 1214 no of steps: 132 score: 270.0 avg score: 2.0455 memorylength: 131072 epsilon: 0.33534347289715954
Training...
episode: 1215 no of steps: 151 score: 555.0 avg score: 3.6755 memorylength: 131072 epsilon: 0.33504179955391955
Training...
episode: 1216 no of steps: 145 score: 330.0 avg score: 2.2759 memorylength: 131072 epsilon: 0.3347403975945473
Training...
episode: 1217 no of steps: 155 score: 413.0 avg score: 2.6645 memorylength: 131072 epsilon: 0.33443926677490743
Training...
episode: 1218 no of steps: 148 score: 425.0 avg score: 2.8716 memorylength: 131072 epsilon: 0.33413840685108376
Training...
episode: 1219 no of steps: 153 score: 444.0 avg score: 2.902 memorylength: 131072 epsilon: 0.3338378175793798
Training...
episode: 1220 no of steps: 151 score: 664.0 avg score: 4.3974 memorylength: 131072 epsilon: 0.3335374987163183
Training...
episode: 1221 no of steps: 137 score: 476.0 avg score: 3.4745 memorylength: 131072 epsilon: 0.33323745001864086
Training...
episode: 1222 no of steps: 146 score: 759.0 avg score: 5.1986 memorylength: 131072 epsilon: 0.3329376712433081
Training...
episode: 1223 no of steps: 140 score: 364.0 avg score: 2.6 memorylength: 131072 epsilon: 0.33263816214749903
Training...
episode: 1224 no of steps: 133 score: 381.0 avg score: 2.8647 memorylength: 131072 epsilon: 0.33233892248861147
Training...
episode: 1225 no of steps: 130 score: 462.0 avg score: 3.5538 memorylength: 131072 epsilon: 0.3320399520242612
Training...
episode: 1226 no of steps: 134 score: 90.0 avg score: 0.6716 memorylength: 131072 epsilon: 0.3317412505122821
Training...
episode: 1227 no of steps: 130 score: -123.0 avg score: -0.9462 memorylength: 131072 epsilon: 0.3314428177107259
Training...
episode: 1228 no of steps: 126 score: 201.0 avg score: 1.5952 memorylength: 131072 epsilon: 0.33114465337786214
Training...
episode: 1229 no of steps: 140 score: 162.0 avg score: 1.1571 memorylength: 131072 epsilon: 0.3308467572721777
Training...
episode: 1230 no of steps: 137 score: 1.0 avg score: 0.0073 memorylength: 131072 epsilon: 0.3305491291523765
Training...
episode: 1231 no of steps: 145 score: 534.0 avg score: 3.6828 memorylength: 131072 epsilon: 0.33025176877737994
Training...
episode: 1232 no of steps: 150 score: 270.0 avg score: 1.8 memorylength: 131072 epsilon: 0.32995467590632604
Training...
episode: 1233 no of steps: 141 score: 188.0 avg score: 1.3333 memorylength: 131072 epsilon: 0.3296578502985696
Training...
episode: 1234 no of steps: 142 score: 416.0 avg score: 2.9296 memorylength: 131072 epsilon: 0.3293612917136817
Training...
episode: 1235 no of steps: 134 score: 273.0 avg score: 2.0373 memorylength: 131072 epsilon: 0.3290649999114501
Training...
episode: 1236 no of steps: 136 score: 369.0 avg score: 2.7132 memorylength: 131072 epsilon: 0.3287689746518783
Training...
episode: 1237 no of steps: 152 score: 372.0 avg score: 2.4474 memorylength: 131072 epsilon: 0.3284732156951859
Training...
episode: 1238 no of steps: 151 score: 839.0 avg score: 5.5563 memorylength: 131072 epsilon: 0.32817772280180796
Training...
episode: 1239 no of steps: 175 score: 290.0 avg score: 1.6571 memorylength: 131072 epsilon: 0.3278824957323954
Training...
episode: 1240 no of steps: 145 score: 655.0 avg score: 4.5172 memorylength: 131072 epsilon: 0.3275875342478143
Training...
episode: 1241 no of steps: 151 score: 561.0 avg score: 3.7152 memorylength: 131072 epsilon: 0.3272928381091456
Training...
episode: 1242 no of steps: 142 score: 30.0 avg score: 0.2113 memorylength: 131072 epsilon: 0.3269984070776857
Training...
episode: 1243 no of steps: 152 score: 157.0 avg score: 1.0329 memorylength: 131072 epsilon: 0.32670424091494515
Training...
episode: 1244 no of steps: 145 score: 488.0 avg score: 3.3655 memorylength: 131072 epsilon: 0.32641033938264963
Training...
episode: 1245 no of steps: 160 score: 278.0 avg score: 1.7375 memorylength: 131072 epsilon: 0.3261167022427387
Training...
episode: 1246 no of steps: 158 score: 844.0 avg score: 5.3418 memorylength: 131072 epsilon: 0.3258233292573663
Training...
episode: 1247 no of steps: 142 score: 962.0 avg score: 6.7746 memorylength: 131072 epsilon: 0.3255302201889003
Training...
episode: 1248 no of steps: 147 score: 630.0 avg score: 4.2857 memorylength: 131072 epsilon: 0.32523737479992243
Training...
episode: 1249 no of steps: 135 score: 634.0 avg score: 4.6963 memorylength: 131072 epsilon: 0.32494479285322786
Training...
episode: 1250 no of steps: 147 score: 857.0 avg score: 5.8299 memorylength: 131072 epsilon: 0.324652474111825
saving states...
Training...
episode: 1251 no of steps: 144 score: 478.0 avg score: 3.3194 memorylength: 131072 epsilon: 0.32436041833893603
Training...
episode: 1252 no of steps: 137 score: 442.0 avg score: 3.2263 memorylength: 131072 epsilon: 0.32406862529799535
Training...
episode: 1253 no of steps: 142 score: 507.0 avg score: 3.5704 memorylength: 131072 epsilon: 0.32377709475265093
Training...
episode: 1254 no of steps: 139 score: 714.0 avg score: 5.1367 memorylength: 131072 epsilon: 0.32348582646676277
Training...
episode: 1255 no of steps: 126 score: 245.0 avg score: 1.9444 memorylength: 131072 epsilon: 0.32319482020440365
Training...
episode: 1256 no of steps: 139 score: 327.0 avg score: 2.3525 memorylength: 131072 epsilon: 0.32290407572985846
Training...
episode: 1257 no of steps: 137 score: 380.0 avg score: 2.7737 memorylength: 131072 epsilon: 0.32261359280762425
Training...
episode: 1258 no of steps: 150 score: 373.0 avg score: 2.4867 memorylength: 131072 epsilon: 0.32232337120240967
Training...
episode: 1259 no of steps: 127 score: 148.0 avg score: 1.1654 memorylength: 131072 epsilon: 0.3220334106791353
Training...
episode: 1260 no of steps: 136 score: 400.0 avg score: 2.9412 memorylength: 131072 epsilon: 0.32174371100293314
Training...
episode: 1261 no of steps: 137 score: 428.0 avg score: 3.1241 memorylength: 131072 epsilon: 0.3214542719391463
Training...
episode: 1262 no of steps: 134 score: -23.0 avg score: -0.1716 memorylength: 131072 epsilon: 0.32116509325332926
Training...
episode: 1263 no of steps: 141 score: 274.0 avg score: 1.9433 memorylength: 131072 epsilon: 0.3208761747112472
Training...
episode: 1264 no of steps: 135 score: 393.0 avg score: 2.9111 memorylength: 131072 epsilon: 0.3205875160788761
Training...
episode: 1265 no of steps: 162 score: 442.0 avg score: 2.7284 memorylength: 131072 epsilon: 0.32029911712240244
Training...
episode: 1266 no of steps: 144 score: 443.0 avg score: 3.0764 memorylength: 131072 epsilon: 0.32001097760822306
Training...
episode: 1267 no of steps: 149 score: 485.0 avg score: 3.255 memorylength: 131072 epsilon: 0.319723097302945
Training...
episode: 1268 no of steps: 146 score: 319.0 avg score: 2.1849 memorylength: 131072 epsilon: 0.31943547597338506
Training...
episode: 1269 no of steps: 144 score: 602.0 avg score: 4.1806 memorylength: 131072 epsilon: 0.3191481133865701
Training...
episode: 1270 no of steps: 146 score: 721.0 avg score: 4.9384 memorylength: 131072 epsilon: 0.31886100930973627
Training...
episode: 1271 no of steps: 142 score: 562.0 avg score: 3.9577 memorylength: 131072 epsilon: 0.31857416351032936
Training...
episode: 1272 no of steps: 154 score: 553.0 avg score: 3.5909 memorylength: 131072 epsilon: 0.31828757575600414
Training...
episode: 1273 no of steps: 140 score: 551.0 avg score: 3.9357 memorylength: 131072 epsilon: 0.31800124581462463
Training...
episode: 1274 no of steps: 142 score: 479.0 avg score: 3.3732 memorylength: 131072 epsilon: 0.3177151734542635
Training...
episode: 1275 no of steps: 147 score: 684.0 avg score: 4.6531 memorylength: 131072 epsilon: 0.31742935844320214
Training...
episode: 1276 no of steps: 137 score: 531.0 avg score: 3.8759 memorylength: 131072 epsilon: 0.31714380054993047
Training...
episode: 1277 no of steps: 157 score: 43.0 avg score: 0.2739 memorylength: 131072 epsilon: 0.3168584995431463
Training...
episode: 1278 no of steps: 121 score: 542.0 avg score: 4.4793 memorylength: 131072 epsilon: 0.31657345519175617
Training...
episode: 1279 no of steps: 126 score: 295.0 avg score: 2.3413 memorylength: 131072 epsilon: 0.3162886672648738
Training...
episode: 1280 no of steps: 142 score: 328.0 avg score: 2.3099 memorylength: 131072 epsilon: 0.3160041355318213
Training...
episode: 1281 no of steps: 140 score: 344.0 avg score: 2.4571 memorylength: 131072 epsilon: 0.3157198597621275
Training...
episode: 1282 no of steps: 125 score: 264.0 avg score: 2.112 memorylength: 131072 epsilon: 0.31543583972552947
Training...
episode: 1283 no of steps: 146 score: 85.0 avg score: 0.5822 memorylength: 131072 epsilon: 0.31515207519197064
Training...
episode: 1284 no of steps: 143 score: 651.0 avg score: 4.5524 memorylength: 131072 epsilon: 0.314868565931602
Training...
episode: 1285 no of steps: 145 score: 369.0 avg score: 2.5448 memorylength: 131072 epsilon: 0.31458531171478077
Training...
episode: 1286 no of steps: 147 score: 270.0 avg score: 1.8367 memorylength: 131072 epsilon: 0.3143023123120711
Training...
episode: 1287 no of steps: 134 score: 881.0 avg score: 6.5746 memorylength: 131072 epsilon: 0.3140195674942436
Training...
episode: 1288 no of steps: 151 score: 854.0 avg score: 5.6556 memorylength: 131072 epsilon: 0.3137370770322747
Training...
episode: 1289 no of steps: 136 score: 773.0 avg score: 5.6838 memorylength: 131072 epsilon: 0.31345484069734736
Training...
episode: 1290 no of steps: 131 score: 393.0 avg score: 3.0 memorylength: 131072 epsilon: 0.31317285826084995
Training...
episode: 1291 no of steps: 144 score: 656.0 avg score: 4.5556 memorylength: 131072 epsilon: 0.3128911294943768
Training...
episode: 1292 no of steps: 128 score: 315.0 avg score: 2.4609 memorylength: 131072 epsilon: 0.3126096541697275
Training...
episode: 1293 no of steps: 144 score: 88.0 avg score: 0.6111 memorylength: 131072 epsilon: 0.3123284320589072
Training...
episode: 1294 no of steps: 149 score: 85.0 avg score: 0.5705 memorylength: 131072 epsilon: 0.3120474629341257
Training...
episode: 1295 no of steps: 150 score: 120.0 avg score: 0.8 memorylength: 131072 epsilon: 0.3117667465677982
Training...
episode: 1296 no of steps: 144 score: 504.0 avg score: 3.5 memorylength: 131072 epsilon: 0.3114862827325444
Training...
episode: 1297 no of steps: 152 score: 220.0 avg score: 1.4474 memorylength: 131072 epsilon: 0.31120607120118843
Training...
episode: 1298 no of steps: 173 score: 295.0 avg score: 1.7052 memorylength: 131072 epsilon: 0.31092611174675916
Training...
episode: 1299 no of steps: 149 score: 51.0 avg score: 0.3423 memorylength: 131072 epsilon: 0.31064640414248923
Training...
episode: 1300 no of steps: 154 score: 396.0 avg score: 2.5714 memorylength: 131072 epsilon: 0.3103669481618156
saving states...
Training...
episode: 1301 no of steps: 133 score: 629.0 avg score: 4.7293 memorylength: 131072 epsilon: 0.31008774357837876
Training...
episode: 1302 no of steps: 155 score: 612.0 avg score: 3.9484 memorylength: 131072 epsilon: 0.3098087901660232
Training...
episode: 1303 no of steps: 145 score: 575.0 avg score: 3.9655 memorylength: 131072 epsilon: 0.30953008769879636
Training...
episode: 1304 no of steps: 146 score: 434.0 avg score: 2.9726 memorylength: 131072 epsilon: 0.3092516359509495
Training...
episode: 1305 no of steps: 138 score: 335.0 avg score: 2.4275 memorylength: 131072 epsilon: 0.3089734346969366
Training...
episode: 1306 no of steps: 137 score: 319.0 avg score: 2.3285 memorylength: 131072 epsilon: 0.3086954837114145
Training...
episode: 1307 no of steps: 140 score: 359.0 avg score: 2.5643 memorylength: 131072 epsilon: 0.3084177827692431
Training...
episode: 1308 no of steps: 145 score: 234.0 avg score: 1.6138 memorylength: 131072 epsilon: 0.3081403316454843
Training...
episode: 1309 no of steps: 153 score: 23.0 avg score: 0.1503 memorylength: 131072 epsilon: 0.30786313011540306
Training...
episode: 1310 no of steps: 144 score: 203.0 avg score: 1.4097 memorylength: 131072 epsilon: 0.30758617795446586
Training...
episode: 1311 no of steps: 157 score: 513.0 avg score: 3.2675 memorylength: 131072 epsilon: 0.30730947493834154
Training...
episode: 1312 no of steps: 136 score: 648.0 avg score: 4.7647 memorylength: 131072 epsilon: 0.30703302084290063
Training...
episode: 1313 no of steps: 124 score: 576.0 avg score: 4.6452 memorylength: 131072 epsilon: 0.30675681544421535
Training...
episode: 1314 no of steps: 127 score: 563.0 avg score: 4.4331 memorylength: 131072 epsilon: 0.3064808585185592
Training...
episode: 1315 no of steps: 138 score: 700.0 avg score: 5.0725 memorylength: 131072 epsilon: 0.30620514984240704
Training...
episode: 1316 no of steps: 139 score: 468.0 avg score: 3.3669 memorylength: 131072 epsilon: 0.305929689192435
Training...
episode: 1317 no of steps: 145 score: 603.0 avg score: 4.1586 memorylength: 131072 epsilon: 0.3056544763455198
Training...
episode: 1318 no of steps: 127 score: 11.0 avg score: 0.0866 memorylength: 131072 epsilon: 0.305379511078739
Training...
episode: 1319 no of steps: 145 score: 51.0 avg score: 0.3517 memorylength: 131072 epsilon: 0.30510479316937084
Training...
episode: 1320 no of steps: 156 score: 265.0 avg score: 1.6987 memorylength: 131072 epsilon: 0.30483032239489366
Training...
episode: 1321 no of steps: 155 score: 493.0 avg score: 3.1806 memorylength: 131072 epsilon: 0.3045560985329862
Training...
episode: 1322 no of steps: 174 score: 562.0 avg score: 3.2299 memorylength: 131072 epsilon: 0.30428212136152716
Training...
episode: 1323 no of steps: 159 score: 801.0 avg score: 5.0377 memorylength: 131072 epsilon: 0.304008390658595
Training...
episode: 1324 no of steps: 180 score: 844.0 avg score: 4.6889 memorylength: 131072 epsilon: 0.3037349062024677
Training...
episode: 1325 no of steps: 167 score: 792.0 avg score: 4.7425 memorylength: 131072 epsilon: 0.3034616677716229
Training...
episode: 1326 no of steps: 157 score: 1051.0 avg score: 6.6943 memorylength: 131072 epsilon: 0.3031886751447375
Training...
episode: 1327 no of steps: 147 score: 619.0 avg score: 4.2109 memorylength: 131072 epsilon: 0.30291592810068757
Training...
episode: 1328 no of steps: 172 score: 552.0 avg score: 3.2093 memorylength: 131072 epsilon: 0.3026434264185477
Training...
episode: 1329 no of steps: 175 score: 105.0 avg score: 0.6 memorylength: 131072 epsilon: 0.30237116987759177
Training...
episode: 1330 no of steps: 165 score: 490.0 avg score: 2.9697 memorylength: 131072 epsilon: 0.3020991582572919
Training...
episode: 1331 no of steps: 151 score: 423.0 avg score: 2.8013 memorylength: 131072 epsilon: 0.30182739133731856
Training...
episode: 1332 no of steps: 158 score: 327.0 avg score: 2.0696 memorylength: 131072 epsilon: 0.30155586889754066
Training...
episode: 1333 no of steps: 133 score: 381.0 avg score: 2.8647 memorylength: 131072 epsilon: 0.3012845907180249
Training...
episode: 1334 no of steps: 154 score: 515.0 avg score: 3.3442 memorylength: 131072 epsilon: 0.30101355657903606
Training...
episode: 1335 no of steps: 139 score: 216.0 avg score: 1.554 memorylength: 131072 epsilon: 0.30074276626103635
Training...
episode: 1336 no of steps: 142 score: 306.0 avg score: 2.1549 memorylength: 131072 epsilon: 0.3004722195446857
Training...
episode: 1337 no of steps: 139 score: 768.0 avg score: 5.5252 memorylength: 131072 epsilon: 0.30020191621084114
Training...
episode: 1338 no of steps: 138 score: 504.0 avg score: 3.6522 memorylength: 131072 epsilon: 0.2999318560405571
Training...
episode: 1339 no of steps: 144 score: 765.0 avg score: 5.3125 memorylength: 131072 epsilon: 0.2996620388150847
Training...
episode: 1340 no of steps: 144 score: 424.0 avg score: 2.9444 memorylength: 131072 epsilon: 0.2993924643158721
Training...
episode: 1341 no of steps: 147 score: 219.0 avg score: 1.4898 memorylength: 131072 epsilon: 0.29912313232456383
Training...
episode: 1342 no of steps: 145 score: 467.0 avg score: 3.2207 memorylength: 131072 epsilon: 0.29885404262300097
Training...
episode: 1343 no of steps: 146 score: 526.0 avg score: 3.6027 memorylength: 131072 epsilon: 0.2985851949932209
Training...
episode: 1344 no of steps: 150 score: 216.0 avg score: 1.44 memorylength: 131072 epsilon: 0.29831658921745696
Training...
episode: 1345 no of steps: 141 score: 489.0 avg score: 3.4681 memorylength: 131072 epsilon: 0.29804822507813855
Training...
episode: 1346 no of steps: 158 score: 489.0 avg score: 3.0949 memorylength: 131072 epsilon: 0.2977801023578906
Training...
episode: 1347 no of steps: 152 score: 532.0 avg score: 3.5 memorylength: 131072 epsilon: 0.29751222083953377
Training...
episode: 1348 no of steps: 157 score: 450.0 avg score: 2.8662 memorylength: 131072 epsilon: 0.2972445803060839
Training...
episode: 1349 no of steps: 138 score: 693.0 avg score: 5.0217 memorylength: 131072 epsilon: 0.29697718054075234
Training...
episode: 1350 no of steps: 173 score: 253.0 avg score: 1.4624 memorylength: 131072 epsilon: 0.29671002132694513
saving states...
Training...
episode: 1351 no of steps: 184 score: 954.0 avg score: 5.1848 memorylength: 131072 epsilon: 0.29644310244826333
Training...
episode: 1352 no of steps: 144 score: 368.0 avg score: 2.5556 memorylength: 131072 epsilon: 0.2961764236885026
Training...
episode: 1353 no of steps: 183 score: 474.0 avg score: 2.5902 memorylength: 131072 epsilon: 0.2959099848316531
Training...
episode: 1354 no of steps: 152 score: 576.0 avg score: 3.7895 memorylength: 131072 epsilon: 0.29564378566189947
Training...
episode: 1355 no of steps: 159 score: 629.0 avg score: 3.956 memorylength: 131072 epsilon: 0.2953778259636202
Training...
episode: 1356 no of steps: 137 score: 492.0 avg score: 3.5912 memorylength: 131072 epsilon: 0.29511210552138817
Training...
episode: 1357 no of steps: 143 score: 529.0 avg score: 3.6993 memorylength: 131072 epsilon: 0.2948466241199695
Training...
episode: 1358 no of steps: 138 score: 173.0 avg score: 1.2536 memorylength: 131072 epsilon: 0.2945813815443245
Training...
episode: 1359 no of steps: 142 score: 17.0 avg score: 0.1197 memorylength: 131072 epsilon: 0.29431637757960644
Training...
episode: 1360 no of steps: 176 score: 614.0 avg score: 3.4886 memorylength: 131072 epsilon: 0.2940516120111623
Training...
episode: 1361 no of steps: 165 score: 668.0 avg score: 4.0485 memorylength: 131072 epsilon: 0.2937870846245319
Training...
episode: 1362 no of steps: 155 score: 6.0 avg score: 0.0387 memorylength: 131072 epsilon: 0.2935227952054479
Training...
episode: 1363 no of steps: 155 score: 705.0 avg score: 4.5484 memorylength: 131072 epsilon: 0.293258743539836
Training...
episode: 1364 no of steps: 141 score: 558.0 avg score: 3.9574 memorylength: 131072 epsilon: 0.2929949294138143
Training...
episode: 1365 no of steps: 130 score: 805.0 avg score: 6.1923 memorylength: 131072 epsilon: 0.2927313526136934
Training...
episode: 1366 no of steps: 127 score: 235.0 avg score: 1.8504 memorylength: 131072 epsilon: 0.29246801292597596
Training...
episode: 1367 no of steps: 144 score: 588.0 avg score: 4.0833 memorylength: 131072 epsilon: 0.2922049101373569
Training...
episode: 1368 no of steps: 130 score: 548.0 avg score: 4.2154 memorylength: 131072 epsilon: 0.2919420440347229
Training...
episode: 1369 no of steps: 140 score: 297.0 avg score: 2.1214 memorylength: 131072 epsilon: 0.29167941440515244
Training...
episode: 1370 no of steps: 151 score: 502.0 avg score: 3.3245 memorylength: 131072 epsilon: 0.2914170210359156
Training...
episode: 1371 no of steps: 157 score: 389.0 avg score: 2.4777 memorylength: 131072 epsilon: 0.29115486371447347
Training...
episode: 1372 no of steps: 144 score: 219.0 avg score: 1.5208 memorylength: 131072 epsilon: 0.29089294222847883
Training...
episode: 1373 no of steps: 153 score: 18.0 avg score: 0.1176 memorylength: 131072 epsilon: 0.2906312563657752
Training...
episode: 1374 no of steps: 153 score: -27.0 avg score: -0.1765 memorylength: 131072 epsilon: 0.2903698059143971
Training...
episode: 1375 no of steps: 156 score: 25.0 avg score: 0.1603 memorylength: 131072 epsilon: 0.2901085906625694
Training...
episode: 1376 no of steps: 149 score: 544.0 avg score: 3.651 memorylength: 131072 epsilon: 0.28984761039870804
Training...
episode: 1377 no of steps: 164 score: 714.0 avg score: 4.3537 memorylength: 131072 epsilon: 0.2895868649114188
Training...
episode: 1378 no of steps: 157 score: 576.0 avg score: 3.6688 memorylength: 131072 epsilon: 0.2893263539894979
Training...
episode: 1379 no of steps: 175 score: 925.0 avg score: 5.2857 memorylength: 131072 epsilon: 0.28906607742193147
Training...
episode: 1380 no of steps: 155 score: 987.0 avg score: 6.3677 memorylength: 131072 epsilon: 0.28880603499789537
Training...
episode: 1381 no of steps: 167 score: 810.0 avg score: 4.8503 memorylength: 131072 epsilon: 0.2885462265067554
Training...
episode: 1382 no of steps: 163 score: 706.0 avg score: 4.3313 memorylength: 131072 epsilon: 0.28828665173806645
Training...
episode: 1383 no of steps: 154 score: 771.0 avg score: 5.0065 memorylength: 131072 epsilon: 0.28802731048157315
Training...
episode: 1384 no of steps: 173 score: 418.0 avg score: 2.4162 memorylength: 131072 epsilon: 0.28776820252720897
Training...
episode: 1385 no of steps: 152 score: 854.0 avg score: 5.6184 memorylength: 131072 epsilon: 0.2875093276650965
Training...
episode: 1386 no of steps: 162 score: 719.0 avg score: 4.4383 memorylength: 131072 epsilon: 0.287250685685547
Training...
episode: 1387 no of steps: 150 score: 1063.0 avg score: 7.0867 memorylength: 131072 epsilon: 0.2869922763790606
Training...
episode: 1388 no of steps: 160 score: 706.0 avg score: 4.4125 memorylength: 131072 epsilon: 0.28673409953632567
Training...
episode: 1389 no of steps: 160 score: 711.0 avg score: 4.4438 memorylength: 131072 epsilon: 0.2864761549482188
Training...
episode: 1390 no of steps: 153 score: 1007.0 avg score: 6.5817 memorylength: 131072 epsilon: 0.28621844240580513
Training...
episode: 1391 no of steps: 150 score: 859.0 avg score: 5.7267 memorylength: 131072 epsilon: 0.2859609617003373
Training...
episode: 1392 no of steps: 147 score: 342.0 avg score: 2.3265 memorylength: 131072 epsilon: 0.285703712623256
Training...
episode: 1393 no of steps: 144 score: 499.0 avg score: 3.4653 memorylength: 131072 epsilon: 0.2854466949661894
Training...
episode: 1394 no of steps: 133 score: 198.0 avg score: 1.4887 memorylength: 131072 epsilon: 0.2851899085209533
Training...
episode: 1395 no of steps: 146 score: 493.0 avg score: 3.3767 memorylength: 131072 epsilon: 0.28493335307955053
Training...
episode: 1396 no of steps: 134 score: 402.0 avg score: 3.0 memorylength: 131072 epsilon: 0.2846770284341713
Training...
episode: 1397 no of steps: 130 score: 323.0 avg score: 2.4846 memorylength: 131072 epsilon: 0.28442093437719257
Training...
episode: 1398 no of steps: 135 score: 197.0 avg score: 1.4593 memorylength: 131072 epsilon: 0.2841650707011781
Training...
episode: 1399 no of steps: 132 score: 227.0 avg score: 1.7197 memorylength: 131072 epsilon: 0.28390943719887834
Training...
episode: 1400 no of steps: 148 score: 132.0 avg score: 0.8919 memorylength: 131072 epsilon: 0.2836540336632301
saving states...
Training...
episode: 1401 no of steps: 151 score: 174.0 avg score: 1.1523 memorylength: 131072 epsilon: 0.2833988598873566
Training...
episode: 1402 no of steps: 136 score: 590.0 avg score: 4.3382 memorylength: 131072 epsilon: 0.2831439156645669
Training...
episode: 1403 no of steps: 132 score: 449.0 avg score: 3.4015 memorylength: 131072 epsilon: 0.2828892007883564
Training...
episode: 1404 no of steps: 146 score: 328.0 avg score: 2.2466 memorylength: 131072 epsilon: 0.2826347150524058
Training...
episode: 1405 no of steps: 144 score: 657.0 avg score: 4.5625 memorylength: 131072 epsilon: 0.28238045825058183
Training...
episode: 1406 no of steps: 140 score: 916.0 avg score: 6.5429 memorylength: 131072 epsilon: 0.2821264301769364
Training...
episode: 1407 no of steps: 153 score: 436.0 avg score: 2.8497 memorylength: 131072 epsilon: 0.2818726306257066
Training...
episode: 1408 no of steps: 180 score: 267.0 avg score: 1.4833 memorylength: 131072 epsilon: 0.281619059391315
Training...
episode: 1409 no of steps: 153 score: 526.0 avg score: 3.4379 memorylength: 131072 epsilon: 0.2813657162683688
Training...
episode: 1410 no of steps: 163 score: 531.0 avg score: 3.2577 memorylength: 131072 epsilon: 0.2811126010516601
Training...
episode: 1411 no of steps: 170 score: 599.0 avg score: 3.5235 memorylength: 131072 epsilon: 0.28085971353616546
Training...
episode: 1412 no of steps: 146 score: 408.0 avg score: 2.7945 memorylength: 131072 epsilon: 0.28060705351704607
Training...
episode: 1413 no of steps: 142 score: 629.0 avg score: 4.4296 memorylength: 131072 epsilon: 0.2803546207896472
Training...
episode: 1414 no of steps: 157 score: 808.0 avg score: 5.1465 memorylength: 131072 epsilon: 0.2801024151494985
Training...
episode: 1415 no of steps: 148 score: 898.0 avg score: 6.0676 memorylength: 131072 epsilon: 0.2798504363923133
Training...
episode: 1416 no of steps: 155 score: 486.0 avg score: 3.1355 memorylength: 131072 epsilon: 0.2795986843139887
Training...
episode: 1417 no of steps: 148 score: 197.0 avg score: 1.3311 memorylength: 131072 epsilon: 0.27934715871060567
Training...
episode: 1418 no of steps: 147 score: 683.0 avg score: 4.6463 memorylength: 131072 epsilon: 0.27909585937842823
Training...
episode: 1419 no of steps: 152 score: 705.0 avg score: 4.6382 memorylength: 131072 epsilon: 0.2788447861139042
Training...
episode: 1420 no of steps: 143 score: 420.0 avg score: 2.9371 memorylength: 131072 epsilon: 0.27859393871366395
Training...
episode: 1421 no of steps: 149 score: 702.0 avg score: 4.7114 memorylength: 131072 epsilon: 0.27834331697452125
Training...
episode: 1422 no of steps: 152 score: 450.0 avg score: 2.9605 memorylength: 131072 epsilon: 0.27809292069347236
Training...
episode: 1423 no of steps: 149 score: 623.0 avg score: 4.1812 memorylength: 131072 epsilon: 0.2778427496676964
Training...
episode: 1424 no of steps: 150 score: 565.0 avg score: 3.7667 memorylength: 131072 epsilon: 0.2775928036945547
Training...
episode: 1425 no of steps: 145 score: 150.0 avg score: 1.0345 memorylength: 131072 epsilon: 0.2773430825715911
Training...
episode: 1426 no of steps: 157 score: 659.0 avg score: 4.1975 memorylength: 131072 epsilon: 0.2770935860965315
Training...
episode: 1427 no of steps: 142 score: 703.0 avg score: 4.9507 memorylength: 131072 epsilon: 0.2768443140672836
Training...
episode: 1428 no of steps: 163 score: 663.0 avg score: 4.0675 memorylength: 131072 epsilon: 0.27659526628193726
Training...
episode: 1429 no of steps: 146 score: 305.0 avg score: 2.089 memorylength: 131072 epsilon: 0.2763464425387635
Training...
episode: 1430 no of steps: 141 score: 492.0 avg score: 3.4894 memorylength: 131072 epsilon: 0.27609784263621523
Training...
episode: 1431 no of steps: 143 score: 283.0 avg score: 1.979 memorylength: 131072 epsilon: 0.2758494663729265
Training...
episode: 1432 no of steps: 147 score: 468.0 avg score: 3.1837 memorylength: 131072 epsilon: 0.27560131354771256
Training...
episode: 1433 no of steps: 163 score: 456.0 avg score: 2.7975 memorylength: 131072 epsilon: 0.2753533839595695
Training...
episode: 1434 no of steps: 148 score: 711.0 avg score: 4.8041 memorylength: 131072 epsilon: 0.27510567740767444
Training...
episode: 1435 no of steps: 140 score: 366.0 avg score: 2.6143 memorylength: 131072 epsilon: 0.2748581936913851
Training...
episode: 1436 no of steps: 137 score: 367.0 avg score: 2.6788 memorylength: 131072 epsilon: 0.2746109326102394
Training...
episode: 1437 no of steps: 136 score: -130.0 avg score: -0.9559 memorylength: 131072 epsilon: 0.27436389396395616
Training...
episode: 1438 no of steps: 174 score: 492.0 avg score: 2.8276 memorylength: 131072 epsilon: 0.27411707755243386
Training...
episode: 1439 no of steps: 167 score: 489.0 avg score: 2.9281 memorylength: 131072 epsilon: 0.27387048317575136
Training...
episode: 1440 no of steps: 153 score: 687.0 avg score: 4.4902 memorylength: 131072 epsilon: 0.273624110634167
Training...
episode: 1441 no of steps: 146 score: 675.0 avg score: 4.6233 memorylength: 131072 epsilon: 0.2733779597281192
Training...
episode: 1442 no of steps: 166 score: 544.0 avg score: 3.2771 memorylength: 131072 epsilon: 0.2731320302582255
Training...
episode: 1443 no of steps: 161 score: 907.0 avg score: 5.6335 memorylength: 131072 epsilon: 0.2728863220252833
Training...
episode: 1444 no of steps: 156 score: 742.0 avg score: 4.7564 memorylength: 131072 epsilon: 0.2726408348302687
Training...
episode: 1445 no of steps: 162 score: 625.0 avg score: 3.858 memorylength: 131072 epsilon: 0.27239556847433705
Training...
episode: 1446 no of steps: 147 score: 909.0 avg score: 6.1837 memorylength: 131072 epsilon: 0.27215052275882273
Training...
episode: 1447 no of steps: 148 score: 773.0 avg score: 5.223 memorylength: 131072 epsilon: 0.2719056974852386
Training...
episode: 1448 no of steps: 145 score: 418.0 avg score: 2.8828 memorylength: 131072 epsilon: 0.2716610924552762
Training...
episode: 1449 no of steps: 151 score: 476.0 avg score: 3.1523 memorylength: 131072 epsilon: 0.2714167074708055
Training...
episode: 1450 no of steps: 167 score: 561.0 avg score: 3.3593 memorylength: 131072 epsilon: 0.27117254233387456
saving states...
Training...
episode: 1451 no of steps: 174 score: 189.0 avg score: 1.0862 memorylength: 131072 epsilon: 0.27092859684670956
Training...
episode: 1452 no of steps: 158 score: 423.0 avg score: 2.6772 memorylength: 131072 epsilon: 0.2706848708117148
Training...
episode: 1453 no of steps: 154 score: 642.0 avg score: 4.1688 memorylength: 131072 epsilon: 0.27044136403147206
Training...
episode: 1454 no of steps: 167 score: 628.0 avg score: 3.7605 memorylength: 131072 epsilon: 0.2701980763087409
Training...
episode: 1455 no of steps: 150 score: 542.0 avg score: 3.6133 memorylength: 131072 epsilon: 0.2699550074464582
Training...
episode: 1456 no of steps: 151 score: 936.0 avg score: 6.1987 memorylength: 131072 epsilon: 0.26971215724773817
Training...
episode: 1457 no of steps: 144 score: 522.0 avg score: 3.625 memorylength: 131072 epsilon: 0.2694695255158722
Training...
episode: 1458 no of steps: 134 score: 141.0 avg score: 1.0522 memorylength: 131072 epsilon: 0.2692271120543285
Training...
episode: 1459 no of steps: 128 score: 710.0 avg score: 5.5469 memorylength: 131072 epsilon: 0.2689849166667522
Training...
episode: 1460 no of steps: 135 score: 514.0 avg score: 3.8074 memorylength: 131072 epsilon: 0.268742939156965
Training...
episode: 1461 no of steps: 151 score: 315.0 avg score: 2.0861 memorylength: 131072 epsilon: 0.26850117932896517
Training...
episode: 1462 no of steps: 162 score: 856.0 avg score: 5.284 memorylength: 131072 epsilon: 0.2682596369869271
Training...
episode: 1463 no of steps: 141 score: 491.0 avg score: 3.4823 memorylength: 131072 epsilon: 0.2680183119352016
Training...
episode: 1464 no of steps: 162 score: 596.0 avg score: 3.679 memorylength: 131072 epsilon: 0.2677772039783153
Training...
episode: 1465 no of steps: 174 score: 332.0 avg score: 1.908 memorylength: 131072 epsilon: 0.2675363129209708
Training...
episode: 1466 no of steps: 146 score: 668.0 avg score: 4.5753 memorylength: 131072 epsilon: 0.2672956385680463
Training...
episode: 1467 no of steps: 167 score: 438.0 avg score: 2.6228 memorylength: 131072 epsilon: 0.26705518072459544
Training...
episode: 1468 no of steps: 179 score: 613.0 avg score: 3.4246 memorylength: 131072 epsilon: 0.2668149391958476
Training...
episode: 1469 no of steps: 174 score: 521.0 avg score: 2.9943 memorylength: 131072 epsilon: 0.2665749137872069
Training...
episode: 1470 no of steps: 186 score: 279.0 avg score: 1.5 memorylength: 131072 epsilon: 0.2663351043042529
Training...
episode: 1471 no of steps: 183 score: 935.0 avg score: 5.1093 memorylength: 131072 epsilon: 0.26609551055273983
Training...
episode: 1472 no of steps: 170 score: 435.0 avg score: 2.5588 memorylength: 131072 epsilon: 0.26585613233859673
Training...
episode: 1473 no of steps: 154 score: 585.0 avg score: 3.7987 memorylength: 131072 epsilon: 0.26561696946792734
Training...
episode: 1474 no of steps: 148 score: 513.0 avg score: 3.4662 memorylength: 131072 epsilon: 0.26537802174700953
Training...
episode: 1475 no of steps: 140 score: 715.0 avg score: 5.1071 memorylength: 131072 epsilon: 0.26513928898229583
Training...
episode: 1476 no of steps: 139 score: 658.0 avg score: 4.7338 memorylength: 131072 epsilon: 0.26490077098041254
Training...
episode: 1477 no of steps: 146 score: 612.0 avg score: 4.1918 memorylength: 131072 epsilon: 0.26466246754816014
Training...
episode: 1478 no of steps: 139 score: 684.0 avg score: 4.9209 memorylength: 131072 epsilon: 0.2644243784925129
Training...
episode: 1479 no of steps: 144 score: 1010.0 avg score: 7.0139 memorylength: 131072 epsilon: 0.2641865036206186
Training...
episode: 1480 no of steps: 148 score: 936.0 avg score: 6.3243 memorylength: 131072 epsilon: 0.26394884273979846
Training...
episode: 1481 no of steps: 150 score: 555.0 avg score: 3.7 memorylength: 131072 epsilon: 0.2637113956575473
Training...
episode: 1482 no of steps: 147 score: 619.0 avg score: 4.2109 memorylength: 131072 epsilon: 0.263474162181533
Training...
episode: 1483 no of steps: 154 score: 702.0 avg score: 4.5584 memorylength: 131072 epsilon: 0.2632371421195963
Training...
episode: 1484 no of steps: 159 score: 583.0 avg score: 3.6667 memorylength: 131072 epsilon: 0.26300033527975114
Training...
episode: 1485 no of steps: 165 score: 183.0 avg score: 1.1091 memorylength: 131072 epsilon: 0.2627637414701837
Training...
episode: 1486 no of steps: 143 score: 366.0 avg score: 2.5594 memorylength: 131072 epsilon: 0.2625273604992532
Training...
episode: 1487 no of steps: 143 score: 327.0 avg score: 2.2867 memorylength: 131072 epsilon: 0.26229119217549085
Training...
episode: 1488 no of steps: 152 score: 450.0 avg score: 2.9605 memorylength: 131072 epsilon: 0.2620552363076006
Training...
episode: 1489 no of steps: 122 score: 139.0 avg score: 1.1393 memorylength: 131072 epsilon: 0.26181949270445776
Training...
episode: 1490 no of steps: 136 score: 495.0 avg score: 3.6397 memorylength: 131072 epsilon: 0.2615839611751104
Training...
episode: 1491 no of steps: 145 score: 576.0 avg score: 3.9724 memorylength: 131072 epsilon: 0.2613486415287777
Training...
episode: 1492 no of steps: 147 score: 1044.0 avg score: 7.102 memorylength: 131072 epsilon: 0.26111353357485084
Training...
episode: 1493 no of steps: 147 score: 671.0 avg score: 4.5646 memorylength: 131072 epsilon: 0.2608786371228924
Training...
episode: 1494 no of steps: 162 score: 666.0 avg score: 4.1111 memorylength: 131072 epsilon: 0.2606439519826361
Training...
episode: 1495 no of steps: 145 score: 297.0 avg score: 2.0483 memorylength: 131072 epsilon: 0.26040947796398717
Training...
episode: 1496 no of steps: 159 score: 699.0 avg score: 4.3962 memorylength: 131072 epsilon: 0.26017521487702144
Training...
episode: 1497 no of steps: 168 score: 711.0 avg score: 4.2321 memorylength: 131072 epsilon: 0.25994116253198596
Training...
episode: 1498 no of steps: 160 score: 517.0 avg score: 3.2312 memorylength: 131072 epsilon: 0.25970732073929814
Training...
episode: 1499 no of steps: 154 score: 328.0 avg score: 2.1299 memorylength: 131072 epsilon: 0.25947368930954634
Training...
episode: 1500 no of steps: 157 score: 862.0 avg score: 5.4904 memorylength: 131072 epsilon: 0.25924026805348893
saving states...
Training...
episode: 1501 no of steps: 143 score: 567.0 avg score: 3.965 memorylength: 131072 epsilon: 0.25900705678205466
Training...
episode: 1502 no of steps: 147 score: 494.0 avg score: 3.3605 memorylength: 131072 epsilon: 0.2587740553063425
Training...
episode: 1503 no of steps: 149 score: 708.0 avg score: 4.7517 memorylength: 131072 epsilon: 0.2585412634376212
Training...
episode: 1504 no of steps: 160 score: 535.0 avg score: 3.3438 memorylength: 131072 epsilon: 0.25830868098732923
Training...
episode: 1505 no of steps: 150 score: 945.0 avg score: 6.3 memorylength: 131072 epsilon: 0.25807630776707496
Training...
episode: 1506 no of steps: 140 score: 713.0 avg score: 5.0929 memorylength: 131072 epsilon: 0.257844143588636
Training...
episode: 1507 no of steps: 143 score: 636.0 avg score: 4.4476 memorylength: 131072 epsilon: 0.25761218826395926
Training...
episode: 1508 no of steps: 166 score: 657.0 avg score: 3.9578 memorylength: 131072 epsilon: 0.2573804416051611
Training...
episode: 1509 no of steps: 136 score: 486.0 avg score: 3.5735 memorylength: 131072 epsilon: 0.25714890342452656
Training...
episode: 1510 no of steps: 159 score: 859.0 avg score: 5.4025 memorylength: 131072 epsilon: 0.2569175735345098
Training...
episode: 1511 no of steps: 157 score: 909.0 avg score: 5.7898 memorylength: 131072 epsilon: 0.25668645174773347
Training...
episode: 1512 no of steps: 158 score: 355.0 avg score: 2.2468 memorylength: 131072 epsilon: 0.25645553787698905
Training...
episode: 1513 no of steps: 155 score: 238.0 avg score: 1.5355 memorylength: 131072 epsilon: 0.2562248317352362
Training...
episode: 1514 no of steps: 158 score: 746.0 avg score: 4.7215 memorylength: 131072 epsilon: 0.25599433313560294
Training...
episode: 1515 no of steps: 155 score: 353.0 avg score: 2.2774 memorylength: 131072 epsilon: 0.25576404189138546
Training...
episode: 1516 no of steps: 145 score: 576.0 avg score: 3.9724 memorylength: 131072 epsilon: 0.25553395781604776
Training...
episode: 1517 no of steps: 137 score: 420.0 avg score: 3.0657 memorylength: 131072 epsilon: 0.25530408072322186
Training...
episode: 1518 no of steps: 148 score: 279.0 avg score: 1.8851 memorylength: 131072 epsilon: 0.2550744104267071
Training...
episode: 1519 no of steps: 144 score: 729.0 avg score: 5.0625 memorylength: 131072 epsilon: 0.2548449467404707
Training...
episode: 1520 no of steps: 138 score: 601.0 avg score: 4.3551 memorylength: 131072 epsilon: 0.25461568947864693
Training...
episode: 1521 no of steps: 144 score: 519.0 avg score: 3.6042 memorylength: 131072 epsilon: 0.25438663845553744
Training...
episode: 1522 no of steps: 143 score: 764.0 avg score: 5.3427 memorylength: 131072 epsilon: 0.254157793485611
Training...
episode: 1523 no of steps: 147 score: 463.0 avg score: 3.1497 memorylength: 131072 epsilon: 0.253929154383503
Training...
episode: 1524 no of steps: 168 score: 709.0 avg score: 4.2202 memorylength: 131072 epsilon: 0.2537007209640159
Training...
episode: 1525 no of steps: 149 score: 236.0 avg score: 1.5839 memorylength: 131072 epsilon: 0.2534724930421185
Training...
episode: 1526 no of steps: 155 score: 484.0 avg score: 3.1226 memorylength: 131072 epsilon: 0.2532444704329463
Training...
episode: 1527 no of steps: 154 score: 217.0 avg score: 1.4091 memorylength: 131072 epsilon: 0.25301665295180087
Training...
episode: 1528 no of steps: 166 score: -274.0 avg score: -1.6506 memorylength: 131072 epsilon: 0.25278904041415
Training...
episode: 1529 no of steps: 160 score: 178.0 avg score: 1.1125 memorylength: 131072 epsilon: 0.25256163263562764
Training...
episode: 1530 no of steps: 153 score: 435.0 avg score: 2.8431 memorylength: 131072 epsilon: 0.2523344294320334
Training...
episode: 1531 no of steps: 171 score: 774.0 avg score: 4.5263 memorylength: 131072 epsilon: 0.2521074306193327
Training...
episode: 1532 no of steps: 173 score: 957.0 avg score: 5.5318 memorylength: 131072 epsilon: 0.2518806360136565
Training...
episode: 1533 no of steps: 182 score: 964.0 avg score: 5.2967 memorylength: 131072 epsilon: 0.25165404543130115
Training...
episode: 1534 no of steps: 179 score: 1203.0 avg score: 6.7207 memorylength: 131072 epsilon: 0.2514276586887282
Training...
episode: 1535 no of steps: 169 score: 579.0 avg score: 3.426 memorylength: 131072 epsilon: 0.2512014756025645
Training...
episode: 1536 no of steps: 168 score: 818.0 avg score: 4.869 memorylength: 131072 epsilon: 0.2509754959896016
Training...
episode: 1537 no of steps: 153 score: 287.0 avg score: 1.8758 memorylength: 131072 epsilon: 0.25074971966679616
Training...
episode: 1538 no of steps: 162 score: 699.0 avg score: 4.3148 memorylength: 131072 epsilon: 0.25052414645126925
Training...
episode: 1539 no of steps: 153 score: 409.0 avg score: 2.6732 memorylength: 131072 epsilon: 0.2502987761603065
Training...
episode: 1540 no of steps: 143 score: 634.0 avg score: 4.4336 memorylength: 131072 epsilon: 0.25007360861135813
Training...
episode: 1541 no of steps: 161 score: 377.0 avg score: 2.3416 memorylength: 131072 epsilon: 0.24984864362203818
Training...
episode: 1542 no of steps: 170 score: 300.0 avg score: 1.7647 memorylength: 131072 epsilon: 0.2496238810101252
Training...
episode: 1543 no of steps: 142 score: 452.0 avg score: 3.1831 memorylength: 131072 epsilon: 0.24939932059356132
Training...
episode: 1544 no of steps: 128 score: 711.0 avg score: 5.5547 memorylength: 131072 epsilon: 0.24917496219045274
Training...
episode: 1545 no of steps: 131 score: 800.0 avg score: 6.1069 memorylength: 131072 epsilon: 0.248950805619069
Training...
episode: 1546 no of steps: 145 score: 801.0 avg score: 5.5241 memorylength: 131072 epsilon: 0.24872685069784337
Training...
episode: 1547 no of steps: 138 score: 511.0 avg score: 3.7029 memorylength: 131072 epsilon: 0.2485030972453723
Training...
episode: 1548 no of steps: 148 score: 756.0 avg score: 5.1081 memorylength: 131072 epsilon: 0.24827954508041544
Training...
episode: 1549 no of steps: 154 score: 701.0 avg score: 4.5519 memorylength: 131072 epsilon: 0.24805619402189563
Training...
episode: 1550 no of steps: 161 score: 855.0 avg score: 5.3106 memorylength: 131072 epsilon: 0.24783304388889837
saving states...
Training...
episode: 1551 no of steps: 148 score: 631.0 avg score: 4.2635 memorylength: 131072 epsilon: 0.24761009450067217
Training...
episode: 1552 no of steps: 181 score: 395.0 avg score: 2.1823 memorylength: 131072 epsilon: 0.2473873456766279
Training...
episode: 1553 no of steps: 146 score: 507.0 avg score: 3.4726 memorylength: 131072 epsilon: 0.2471647972363391
Training...
episode: 1554 no of steps: 144 score: 944.0 avg score: 6.5556 memorylength: 131072 epsilon: 0.24694244899954146
Training...
episode: 1555 no of steps: 136 score: 602.0 avg score: 4.4265 memorylength: 131072 epsilon: 0.2467203007861329
Training...
episode: 1556 no of steps: 148 score: 632.0 avg score: 4.2703 memorylength: 131072 epsilon: 0.2464983524161734
Training...
episode: 1557 no of steps: 157 score: 904.0 avg score: 5.758 memorylength: 131072 epsilon: 0.2462766037098847
Training...
episode: 1558 no of steps: 155 score: 751.0 avg score: 4.8452 memorylength: 131072 epsilon: 0.2460550544876504
Training...
episode: 1559 no of steps: 149 score: 531.0 avg score: 3.5638 memorylength: 131072 epsilon: 0.24583370457001555
Training...
episode: 1560 no of steps: 161 score: 651.0 avg score: 4.0435 memorylength: 131072 epsilon: 0.2456125537776868
Training...
episode: 1561 no of steps: 191 score: 594.0 avg score: 3.1099 memorylength: 131072 epsilon: 0.24539160193153184
Training...
episode: 1562 no of steps: 167 score: 535.0 avg score: 3.2036 memorylength: 131072 epsilon: 0.24517084885257986
Training...
episode: 1563 no of steps: 146 score: 658.0 avg score: 4.5068 memorylength: 131072 epsilon: 0.24495029436202068
Training...
episode: 1564 no of steps: 140 score: 166.0 avg score: 1.1857 memorylength: 131072 epsilon: 0.2447299382812053
Training...
episode: 1565 no of steps: 144 score: 376.0 avg score: 2.6111 memorylength: 131072 epsilon: 0.2445097804316452
Training...
episode: 1566 no of steps: 140 score: 448.0 avg score: 3.2 memorylength: 131072 epsilon: 0.24428982063501245
Training...
episode: 1567 no of steps: 130 score: 378.0 avg score: 2.9077 memorylength: 131072 epsilon: 0.24407005871313972
Training...
episode: 1568 no of steps: 120 score: 678.0 avg score: 5.65 memorylength: 131072 epsilon: 0.24385049448801976
Training...
episode: 1569 no of steps: 136 score: 598.0 avg score: 4.3971 memorylength: 131072 epsilon: 0.24363112778180562
Training...
episode: 1570 no of steps: 140 score: 174.0 avg score: 1.2429 memorylength: 131072 epsilon: 0.24341195841681015
Training...
episode: 1571 no of steps: 171 score: 539.0 avg score: 3.152 memorylength: 131072 epsilon: 0.24319298621550625
Training...
episode: 1572 no of steps: 146 score: 640.0 avg score: 4.3836 memorylength: 131072 epsilon: 0.24297421100052632
Training...
episode: 1573 no of steps: 166 score: 620.0 avg score: 3.7349 memorylength: 131072 epsilon: 0.24275563259466257
Training...
episode: 1574 no of steps: 157 score: 843.0 avg score: 5.3694 memorylength: 131072 epsilon: 0.24253725082086636
Training...
episode: 1575 no of steps: 168 score: 557.0 avg score: 3.3155 memorylength: 131072 epsilon: 0.24231906550224844
Training...
episode: 1576 no of steps: 186 score: 580.0 avg score: 3.1183 memorylength: 131072 epsilon: 0.2421010764620788
Training...
episode: 1577 no of steps: 166 score: 342.0 avg score: 2.0602 memorylength: 131072 epsilon: 0.24188328352378613
Training...
episode: 1578 no of steps: 180 score: 611.0 avg score: 3.3944 memorylength: 131072 epsilon: 0.24166568651095832
Training...
episode: 1579 no of steps: 159 score: 274.0 avg score: 1.7233 memorylength: 131072 epsilon: 0.24144828524734166
Training...
episode: 1580 no of steps: 144 score: 774.0 avg score: 5.375 memorylength: 131072 epsilon: 0.24123107955684117
Training...
episode: 1581 no of steps: 139 score: 858.0 avg score: 6.1727 memorylength: 131072 epsilon: 0.24101406926352015
Training...
episode: 1582 no of steps: 144 score: 769.0 avg score: 5.3403 memorylength: 131072 epsilon: 0.2407972541916004
Training...
episode: 1583 no of steps: 158 score: 517.0 avg score: 3.2722 memorylength: 131072 epsilon: 0.2405806341654616
Training...
episode: 1584 no of steps: 138 score: 351.0 avg score: 2.5435 memorylength: 131072 epsilon: 0.24036420900964148
Training...
episode: 1585 no of steps: 141 score: 234.0 avg score: 1.6596 memorylength: 131072 epsilon: 0.24014797854883577
Training...
episode: 1586 no of steps: 144 score: 390.0 avg score: 2.7083 memorylength: 131072 epsilon: 0.2399319426078976
Training...
episode: 1587 no of steps: 149 score: 774.0 avg score: 5.1946 memorylength: 131072 epsilon: 0.23971610101183807
Training...
episode: 1588 no of steps: 159 score: 750.0 avg score: 4.717 memorylength: 131072 epsilon: 0.23950045358582528
Training...
episode: 1589 no of steps: 158 score: 661.0 avg score: 4.1835 memorylength: 131072 epsilon: 0.23928500015518495
Training...
episode: 1590 no of steps: 175 score: 678.0 avg score: 3.8743 memorylength: 131072 epsilon: 0.2390697405453997
Training...
episode: 1591 no of steps: 174 score: 817.0 avg score: 4.6954 memorylength: 131072 epsilon: 0.23885467458210927
Training...
episode: 1592 no of steps: 171 score: 551.0 avg score: 3.2222 memorylength: 131072 epsilon: 0.23863980209111024
Training...
episode: 1593 no of steps: 173 score: 776.0 avg score: 4.4855 memorylength: 131072 epsilon: 0.23842512289835582
Training...
episode: 1594 no of steps: 164 score: 670.0 avg score: 4.0854 memorylength: 131072 epsilon: 0.23821063682995589
Training...
episode: 1595 no of steps: 164 score: 752.0 avg score: 4.5854 memorylength: 131072 epsilon: 0.2379963437121767
Training...
episode: 1596 no of steps: 156 score: 531.0 avg score: 3.4038 memorylength: 131072 epsilon: 0.23778224337144088
Training...
episode: 1597 no of steps: 156 score: 704.0 avg score: 4.5128 memorylength: 131072 epsilon: 0.23756833563432703
Training...
episode: 1598 no of steps: 161 score: 751.0 avg score: 4.6646 memorylength: 131072 epsilon: 0.23735462032756996
Training...
episode: 1599 no of steps: 158 score: 864.0 avg score: 5.4684 memorylength: 131072 epsilon: 0.2371410972780602
Training...
episode: 1600 no of steps: 129 score: 557.0 avg score: 4.3178 memorylength: 131072 epsilon: 0.23692776631284415
saving states...
Training...
episode: 1601 no of steps: 167 score: 596.0 avg score: 3.5689 memorylength: 131072 epsilon: 0.23671462725912365
Training...
episode: 1602 no of steps: 153 score: 244.0 avg score: 1.5948 memorylength: 131072 epsilon: 0.23650167994425608
Training...
episode: 1603 no of steps: 160 score: 336.0 avg score: 2.1 memorylength: 131072 epsilon: 0.2362889241957541
Training...
episode: 1604 no of steps: 156 score: 894.0 avg score: 5.7308 memorylength: 131072 epsilon: 0.23607635984128553
Training...
episode: 1605 no of steps: 159 score: 639.0 avg score: 4.0189 memorylength: 131072 epsilon: 0.23586398670867323
Training...
episode: 1606 no of steps: 152 score: 379.0 avg score: 2.4934 memorylength: 131072 epsilon: 0.23565180462589494
Training...
episode: 1607 no of steps: 146 score: 1101.0 avg score: 7.5411 memorylength: 131072 epsilon: 0.23543981342108325
Training...
episode: 1608 no of steps: 162 score: 715.0 avg score: 4.4136 memorylength: 131072 epsilon: 0.23522801292252513
Training...
episode: 1609 no of steps: 153 score: 354.0 avg score: 2.3137 memorylength: 131072 epsilon: 0.2350164029586623
Training...
episode: 1610 no of steps: 144 score: 801.0 avg score: 5.5625 memorylength: 131072 epsilon: 0.23480498335809052
Training...
episode: 1611 no of steps: 137 score: 231.0 avg score: 1.6861 memorylength: 131072 epsilon: 0.2345937539495601
Training...
episode: 1612 no of steps: 142 score: 535.0 avg score: 3.7676 memorylength: 131072 epsilon: 0.2343827145619751
Training...
episode: 1613 no of steps: 135 score: 630.0 avg score: 4.6667 memorylength: 131072 epsilon: 0.23417186502439352
Training...
episode: 1614 no of steps: 159 score: 216.0 avg score: 1.3585 memorylength: 131072 epsilon: 0.23396120516602742
Training...
episode: 1615 no of steps: 144 score: 348.0 avg score: 2.4167 memorylength: 131072 epsilon: 0.23375073481624212
Training...
episode: 1616 no of steps: 175 score: 389.0 avg score: 2.2229 memorylength: 131072 epsilon: 0.23354045380455674
Training...
episode: 1617 no of steps: 157 score: 193.0 avg score: 1.2293 memorylength: 131072 epsilon: 0.23333036196064358
Training...
episode: 1618 no of steps: 160 score: 530.0 avg score: 3.3125 memorylength: 131072 epsilon: 0.2331204591143283
Training...
episode: 1619 no of steps: 166 score: 463.0 avg score: 2.7892 memorylength: 131072 epsilon: 0.2329107450955895
Training...
episode: 1620 no of steps: 142 score: 665.0 avg score: 4.6831 memorylength: 131072 epsilon: 0.23270121973455893
Training...
episode: 1621 no of steps: 151 score: 471.0 avg score: 3.1192 memorylength: 131072 epsilon: 0.23249188286152095
Training...
episode: 1622 no of steps: 148 score: 476.0 avg score: 3.2162 memorylength: 131072 epsilon: 0.23228273430691262
Training...
episode: 1623 no of steps: 147 score: 558.0 avg score: 3.7959 memorylength: 131072 epsilon: 0.23207377390132378
Training...
episode: 1624 no of steps: 153 score: 643.0 avg score: 4.2026 memorylength: 131072 epsilon: 0.23186500147549635
Training...
episode: 1625 no of steps: 140 score: 597.0 avg score: 4.2643 memorylength: 131072 epsilon: 0.2316564168603247
Training...
episode: 1626 no of steps: 143 score: 325.0 avg score: 2.2727 memorylength: 131072 epsilon: 0.23144801988685523
Training...
episode: 1627 no of steps: 144 score: 544.0 avg score: 3.7778 memorylength: 131072 epsilon: 0.23123981038628647
Training...
episode: 1628 no of steps: 130 score: 296.0 avg score: 2.2769 memorylength: 131072 epsilon: 0.23103178818996864
Training...
episode: 1629 no of steps: 160 score: 378.0 avg score: 2.3625 memorylength: 131072 epsilon: 0.23082395312940382
Training...
episode: 1630 no of steps: 148 score: 561.0 avg score: 3.7905 memorylength: 131072 epsilon: 0.23061630503624556
Training...
episode: 1631 no of steps: 159 score: 173.0 avg score: 1.0881 memorylength: 131072 epsilon: 0.2304088437422988
Training...
episode: 1632 no of steps: 165 score: 745.0 avg score: 4.5152 memorylength: 131072 epsilon: 0.23020156907952005
Training...
episode: 1633 no of steps: 151 score: 922.0 avg score: 6.106 memorylength: 131072 epsilon: 0.2299944808800167
Training...
episode: 1634 no of steps: 159 score: 604.0 avg score: 3.7987 memorylength: 131072 epsilon: 0.22978757897604735
Training...
episode: 1635 no of steps: 170 score: 792.0 avg score: 4.6588 memorylength: 131072 epsilon: 0.2295808632000214
Training...
episode: 1636 no of steps: 172 score: 1066.0 avg score: 6.1977 memorylength: 131072 epsilon: 0.22937433338449914
Training...
episode: 1637 no of steps: 149 score: 888.0 avg score: 5.9597 memorylength: 131072 epsilon: 0.22916798936219135
Training...
episode: 1638 no of steps: 179 score: 998.0 avg score: 5.5754 memorylength: 131072 epsilon: 0.2289618309659594
Training...
episode: 1639 no of steps: 189 score: 1053.0 avg score: 5.5714 memorylength: 131072 epsilon: 0.22875585802881496
Training...
episode: 1640 no of steps: 188 score: 463.0 avg score: 2.4628 memorylength: 131072 epsilon: 0.22855007038391983
Training...
episode: 1641 no of steps: 169 score: 805.0 avg score: 4.7633 memorylength: 131072 epsilon: 0.22834446786458623
Training...
episode: 1642 no of steps: 142 score: 566.0 avg score: 3.9859 memorylength: 131072 epsilon: 0.22813905030427586
Training...
episode: 1643 no of steps: 144 score: 663.0 avg score: 4.6042 memorylength: 131072 epsilon: 0.22793381753660072
Training...
episode: 1644 no of steps: 142 score: 691.0 avg score: 4.8662 memorylength: 131072 epsilon: 0.22772876939532208
Training...
episode: 1645 no of steps: 157 score: 755.0 avg score: 4.8089 memorylength: 131072 epsilon: 0.22752390571435105
Training...
episode: 1646 no of steps: 149 score: 524.0 avg score: 3.5168 memorylength: 131072 epsilon: 0.22731922632774793
Training...
episode: 1647 no of steps: 166 score: 977.0 avg score: 5.8855 memorylength: 131072 epsilon: 0.22711473106972252
Training...
episode: 1648 no of steps: 152 score: 839.0 avg score: 5.5197 memorylength: 131072 epsilon: 0.2269104197746336
Training...
episode: 1649 no of steps: 148 score: 603.0 avg score: 4.0743 memorylength: 131072 epsilon: 0.22670629227698896
Training...
episode: 1650 no of steps: 156 score: 556.0 avg score: 3.5641 memorylength: 131072 epsilon: 0.22650234841144537
saving states...
Training...
episode: 1651 no of steps: 126 score: 362.0 avg score: 2.873 memorylength: 131072 epsilon: 0.22629858801280825
Training...
episode: 1652 no of steps: 162 score: 580.0 avg score: 3.5802 memorylength: 131072 epsilon: 0.22609501091603176
Training...
episode: 1653 no of steps: 166 score: 956.0 avg score: 5.759 memorylength: 131072 epsilon: 0.22589161695621832
Training...
episode: 1654 no of steps: 147 score: 698.0 avg score: 4.7483 memorylength: 131072 epsilon: 0.22568840596861892
Training...
episode: 1655 no of steps: 172 score: 817.0 avg score: 4.75 memorylength: 131072 epsilon: 0.2254853777886325
Training...
episode: 1656 no of steps: 161 score: 809.0 avg score: 5.0248 memorylength: 131072 epsilon: 0.22528253225180642
Training...
episode: 1657 no of steps: 165 score: 685.0 avg score: 4.1515 memorylength: 131072 epsilon: 0.2250798691938356
Training...
episode: 1658 no of steps: 169 score: 665.0 avg score: 3.9349 memorylength: 131072 epsilon: 0.2248773884505631
Training...
episode: 1659 no of steps: 155 score: 963.0 avg score: 6.2129 memorylength: 131072 epsilon: 0.2246750898579794
Training...
episode: 1660 no of steps: 155 score: 540.0 avg score: 3.4839 memorylength: 131072 epsilon: 0.22447297325222265
Training...
episode: 1661 no of steps: 144 score: 628.0 avg score: 4.3611 memorylength: 131072 epsilon: 0.2242710384695785
Training...
episode: 1662 no of steps: 129 score: 256.0 avg score: 1.9845 memorylength: 131072 epsilon: 0.22406928534647955
Training...
episode: 1663 no of steps: 142 score: 284.0 avg score: 2.0 memorylength: 131072 epsilon: 0.22386771371950598
Training...
episode: 1664 no of steps: 155 score: 530.0 avg score: 3.4194 memorylength: 131072 epsilon: 0.22366632342538462
Training...
episode: 1665 no of steps: 156 score: 850.0 avg score: 5.4487 memorylength: 131072 epsilon: 0.22346511430098936
Training...
episode: 1666 no of steps: 149 score: 930.0 avg score: 6.2416 memorylength: 131072 epsilon: 0.2232640861833408
Training...
episode: 1667 no of steps: 173 score: 1145.0 avg score: 6.6185 memorylength: 131072 epsilon: 0.2230632389096062
Training...
episode: 1668 no of steps: 151 score: 1308.0 avg score: 8.6623 memorylength: 131072 epsilon: 0.2228625723170992
Training...
episode: 1669 no of steps: 160 score: 1109.0 avg score: 6.9312 memorylength: 131072 epsilon: 0.22266208624327977
Training...
episode: 1670 no of steps: 163 score: 1124.0 avg score: 6.8957 memorylength: 131072 epsilon: 0.22246178052575438
Training...
episode: 1671 no of steps: 152 score: 621.0 avg score: 4.0855 memorylength: 131072 epsilon: 0.2222616550022752
Training...
episode: 1672 no of steps: 160 score: 760.0 avg score: 4.75 memorylength: 131072 epsilon: 0.2220617095107407
Training...
episode: 1673 no of steps: 161 score: 693.0 avg score: 4.3043 memorylength: 131072 epsilon: 0.2218619438891949
Training...
episode: 1674 no of steps: 158 score: 567.0 avg score: 3.5886 memorylength: 131072 epsilon: 0.22166235797582767
Training...
episode: 1675 no of steps: 147 score: 679.0 avg score: 4.619 memorylength: 131072 epsilon: 0.22146295160897442
Training...
episode: 1676 no of steps: 151 score: 171.0 avg score: 1.1325 memorylength: 131072 epsilon: 0.22126372462711602
Training...
episode: 1677 no of steps: 145 score: 247.0 avg score: 1.7034 memorylength: 131072 epsilon: 0.2210646768688786
Training...
episode: 1678 no of steps: 143 score: 342.0 avg score: 2.3916 memorylength: 131072 epsilon: 0.22086580817303333
Training...
episode: 1679 no of steps: 136 score: 321.0 avg score: 2.3603 memorylength: 131072 epsilon: 0.22066711837849673
Training...
episode: 1680 no of steps: 150 score: 760.0 avg score: 5.0667 memorylength: 131072 epsilon: 0.2204686073243299
Training...
episode: 1681 no of steps: 141 score: 764.0 avg score: 5.4184 memorylength: 131072 epsilon: 0.22027027484973905
Training...
episode: 1682 no of steps: 147 score: 909.0 avg score: 6.1837 memorylength: 131072 epsilon: 0.2200721207940747
Training...
episode: 1683 no of steps: 143 score: 862.0 avg score: 6.028 memorylength: 131072 epsilon: 0.2198741449968322
Training...
episode: 1684 no of steps: 145 score: 804.0 avg score: 5.5448 memorylength: 131072 epsilon: 0.21967634729765098
Training...
episode: 1685 no of steps: 170 score: 729.0 avg score: 4.2882 memorylength: 131072 epsilon: 0.21947872753631506
Training...
episode: 1686 no of steps: 157 score: 1062.0 avg score: 6.7643 memorylength: 131072 epsilon: 0.21928128555275234
Training...
episode: 1687 no of steps: 180 score: 598.0 avg score: 3.3222 memorylength: 131072 epsilon: 0.21908402118703474
Training...
episode: 1688 no of steps: 185 score: 738.0 avg score: 3.9892 memorylength: 131072 epsilon: 0.21888693427937825
Training...
episode: 1689 no of steps: 153 score: 979.0 avg score: 6.3987 memorylength: 131072 epsilon: 0.21869002467014234
Training...
episode: 1690 no of steps: 176 score: 940.0 avg score: 5.3409 memorylength: 131072 epsilon: 0.21849329219983032
Training...
episode: 1691 no of steps: 152 score: 722.0 avg score: 4.75 memorylength: 131072 epsilon: 0.21829673670908875
Training...
episode: 1692 no of steps: 138 score: 567.0 avg score: 4.1087 memorylength: 131072 epsilon: 0.21810035803870784
Training...
episode: 1693 no of steps: 130 score: 679.0 avg score: 5.2231 memorylength: 131072 epsilon: 0.21790415602962068
Training...
episode: 1694 no of steps: 153 score: 420.0 avg score: 2.7451 memorylength: 131072 epsilon: 0.2177081305229038
Training...
episode: 1695 no of steps: 143 score: 745.0 avg score: 5.2098 memorylength: 131072 epsilon: 0.21751228135977643
Training...
episode: 1696 no of steps: 142 score: 854.0 avg score: 6.0141 memorylength: 131072 epsilon: 0.21731660838160072
Training...
episode: 1697 no of steps: 134 score: 687.0 avg score: 5.1269 memorylength: 131072 epsilon: 0.21712111142988164
Training...
episode: 1698 no of steps: 148 score: 972.0 avg score: 6.5676 memorylength: 131072 epsilon: 0.2169257903462665
Training...
episode: 1699 no of steps: 153 score: 647.0 avg score: 4.2288 memorylength: 131072 epsilon: 0.21673064497254535
Training...
episode: 1700 no of steps: 161 score: 900.0 avg score: 5.5901 memorylength: 131072 epsilon: 0.2165356751506504
saving states...
Training...
episode: 1701 no of steps: 142 score: 631.0 avg score: 4.4437 memorylength: 131072 epsilon: 0.21634088072265603
Training...
episode: 1702 no of steps: 136 score: 1019.0 avg score: 7.4926 memorylength: 131072 epsilon: 0.21614626153077876
Training...
episode: 1703 no of steps: 165 score: 876.0 avg score: 5.3091 memorylength: 131072 epsilon: 0.21595181741737707
Training...
episode: 1704 no of steps: 153 score: 657.0 avg score: 4.2941 memorylength: 131072 epsilon: 0.21575754822495122
Training...
episode: 1705 no of steps: 150 score: 613.0 avg score: 4.0867 memorylength: 131072 epsilon: 0.21556345379614306
Training...
episode: 1706 no of steps: 153 score: 323.0 avg score: 2.1111 memorylength: 131072 epsilon: 0.21536953397373623
Training...
episode: 1707 no of steps: 153 score: 705.0 avg score: 4.6078 memorylength: 131072 epsilon: 0.21517578860065553
Training...
episode: 1708 no of steps: 125 score: 586.0 avg score: 4.688 memorylength: 131072 epsilon: 0.21498221751996735
Training...
episode: 1709 no of steps: 154 score: 530.0 avg score: 3.4416 memorylength: 131072 epsilon: 0.2147888205748789
Training...
episode: 1710 no of steps: 158 score: 816.0 avg score: 5.1646 memorylength: 131072 epsilon: 0.21459559760873886
Training...
episode: 1711 no of steps: 150 score: 474.0 avg score: 3.16 memorylength: 131072 epsilon: 0.21440254846503645
Training...
episode: 1712 no of steps: 167 score: 570.0 avg score: 3.4132 memorylength: 131072 epsilon: 0.21420967298740198
Training...
episode: 1713 no of steps: 157 score: 709.0 avg score: 4.5159 memorylength: 131072 epsilon: 0.2140169710196062
Training...
episode: 1714 no of steps: 148 score: 451.0 avg score: 3.0473 memorylength: 131072 epsilon: 0.21382444240556056
Training...
episode: 1715 no of steps: 167 score: 871.0 avg score: 5.2156 memorylength: 131072 epsilon: 0.21363208698931685
Training...
episode: 1716 no of steps: 155 score: 1224.0 avg score: 7.8968 memorylength: 131072 epsilon: 0.21343990461506718
Training...
episode: 1717 no of steps: 140 score: 1062.0 avg score: 7.5857 memorylength: 131072 epsilon: 0.21324789512714384
Training...
episode: 1718 no of steps: 163 score: 1153.0 avg score: 7.0736 memorylength: 131072 epsilon: 0.2130560583700191
Training...
episode: 1719 no of steps: 143 score: 732.0 avg score: 5.1189 memorylength: 131072 epsilon: 0.2128643941883052
Training...
episode: 1720 no of steps: 173 score: 1369.0 avg score: 7.9133 memorylength: 131072 epsilon: 0.21267290242675407
Training...
episode: 1721 no of steps: 165 score: 580.0 avg score: 3.5152 memorylength: 131072 epsilon: 0.2124815829302575
Training...
episode: 1722 no of steps: 145 score: 395.0 avg score: 2.7241 memorylength: 131072 epsilon: 0.21229043554384658
Training...
episode: 1723 no of steps: 149 score: 768.0 avg score: 5.1544 memorylength: 131072 epsilon: 0.21209946011269198
Training...
episode: 1724 no of steps: 149 score: 468.0 avg score: 3.1409 memorylength: 131072 epsilon: 0.21190865648210364
Training...
episode: 1725 no of steps: 149 score: 568.0 avg score: 3.8121 memorylength: 131072 epsilon: 0.2117180244975304
Training...
episode: 1726 no of steps: 153 score: 684.0 avg score: 4.4706 memorylength: 131072 epsilon: 0.21152756400456058
Training...
episode: 1727 no of steps: 160 score: 666.0 avg score: 4.1625 memorylength: 131072 epsilon: 0.211337274848921
Training...
episode: 1728 no of steps: 170 score: 999.0 avg score: 5.8765 memorylength: 131072 epsilon: 0.21114715687647756
Training...
episode: 1729 no of steps: 158 score: 825.0 avg score: 5.2215 memorylength: 131072 epsilon: 0.21095720993323455
Training...
episode: 1730 no of steps: 164 score: 720.0 avg score: 4.3902 memorylength: 131072 epsilon: 0.21076743386533514
Training...
episode: 1731 no of steps: 161 score: 1126.0 avg score: 6.9938 memorylength: 131072 epsilon: 0.21057782851906048
Training...
episode: 1732 no of steps: 155 score: 853.0 avg score: 5.5032 memorylength: 131072 epsilon: 0.2103883937408304
Training...
episode: 1733 no of steps: 164 score: 864.0 avg score: 5.2683 memorylength: 131072 epsilon: 0.21019912937720267
Training...
episode: 1734 no of steps: 152 score: 997.0 avg score: 6.5592 memorylength: 131072 epsilon: 0.21001003527487305
Training...
episode: 1735 no of steps: 154 score: 638.0 avg score: 4.1429 memorylength: 131072 epsilon: 0.20982111128067543
Training...
episode: 1736 no of steps: 147 score: 859.0 avg score: 5.8435 memorylength: 131072 epsilon: 0.2096323572415813
Training...
episode: 1737 no of steps: 150 score: 1048.0 avg score: 6.9867 memorylength: 131072 epsilon: 0.20944377300469993
Training...
episode: 1738 no of steps: 164 score: 841.0 avg score: 5.128 memorylength: 131072 epsilon: 0.209255358417278
Training...
episode: 1739 no of steps: 155 score: 880.0 avg score: 5.6774 memorylength: 131072 epsilon: 0.20906711332669978
Training...
episode: 1740 no of steps: 179 score: 1044.0 avg score: 5.8324 memorylength: 131072 epsilon: 0.20887903758048662
Training...
episode: 1741 no of steps: 190 score: 516.0 avg score: 2.7158 memorylength: 131072 epsilon: 0.20869113102629727
Training...
episode: 1742 no of steps: 156 score: 620.0 avg score: 3.9744 memorylength: 131072 epsilon: 0.20850339351192737
Training...
episode: 1743 no of steps: 170 score: 742.0 avg score: 4.3647 memorylength: 131072 epsilon: 0.20831582488530948
Training...
episode: 1744 no of steps: 153 score: 696.0 avg score: 4.549 memorylength: 131072 epsilon: 0.2081284249945131
Training...
episode: 1745 no of steps: 156 score: 657.0 avg score: 4.2115 memorylength: 131072 epsilon: 0.20794119368774414
Training...
episode: 1746 no of steps: 146 score: 418.0 avg score: 2.863 memorylength: 131072 epsilon: 0.2077541308133454
Training...
episode: 1747 no of steps: 155 score: 1274.0 avg score: 8.2194 memorylength: 131072 epsilon: 0.20756723621979586
Training...
episode: 1748 no of steps: 150 score: 783.0 avg score: 5.22 memorylength: 131072 epsilon: 0.20738050975571096
Training...
episode: 1749 no of steps: 167 score: 732.0 avg score: 4.3832 memorylength: 131072 epsilon: 0.2071939512698421
Training...
episode: 1750 no of steps: 151 score: 803.0 avg score: 5.3179 memorylength: 131072 epsilon: 0.2070075606110771
saving states...
Training...
episode: 1751 no of steps: 161 score: 461.0 avg score: 2.8634 memorylength: 131072 epsilon: 0.2068213376284394
Training...
episode: 1752 no of steps: 143 score: 174.0 avg score: 1.2168 memorylength: 131072 epsilon: 0.2066352821710883
Training...
episode: 1753 no of steps: 160 score: 877.0 avg score: 5.4812 memorylength: 131072 epsilon: 0.20644939408831903
Training...
episode: 1754 no of steps: 162 score: 918.0 avg score: 5.6667 memorylength: 131072 epsilon: 0.20626367322956213
Training...
episode: 1755 no of steps: 152 score: 710.0 avg score: 4.6711 memorylength: 131072 epsilon: 0.20607811944438376
Training...
episode: 1756 no of steps: 145 score: 427.0 avg score: 2.9448 memorylength: 131072 epsilon: 0.20589273258248525
Training...
episode: 1757 no of steps: 148 score: 377.0 avg score: 2.5473 memorylength: 131072 epsilon: 0.20570751249370334
Training...
episode: 1758 no of steps: 173 score: 807.0 avg score: 4.6647 memorylength: 131072 epsilon: 0.20552245902800967
Training...
episode: 1759 no of steps: 161 score: 526.0 avg score: 3.2671 memorylength: 131072 epsilon: 0.20533757203551095
Training...
episode: 1760 no of steps: 148 score: 795.0 avg score: 5.3716 memorylength: 131072 epsilon: 0.20515285136644876
Training...
episode: 1761 no of steps: 145 score: 293.0 avg score: 2.0207 memorylength: 131072 epsilon: 0.20496829687119922
Training...
episode: 1762 no of steps: 147 score: 692.0 avg score: 4.7075 memorylength: 131072 epsilon: 0.2047839084002733
Training...
episode: 1763 no of steps: 157 score: 1228.0 avg score: 7.8217 memorylength: 131072 epsilon: 0.20459968580431623
Training...
episode: 1764 no of steps: 142 score: 785.0 avg score: 5.5282 memorylength: 131072 epsilon: 0.20441562893410778
Training...
episode: 1765 no of steps: 143 score: 684.0 avg score: 4.7832 memorylength: 131072 epsilon: 0.20423173764056182
Training...
episode: 1766 no of steps: 148 score: 364.0 avg score: 2.4595 memorylength: 131072 epsilon: 0.20404801177472648
Training...
episode: 1767 no of steps: 138 score: 571.0 avg score: 4.1377 memorylength: 131072 epsilon: 0.20386445118778365
Training...
episode: 1768 no of steps: 144 score: 575.0 avg score: 3.9931 memorylength: 131072 epsilon: 0.2036810557310494
Training...
episode: 1769 no of steps: 152 score: 439.0 avg score: 2.8882 memorylength: 131072 epsilon: 0.2034978252559733
Training...
episode: 1770 no of steps: 165 score: 620.0 avg score: 3.7576 memorylength: 131072 epsilon: 0.20331475961413864
Training...
episode: 1771 no of steps: 146 score: 1017.0 avg score: 6.9658 memorylength: 131072 epsilon: 0.20313185865726235
Training...
episode: 1772 no of steps: 169 score: 1198.0 avg score: 7.0888 memorylength: 131072 epsilon: 0.20294912223719452
Training...
episode: 1773 no of steps: 160 score: 1019.0 avg score: 6.3688 memorylength: 131072 epsilon: 0.20276655020591877
Training...
episode: 1774 no of steps: 173 score: 1181.0 avg score: 6.8266 memorylength: 131072 epsilon: 0.20258414241555162
Training...
episode: 1775 no of steps: 161 score: 837.0 avg score: 5.1988 memorylength: 131072 epsilon: 0.20240189871834283
Training...
episode: 1776 no of steps: 157 score: 1082.0 avg score: 6.8917 memorylength: 131072 epsilon: 0.20221981896667493
Training...
episode: 1777 no of steps: 159 score: 946.0 avg score: 5.9497 memorylength: 131072 epsilon: 0.2020379030130634
Training...
episode: 1778 no of steps: 136 score: 792.0 avg score: 5.8235 memorylength: 131072 epsilon: 0.2018561507101562
Training...
episode: 1779 no of steps: 145 score: 664.0 avg score: 4.5793 memorylength: 131072 epsilon: 0.20167456191073407
Training...
episode: 1780 no of steps: 161 score: 779.0 avg score: 4.8385 memorylength: 131072 epsilon: 0.20149313646771
Training...
episode: 1781 no of steps: 153 score: 468.0 avg score: 3.0588 memorylength: 131072 epsilon: 0.20131187423412936
Training...
episode: 1782 no of steps: 136 score: 504.0 avg score: 3.7059 memorylength: 131072 epsilon: 0.2011307750631698
Training...
episode: 1783 no of steps: 140 score: 281.0 avg score: 2.0071 memorylength: 131072 epsilon: 0.20094983880814085
Training...
episode: 1784 no of steps: 156 score: 540.0 avg score: 3.4615 memorylength: 131072 epsilon: 0.20076906532248429
Training...
episode: 1785 no of steps: 150 score: 427.0 avg score: 2.8467 memorylength: 131072 epsilon: 0.2005884544597735
Training...
episode: 1786 no of steps: 156 score: 782.0 avg score: 5.0128 memorylength: 131072 epsilon: 0.20040800607371373
Training...
episode: 1787 no of steps: 143 score: 907.0 avg score: 6.3427 memorylength: 131072 epsilon: 0.20022772001814168
Training...
episode: 1788 no of steps: 146 score: 1015.0 avg score: 6.9521 memorylength: 131072 epsilon: 0.20004759614702572
Training...
episode: 1789 no of steps: 157 score: 804.0 avg score: 5.121 memorylength: 131072 epsilon: 0.1998676343144655
Training...
episode: 1790 no of steps: 153 score: 1080.0 avg score: 7.0588 memorylength: 131072 epsilon: 0.19968783437469184
Training...
episode: 1791 no of steps: 174 score: 702.0 avg score: 4.0345 memorylength: 131072 epsilon: 0.1995081961820669
Training...
episode: 1792 no of steps: 166 score: 698.0 avg score: 4.2048 memorylength: 131072 epsilon: 0.19932871959108364
Training...
episode: 1793 no of steps: 167 score: 581.0 avg score: 3.479 memorylength: 131072 epsilon: 0.19914940445636606
Training...
episode: 1794 no of steps: 144 score: 272.0 avg score: 1.8889 memorylength: 131072 epsilon: 0.19897025063266888
Training...
episode: 1795 no of steps: 159 score: 355.0 avg score: 2.2327 memorylength: 131072 epsilon: 0.19879125797487748
Training...
episode: 1796 no of steps: 127 score: 348.0 avg score: 2.7402 memorylength: 131072 epsilon: 0.19861242633800782
Training...
episode: 1797 no of steps: 135 score: 449.0 avg score: 3.3259 memorylength: 131072 epsilon: 0.19843375557720627
Training...
episode: 1798 no of steps: 143 score: 422.0 avg score: 2.951 memorylength: 131072 epsilon: 0.19825524554774948
Training...
episode: 1799 no of steps: 149 score: 437.0 avg score: 2.9329 memorylength: 131072 epsilon: 0.19807689610504428
Training...
episode: 1800 no of steps: 134 score: 597.0 avg score: 4.4552 memorylength: 131072 epsilon: 0.1978987071046277
saving states...
Training...
episode: 1801 no of steps: 149 score: 629.0 avg score: 4.2215 memorylength: 131072 epsilon: 0.19772067840216656
Training...
episode: 1802 no of steps: 176 score: 720.0 avg score: 4.0909 memorylength: 131072 epsilon: 0.19754280985345768
Training...
episode: 1803 no of steps: 147 score: 615.0 avg score: 4.1837 memorylength: 131072 epsilon: 0.19736510131442742
Training...
episode: 1804 no of steps: 137 score: 803.0 avg score: 5.8613 memorylength: 131072 epsilon: 0.19718755264113197
Training...
episode: 1805 no of steps: 146 score: 875.0 avg score: 5.9932 memorylength: 131072 epsilon: 0.19701016368975682
Training...
episode: 1806 no of steps: 145 score: 825.0 avg score: 5.6897 memorylength: 131072 epsilon: 0.19683293431661694
Training...
episode: 1807 no of steps: 142 score: 854.0 avg score: 6.0141 memorylength: 131072 epsilon: 0.19665586437815652
Training...
episode: 1808 no of steps: 166 score: 939.0 avg score: 5.6566 memorylength: 131072 epsilon: 0.19647895373094887
Training...
episode: 1809 no of steps: 179 score: 791.0 avg score: 4.419 memorylength: 131072 epsilon: 0.19630220223169645
Training...
episode: 1810 no of steps: 188 score: 873.0 avg score: 4.6436 memorylength: 131072 epsilon: 0.1961256097372304
Training...
episode: 1811 no of steps: 178 score: 715.0 avg score: 4.0169 memorylength: 131072 epsilon: 0.1959491761045109
Training...
episode: 1812 no of steps: 171 score: 737.0 avg score: 4.3099 memorylength: 131072 epsilon: 0.1957729011906266
Training...
episode: 1813 no of steps: 178 score: 792.0 avg score: 4.4494 memorylength: 131072 epsilon: 0.19559678485279494
Training...
episode: 1814 no of steps: 174 score: 813.0 avg score: 4.6724 memorylength: 131072 epsilon: 0.19542082694836155
Training...
episode: 1815 no of steps: 167 score: 675.0 avg score: 4.0419 memorylength: 131072 epsilon: 0.19524502733480062
Training...
episode: 1816 no of steps: 154 score: 775.0 avg score: 5.0325 memorylength: 131072 epsilon: 0.1950693858697144
Training...
episode: 1817 no of steps: 163 score: 625.0 avg score: 3.8344 memorylength: 131072 epsilon: 0.19489390241083326
Training...
episode: 1818 no of steps: 159 score: 811.0 avg score: 5.1006 memorylength: 131072 epsilon: 0.1947185768160157
Training...
episode: 1819 no of steps: 151 score: 1038.0 avg score: 6.8742 memorylength: 131072 epsilon: 0.19454340894324784
Training...
episode: 1820 no of steps: 128 score: 466.0 avg score: 3.6406 memorylength: 131072 epsilon: 0.1943683986506438
Training...
episode: 1821 no of steps: 158 score: 817.0 avg score: 5.1709 memorylength: 131072 epsilon: 0.19419354579644516
Training...
episode: 1822 no of steps: 155 score: 908.0 avg score: 5.8581 memorylength: 131072 epsilon: 0.19401885023902116
Training...
episode: 1823 no of steps: 153 score: 899.0 avg score: 5.8758 memorylength: 131072 epsilon: 0.19384431183686832
Training...
episode: 1824 no of steps: 143 score: 679.0 avg score: 4.7483 memorylength: 131072 epsilon: 0.1936699304486106
Training...
episode: 1825 no of steps: 138 score: 904.0 avg score: 6.5507 memorylength: 131072 epsilon: 0.19349570593299906
Training...
episode: 1826 no of steps: 159 score: 540.0 avg score: 3.3962 memorylength: 131072 epsilon: 0.19332163814891176
Training...
episode: 1827 no of steps: 156 score: 764.0 avg score: 4.8974 memorylength: 131072 epsilon: 0.19314772695535387
Training...
episode: 1828 no of steps: 166 score: 614.0 avg score: 3.6988 memorylength: 131072 epsilon: 0.19297397221145723
Training...
episode: 1829 no of steps: 136 score: 930.0 avg score: 6.8382 memorylength: 131072 epsilon: 0.19280037377648057
Training...
episode: 1830 no of steps: 150 score: 692.0 avg score: 4.6133 memorylength: 131072 epsilon: 0.19262693150980906
Training...
episode: 1831 no of steps: 152 score: 1084.0 avg score: 7.1316 memorylength: 131072 epsilon: 0.19245364527095454
Training...
episode: 1832 no of steps: 153 score: 865.0 avg score: 5.6536 memorylength: 131072 epsilon: 0.1922805149195551
Training...
episode: 1833 no of steps: 157 score: 637.0 avg score: 4.0573 memorylength: 131072 epsilon: 0.1921075403153752
Training...
episode: 1834 no of steps: 153 score: 658.0 avg score: 4.3007 memorylength: 131072 epsilon: 0.19193472131830533
Training...
episode: 1835 no of steps: 169 score: 881.0 avg score: 5.213 memorylength: 131072 epsilon: 0.1917620577883621
Training...
episode: 1836 no of steps: 170 score: 626.0 avg score: 3.6824 memorylength: 131072 epsilon: 0.1915895495856881
Training...
episode: 1837 no of steps: 184 score: 621.0 avg score: 3.375 memorylength: 131072 epsilon: 0.1914171965705516
Training...
episode: 1838 no of steps: 170 score: 196.0 avg score: 1.1529 memorylength: 131072 epsilon: 0.1912449986033467
Training...
episode: 1839 no of steps: 138 score: 468.0 avg score: 3.3913 memorylength: 131072 epsilon: 0.19107295554459303
Training...
episode: 1840 no of steps: 171 score: 391.0 avg score: 2.2865 memorylength: 131072 epsilon: 0.19090106725493575
Training...
episode: 1841 no of steps: 132 score: 166.0 avg score: 1.2576 memorylength: 131072 epsilon: 0.19072933359514518
Training...
episode: 1842 no of steps: 158 score: 613.0 avg score: 3.8797 memorylength: 131072 epsilon: 0.19055775442611722
Training...
episode: 1843 no of steps: 148 score: 648.0 avg score: 4.3784 memorylength: 131072 epsilon: 0.19038632960887264
Training...
episode: 1844 no of steps: 125 score: 1024.0 avg score: 8.192 memorylength: 131072 epsilon: 0.19021505900455737
Training...
episode: 1845 no of steps: 154 score: 756.0 avg score: 4.9091 memorylength: 131072 epsilon: 0.1900439424744422
Training...
episode: 1846 no of steps: 170 score: 839.0 avg score: 4.9353 memorylength: 131072 epsilon: 0.1898729798799227
Training...
episode: 1847 no of steps: 154 score: 840.0 avg score: 5.4545 memorylength: 131072 epsilon: 0.18970217108251922
Training...
episode: 1848 no of steps: 150 score: 776.0 avg score: 5.1733 memorylength: 131072 epsilon: 0.18953151594387652
Training...
episode: 1849 no of steps: 184 score: 1020.0 avg score: 5.5435 memorylength: 131072 epsilon: 0.18936101432576408
Training...
episode: 1850 no of steps: 189 score: 684.0 avg score: 3.619 memorylength: 131072 epsilon: 0.18919066609007545
saving states...
Training...
episode: 1851 no of steps: 179 score: 636.0 avg score: 3.5531 memorylength: 131072 epsilon: 0.1890204710988286
Training...
episode: 1852 no of steps: 169 score: 378.0 avg score: 2.2367 memorylength: 131072 epsilon: 0.18885042921416556
Training...
episode: 1853 no of steps: 176 score: 507.0 avg score: 2.8807 memorylength: 131072 epsilon: 0.18868054029835246
Training...
episode: 1854 no of steps: 145 score: 559.0 avg score: 3.8552 memorylength: 131072 epsilon: 0.1885108042137792
Training...
episode: 1855 no of steps: 144 score: 853.0 avg score: 5.9236 memorylength: 131072 epsilon: 0.1883412208229595
Training...
episode: 1856 no of steps: 155 score: 350.0 avg score: 2.2581 memorylength: 131072 epsilon: 0.18817178998853093
Training...
episode: 1857 no of steps: 142 score: 348.0 avg score: 2.4507 memorylength: 131072 epsilon: 0.1880025115732544
Training...
episode: 1858 no of steps: 142 score: 810.0 avg score: 5.7042 memorylength: 131072 epsilon: 0.18783338544001446
Training...
episode: 1859 no of steps: 142 score: 775.0 avg score: 5.4577 memorylength: 131072 epsilon: 0.18766441145181886
Training...
episode: 1860 no of steps: 127 score: 630.0 avg score: 4.9606 memorylength: 131072 epsilon: 0.18749558947179873
Training...
episode: 1861 no of steps: 148 score: 345.0 avg score: 2.3311 memorylength: 131072 epsilon: 0.1873269193632082
Training...
episode: 1862 no of steps: 152 score: 376.0 avg score: 2.4737 memorylength: 131072 epsilon: 0.18715840098942452
Training...
episode: 1863 no of steps: 147 score: 494.0 avg score: 3.3605 memorylength: 131072 epsilon: 0.18699003421394778
Training...
episode: 1864 no of steps: 156 score: 395.0 avg score: 2.5321 memorylength: 131072 epsilon: 0.18682181890040084
Training...
episode: 1865 no of steps: 153 score: 358.0 avg score: 2.3399 memorylength: 131072 epsilon: 0.18665375491252936
Training...
episode: 1866 no of steps: 168 score: 1029.0 avg score: 6.125 memorylength: 131072 epsilon: 0.1864858421142014
Training...
episode: 1867 no of steps: 180 score: 1017.0 avg score: 5.65 memorylength: 131072 epsilon: 0.18631808036940772
Training...
episode: 1868 no of steps: 148 score: 1366.0 avg score: 9.2297 memorylength: 131072 epsilon: 0.1861504695422612
Training...
episode: 1869 no of steps: 169 score: 912.0 avg score: 5.3964 memorylength: 131072 epsilon: 0.1859830094969971
Training...
episode: 1870 no of steps: 170 score: 444.0 avg score: 2.6118 memorylength: 131072 epsilon: 0.1858157000979727
Training...
episode: 1871 no of steps: 175 score: 814.0 avg score: 4.6514 memorylength: 131072 epsilon: 0.18564854120966753
Training...
episode: 1872 no of steps: 149 score: 859.0 avg score: 5.7651 memorylength: 131072 epsilon: 0.18548153269668277
Training...
episode: 1873 no of steps: 146 score: 343.0 avg score: 2.3493 memorylength: 131072 epsilon: 0.18531467442374147
Training...
episode: 1874 no of steps: 133 score: 386.0 avg score: 2.9023 memorylength: 131072 epsilon: 0.18514796625568855
Training...
episode: 1875 no of steps: 152 score: 616.0 avg score: 4.0526 memorylength: 131072 epsilon: 0.18498140805749028
Training...
episode: 1876 no of steps: 150 score: 558.0 avg score: 3.72 memorylength: 131072 epsilon: 0.1848149996942346
Training...
episode: 1877 no of steps: 157 score: 610.0 avg score: 3.8854 memorylength: 131072 epsilon: 0.18464874103113058
Training...
episode: 1878 no of steps: 135 score: 494.0 avg score: 3.6593 memorylength: 131072 epsilon: 0.18448263193350892
Training...
episode: 1879 no of steps: 147 score: 651.0 avg score: 4.4286 memorylength: 131072 epsilon: 0.184316672266821
Training...
episode: 1880 no of steps: 155 score: 680.0 avg score: 4.3871 memorylength: 131072 epsilon: 0.18415086189663965
Training...
episode: 1881 no of steps: 176 score: 915.0 avg score: 5.1989 memorylength: 131072 epsilon: 0.18398520068865842
Training...
episode: 1882 no of steps: 168 score: 920.0 avg score: 5.4762 memorylength: 131072 epsilon: 0.18381968850869168
Training...
episode: 1883 no of steps: 181 score: 1106.0 avg score: 6.1105 memorylength: 131072 epsilon: 0.1836543252226746
Training...
episode: 1884 no of steps: 154 score: 802.0 avg score: 5.2078 memorylength: 131072 epsilon: 0.18348911069666285
Training...
episode: 1885 no of steps: 147 score: 953.0 avg score: 6.483 memorylength: 131072 epsilon: 0.18332404479683276
Training...
episode: 1886 no of steps: 153 score: 708.0 avg score: 4.6275 memorylength: 131072 epsilon: 0.18315912738948079
Training...
episode: 1887 no of steps: 159 score: 360.0 avg score: 2.2642 memorylength: 131072 epsilon: 0.182994358341024
Training...
episode: 1888 no of steps: 139 score: 981.0 avg score: 7.0576 memorylength: 131072 epsilon: 0.18282973751799933
Training...
episode: 1889 no of steps: 147 score: 745.0 avg score: 5.068 memorylength: 131072 epsilon: 0.18266526478706396
Training...
episode: 1890 no of steps: 151 score: 462.0 avg score: 3.0596 memorylength: 131072 epsilon: 0.18250094001499498
Training...
episode: 1891 no of steps: 150 score: 711.0 avg score: 4.74 memorylength: 131072 epsilon: 0.18233676306868923
Training...
episode: 1892 no of steps: 151 score: 432.0 avg score: 2.8609 memorylength: 131072 epsilon: 0.18217273381516352
Training...
episode: 1893 no of steps: 142 score: 588.0 avg score: 4.1408 memorylength: 131072 epsilon: 0.182008852121554
Training...
episode: 1894 no of steps: 143 score: 1106.0 avg score: 7.7343 memorylength: 131072 epsilon: 0.18184511785511656
Training...
episode: 1895 no of steps: 167 score: 805.0 avg score: 4.8204 memorylength: 131072 epsilon: 0.18168153088322642
Training...
episode: 1896 no of steps: 194 score: 755.0 avg score: 3.8918 memorylength: 131072 epsilon: 0.18151809107337813
Training...
episode: 1897 no of steps: 174 score: 711.0 avg score: 4.0862 memorylength: 131072 epsilon: 0.1813547982931854
Training...
episode: 1898 no of steps: 156 score: 430.0 avg score: 2.7564 memorylength: 131072 epsilon: 0.18119165241038118
Training...
episode: 1899 no of steps: 171 score: 747.0 avg score: 4.3684 memorylength: 131072 epsilon: 0.18102865329281717
Training...
episode: 1900 no of steps: 193 score: 557.0 avg score: 2.886 memorylength: 131072 epsilon: 0.18086580080846415
saving states...
Training...
episode: 1901 no of steps: 173 score: 866.0 avg score: 5.0058 memorylength: 131072 epsilon: 0.18070309482541155
Training...
episode: 1902 no of steps: 171 score: 799.0 avg score: 4.6725 memorylength: 131072 epsilon: 0.18054053521186755
Training...
episode: 1903 no of steps: 141 score: 875.0 avg score: 6.2057 memorylength: 131072 epsilon: 0.18037812183615887
Training...
episode: 1904 no of steps: 148 score: 872.0 avg score: 5.8919 memorylength: 131072 epsilon: 0.1802158545667306
Training...
episode: 1905 no of steps: 168 score: 1212.0 avg score: 7.2143 memorylength: 131072 epsilon: 0.1800537332721463
Training...
episode: 1906 no of steps: 143 score: 1190.0 avg score: 8.3217 memorylength: 131072 epsilon: 0.17989175782108766
Training...
episode: 1907 no of steps: 157 score: 849.0 avg score: 5.4076 memorylength: 131072 epsilon: 0.17972992808235463
Training...
episode: 1908 no of steps: 149 score: 935.0 avg score: 6.2752 memorylength: 131072 epsilon: 0.17956824392486506
Training...
episode: 1909 no of steps: 161 score: 557.0 avg score: 3.4596 memorylength: 131072 epsilon: 0.17940670521765478
Training...
episode: 1910 no of steps: 168 score: 580.0 avg score: 3.4524 memorylength: 131072 epsilon: 0.17924531182987746
Training...
episode: 1911 no of steps: 168 score: 676.0 avg score: 4.0238 memorylength: 131072 epsilon: 0.1790840636308044
Training...
episode: 1912 no of steps: 167 score: 481.0 avg score: 2.8802 memorylength: 131072 epsilon: 0.1789229604898246
Training...
episode: 1913 no of steps: 160 score: 459.0 avg score: 2.8688 memorylength: 131072 epsilon: 0.17876200227644443
Training...
episode: 1914 no of steps: 182 score: 207.0 avg score: 1.1374 memorylength: 131072 epsilon: 0.17860118886028784
Training...
episode: 1915 no of steps: 147 score: 468.0 avg score: 3.1837 memorylength: 131072 epsilon: 0.17844052011109582
Training...
episode: 1916 no of steps: 149 score: 570.0 avg score: 3.8255 memorylength: 131072 epsilon: 0.1782799958987268
Training...
episode: 1917 no of steps: 144 score: 434.0 avg score: 3.0139 memorylength: 131072 epsilon: 0.17811961609315607
Training...
episode: 1918 no of steps: 151 score: 1130.0 avg score: 7.4834 memorylength: 131072 epsilon: 0.17795938056447605
Training...
episode: 1919 no of steps: 163 score: 1287.0 avg score: 7.8957 memorylength: 131072 epsilon: 0.17779928918289592
Training...
episode: 1920 no of steps: 152 score: 921.0 avg score: 6.0592 memorylength: 131072 epsilon: 0.1776393418187416
Training...
episode: 1921 no of steps: 151 score: 1046.0 avg score: 6.9272 memorylength: 131072 epsilon: 0.1774795383424558
Training...
episode: 1922 no of steps: 180 score: 688.0 avg score: 3.8222 memorylength: 131072 epsilon: 0.17731987862459764
Training...
episode: 1923 no of steps: 139 score: 661.0 avg score: 4.7554 memorylength: 131072 epsilon: 0.1771603625358428
Training...
episode: 1924 no of steps: 150 score: 258.0 avg score: 1.72 memorylength: 131072 epsilon: 0.17700098994698316
Training...
episode: 1925 no of steps: 141 score: 84.0 avg score: 0.5957 memorylength: 131072 epsilon: 0.17684176072892702
Training...
episode: 1926 no of steps: 135 score: 336.0 avg score: 2.4889 memorylength: 131072 epsilon: 0.17668267475269853
Training...
episode: 1927 no of steps: 169 score: 610.0 avg score: 3.6095 memorylength: 131072 epsilon: 0.17652373188943826
Training...
episode: 1928 no of steps: 183 score: 702.0 avg score: 3.8361 memorylength: 131072 epsilon: 0.17636493201040232
Training...
episode: 1929 no of steps: 182 score: 788.0 avg score: 4.3297 memorylength: 131072 epsilon: 0.1762062749869628
Training...
episode: 1930 no of steps: 184 score: 759.0 avg score: 4.125 memorylength: 131072 epsilon: 0.17604776069060765
Training...
episode: 1931 no of steps: 175 score: 1147.0 avg score: 6.5543 memorylength: 131072 epsilon: 0.17588938899294015
Training...
episode: 1932 no of steps: 174 score: 864.0 avg score: 4.9655 memorylength: 131072 epsilon: 0.17573115976567924
Training...
episode: 1933 no of steps: 136 score: 860.0 avg score: 6.3235 memorylength: 131072 epsilon: 0.17557307288065924
Training...
episode: 1934 no of steps: 161 score: 498.0 avg score: 3.0932 memorylength: 131072 epsilon: 0.1754151282098298
Training...
episode: 1935 no of steps: 140 score: 927.0 avg score: 6.6214 memorylength: 131072 epsilon: 0.17525732562525567
Training...
episode: 1936 no of steps: 154 score: 768.0 avg score: 4.987 memorylength: 131072 epsilon: 0.1750996649991168
Training...
episode: 1937 no of steps: 148 score: 854.0 avg score: 5.7703 memorylength: 131072 epsilon: 0.17494214620370807
Training...
episode: 1938 no of steps: 158 score: 497.0 avg score: 3.1456 memorylength: 131072 epsilon: 0.1747847691114392
Training...
episode: 1939 no of steps: 149 score: 592.0 avg score: 3.9732 memorylength: 131072 epsilon: 0.17462753359483477
Training...
episode: 1940 no of steps: 147 score: 1015.0 avg score: 6.9048 memorylength: 131072 epsilon: 0.174470439526534
Training...
episode: 1941 no of steps: 147 score: 776.0 avg score: 5.2789 memorylength: 131072 epsilon: 0.17431348677929068
Training...
episode: 1942 no of steps: 160 score: 579.0 avg score: 3.6188 memorylength: 131072 epsilon: 0.17415667522597308
Training...
episode: 1943 no of steps: 170 score: 252.0 avg score: 1.4824 memorylength: 131072 epsilon: 0.17400000473956387
Training...
episode: 1944 no of steps: 172 score: 676.0 avg score: 3.9302 memorylength: 131072 epsilon: 0.17384347519315987
Training...
episode: 1945 no of steps: 199 score: 954.0 avg score: 4.794 memorylength: 131072 epsilon: 0.17368708645997222
Training...
episode: 1946 no of steps: 195 score: 544.0 avg score: 2.7897 memorylength: 131072 epsilon: 0.17353083841332598
Training...
episode: 1947 no of steps: 170 score: 810.0 avg score: 4.7647 memorylength: 131072 epsilon: 0.17337473092666023
Training...
episode: 1948 no of steps: 174 score: 1105.0 avg score: 6.3506 memorylength: 131072 epsilon: 0.17321876387352794
Training...
episode: 1949 no of steps: 172 score: 1062.0 avg score: 6.1744 memorylength: 131072 epsilon: 0.1730629371275957
Training...
episode: 1950 no of steps: 167 score: 562.0 avg score: 3.3653 memorylength: 131072 epsilon: 0.17290725056264394
saving states...
Training...
episode: 1951 no of steps: 156 score: 786.0 avg score: 5.0385 memorylength: 131072 epsilon: 0.17275170405256648
Training...
episode: 1952 no of steps: 163 score: 983.0 avg score: 6.0307 memorylength: 131072 epsilon: 0.17259629747137067
Training...
episode: 1953 no of steps: 160 score: 738.0 avg score: 4.6125 memorylength: 131072 epsilon: 0.17244103069317712
Training...
episode: 1954 no of steps: 167 score: 767.0 avg score: 4.5928 memorylength: 131072 epsilon: 0.1722859035922198
Training...
episode: 1955 no of steps: 147 score: 634.0 avg score: 4.3129 memorylength: 131072 epsilon: 0.17213091604284567
Training...
episode: 1956 no of steps: 152 score: 661.0 avg score: 4.3487 memorylength: 131072 epsilon: 0.17197606791951484
Training...
episode: 1957 no of steps: 161 score: 314.0 avg score: 1.9503 memorylength: 131072 epsilon: 0.17182135909680038
Training...
episode: 1958 no of steps: 143 score: 387.0 avg score: 2.7063 memorylength: 131072 epsilon: 0.171666789449388
Training...
episode: 1959 no of steps: 161 score: 621.0 avg score: 3.8571 memorylength: 131072 epsilon: 0.17151235885207644
Training...
episode: 1960 no of steps: 146 score: 774.0 avg score: 5.3014 memorylength: 131072 epsilon: 0.17135806717977675
Training...
episode: 1961 no of steps: 146 score: 927.0 avg score: 6.3493 memorylength: 131072 epsilon: 0.17120391430751283
Training...
episode: 1962 no of steps: 146 score: 705.0 avg score: 4.8288 memorylength: 131072 epsilon: 0.17104990011042068
Training...
episode: 1963 no of steps: 166 score: 917.0 avg score: 5.5241 memorylength: 131072 epsilon: 0.17089602446374894
Training...
episode: 1964 no of steps: 154 score: 1025.0 avg score: 6.6558 memorylength: 131072 epsilon: 0.17074228724285823
Training...
episode: 1965 no of steps: 153 score: 1044.0 avg score: 6.8235 memorylength: 131072 epsilon: 0.1705886883232214
Training...
episode: 1966 no of steps: 167 score: 727.0 avg score: 4.3533 memorylength: 131072 epsilon: 0.17043522758042337
Training...
episode: 1967 no of steps: 180 score: 718.0 avg score: 3.9889 memorylength: 131072 epsilon: 0.1702819048901609
Training...
episode: 1968 no of steps: 183 score: 854.0 avg score: 4.6667 memorylength: 131072 epsilon: 0.1701287201282426
Training...
episode: 1969 no of steps: 192 score: 931.0 avg score: 4.849 memorylength: 131072 epsilon: 0.16997567317058876
Training...
episode: 1970 no of steps: 173 score: 696.0 avg score: 4.0231 memorylength: 131072 epsilon: 0.16982276389323145
Training...
episode: 1971 no of steps: 171 score: 733.0 avg score: 4.2865 memorylength: 131072 epsilon: 0.16966999217231404
Training...
episode: 1972 no of steps: 177 score: 1252.0 avg score: 7.0734 memorylength: 131072 epsilon: 0.16951735788409147
Training...
episode: 1973 no of steps: 189 score: 983.0 avg score: 5.2011 memorylength: 131072 epsilon: 0.16936486090492994
Training...
episode: 1974 no of steps: 171 score: 758.0 avg score: 4.4327 memorylength: 131072 epsilon: 0.16921250111130692
Training...
episode: 1975 no of steps: 153 score: 499.0 avg score: 3.2614 memorylength: 131072 epsilon: 0.16906027837981097
Training...
episode: 1976 no of steps: 146 score: 899.0 avg score: 6.1575 memorylength: 131072 epsilon: 0.16890819258714163
Training...
episode: 1977 no of steps: 142 score: 883.0 avg score: 6.2183 memorylength: 131072 epsilon: 0.16875624361010944
Training...
episode: 1978 no of steps: 137 score: 843.0 avg score: 6.1533 memorylength: 131072 epsilon: 0.16860443132563563
Training...
episode: 1979 no of steps: 139 score: 502.0 avg score: 3.6115 memorylength: 131072 epsilon: 0.1684527556107524
Training...
episode: 1980 no of steps: 134 score: 629.0 avg score: 4.694 memorylength: 131072 epsilon: 0.16830121634260228
Training...
episode: 1981 no of steps: 152 score: 389.0 avg score: 2.5592 memorylength: 131072 epsilon: 0.16814981339843854
Training...
episode: 1982 no of steps: 187 score: 843.0 avg score: 4.508 memorylength: 131072 epsilon: 0.16799854665562466
Training...
episode: 1983 no of steps: 162 score: 558.0 avg score: 3.4444 memorylength: 131072 epsilon: 0.16784741599163475
Training...
episode: 1984 no of steps: 169 score: 620.0 avg score: 3.6686 memorylength: 131072 epsilon: 0.16769642128405282
Training...
episode: 1985 no of steps: 175 score: 316.0 avg score: 1.8057 memorylength: 131072 epsilon: 0.16754556241057322
Training...
episode: 1986 no of steps: 185 score: 505.0 avg score: 2.7297 memorylength: 131072 epsilon: 0.16739483924900025
Training...
episode: 1987 no of steps: 174 score: 841.0 avg score: 4.8333 memorylength: 131072 epsilon: 0.16724425167724807
Training...
episode: 1988 no of steps: 160 score: 804.0 avg score: 5.025 memorylength: 131072 epsilon: 0.16709379957334083
Training...
episode: 1989 no of steps: 154 score: 710.0 avg score: 4.6104 memorylength: 131072 epsilon: 0.16694348281541224
Training...
episode: 1990 no of steps: 135 score: 779.0 avg score: 5.7704 memorylength: 131072 epsilon: 0.16679330128170583
Training...
episode: 1991 no of steps: 141 score: 760.0 avg score: 5.3901 memorylength: 131072 epsilon: 0.16664325485057443
Training...
episode: 1992 no of steps: 162 score: 687.0 avg score: 4.2407 memorylength: 131072 epsilon: 0.16649334340048047
Training...
episode: 1993 no of steps: 154 score: 873.0 avg score: 5.6688 memorylength: 131072 epsilon: 0.1663435668099957
Training...
episode: 1994 no of steps: 164 score: 358.0 avg score: 2.1829 memorylength: 131072 epsilon: 0.166193924957801
Training...
episode: 1995 no of steps: 157 score: 525.0 avg score: 3.3439 memorylength: 131072 epsilon: 0.16604441772268652
Training...
episode: 1996 no of steps: 159 score: 90.0 avg score: 0.566 memorylength: 131072 epsilon: 0.16589504498355137
Training...
episode: 1997 no of steps: 175 score: 211.0 avg score: 1.2057 memorylength: 131072 epsilon: 0.16574580661940364
Training...
episode: 1998 no of steps: 151 score: 450.0 avg score: 2.9801 memorylength: 131072 epsilon: 0.1655967025093602
Training...
episode: 1999 no of steps: 149 score: 466.0 avg score: 3.1275 memorylength: 131072 epsilon: 0.1654477325326468
Training...
episode: 2000 no of steps: 141 score: 84.0 avg score: 0.5957 memorylength: 131072 epsilon: 0.16529889656859764
saving states...
Training...
episode: 2001 no of steps: 136 score: 697.0 avg score: 5.125 memorylength: 131072 epsilon: 0.16515019449665566
Training...
episode: 2002 no of steps: 143 score: 652.0 avg score: 4.5594 memorylength: 131072 epsilon: 0.1650016261963722
Training...
episode: 2003 no of steps: 142 score: 1064.0 avg score: 7.493 memorylength: 131072 epsilon: 0.16485319154740682
Training...
episode: 2004 no of steps: 169 score: 676.0 avg score: 4.0 memorylength: 131072 epsilon: 0.16470489042952752
Training...
episode: 2005 no of steps: 174 score: 1113.0 avg score: 6.3966 memorylength: 131072 epsilon: 0.16455672272261038
Training...
episode: 2006 no of steps: 167 score: 1215.0 avg score: 7.2754 memorylength: 131072 epsilon: 0.16440868830663954
Training...
episode: 2007 no of steps: 176 score: 679.0 avg score: 3.858 memorylength: 131072 epsilon: 0.1642607870617071
Training...
episode: 2008 no of steps: 179 score: 904.0 avg score: 5.0503 memorylength: 131072 epsilon: 0.16411301886801308
Training...
episode: 2009 no of steps: 197 score: 603.0 avg score: 3.0609 memorylength: 131072 epsilon: 0.1639653836058652
Training...
episode: 2010 no of steps: 171 score: 1019.0 avg score: 5.9591 memorylength: 131072 epsilon: 0.16381788115567894
Training...
episode: 2011 no of steps: 164 score: 824.0 avg score: 5.0244 memorylength: 131072 epsilon: 0.16367051139797728
Training...
episode: 2012 no of steps: 154 score: 467.0 avg score: 3.0325 memorylength: 131072 epsilon: 0.16352327421339063
Training...
episode: 2013 no of steps: 137 score: 547.0 avg score: 3.9927 memorylength: 131072 epsilon: 0.163376169482657
Training...
episode: 2014 no of steps: 145 score: 549.0 avg score: 3.7862 memorylength: 131072 epsilon: 0.16322919708662148
Training...
episode: 2015 no of steps: 119 score: 638.0 avg score: 5.3613 memorylength: 131072 epsilon: 0.1630823569062364
Training...
episode: 2016 no of steps: 146 score: 622.0 avg score: 4.2603 memorylength: 131072 epsilon: 0.16293564882256123
Training...
episode: 2017 no of steps: 147 score: 938.0 avg score: 6.381 memorylength: 131072 epsilon: 0.1627890727167624
Training...
episode: 2018 no of steps: 153 score: 414.0 avg score: 2.7059 memorylength: 131072 epsilon: 0.1626426284701133
Training...
episode: 2019 no of steps: 146 score: 179.0 avg score: 1.226 memorylength: 131072 epsilon: 0.16249631596399405
Training...
episode: 2020 no of steps: 151 score: 654.0 avg score: 4.3311 memorylength: 131072 epsilon: 0.1623501350798915
Training...
episode: 2021 no of steps: 155 score: 707.0 avg score: 4.5613 memorylength: 131072 epsilon: 0.16220408569939918
Training...
episode: 2022 no of steps: 164 score: 703.0 avg score: 4.2866 memorylength: 131072 epsilon: 0.16205816770421702
Training...
episode: 2023 no of steps: 200 score: 949.0 avg score: 4.745 memorylength: 131072 epsilon: 0.16191238097615146
Training...
episode: 2024 no of steps: 183 score: 513.0 avg score: 2.8033 memorylength: 131072 epsilon: 0.16176672539711526
Training...
episode: 2025 no of steps: 182 score: 776.0 avg score: 4.2637 memorylength: 131072 epsilon: 0.16162120084912732
Training...
episode: 2026 no of steps: 161 score: 677.0 avg score: 4.205 memorylength: 131072 epsilon: 0.16147580721431284
Training...
episode: 2027 no of steps: 155 score: 850.0 avg score: 5.4839 memorylength: 131072 epsilon: 0.1613305443749029
Training...
episode: 2028 no of steps: 136 score: 782.0 avg score: 5.75 memorylength: 131072 epsilon: 0.1611854122132347
Training...
episode: 2029 no of steps: 160 score: 534.0 avg score: 3.3375 memorylength: 131072 epsilon: 0.16104041061175103
Training...
episode: 2030 no of steps: 135 score: 376.0 avg score: 2.7852 memorylength: 131072 epsilon: 0.16089553945300072
Training...
episode: 2031 no of steps: 144 score: 169.0 avg score: 1.1736 memorylength: 131072 epsilon: 0.16075079861963806
Training...
episode: 2032 no of steps: 146 score: 206.0 avg score: 1.411 memorylength: 131072 epsilon: 0.16060618799442292
Training...
episode: 2033 no of steps: 142 score: 621.0 avg score: 4.3732 memorylength: 131072 epsilon: 0.1604617074602208
Training...
episode: 2034 no of steps: 134 score: 634.0 avg score: 4.7313 memorylength: 131072 epsilon: 0.16031735690000234
Training...
episode: 2035 no of steps: 140 score: 775.0 avg score: 5.5357 memorylength: 131072 epsilon: 0.16017313619684367
Training...
episode: 2036 no of steps: 181 score: 785.0 avg score: 4.337 memorylength: 131072 epsilon: 0.16002904523392594
Training...
episode: 2037 no of steps: 156 score: 889.0 avg score: 5.6987 memorylength: 131072 epsilon: 0.15988508389453554
Training...
episode: 2038 no of steps: 169 score: 600.0 avg score: 3.5503 memorylength: 131072 epsilon: 0.1597412520620637
Training...
episode: 2039 no of steps: 173 score: 1115.0 avg score: 6.4451 memorylength: 131072 epsilon: 0.15959754962000672
Training...
episode: 2040 no of steps: 168 score: 759.0 avg score: 4.5179 memorylength: 131072 epsilon: 0.15945397645196552
Training...
episode: 2041 no of steps: 171 score: 781.0 avg score: 4.5673 memorylength: 131072 epsilon: 0.15931053244164584
Training...
episode: 2042 no of steps: 151 score: 597.0 avg score: 3.9536 memorylength: 131072 epsilon: 0.15916721747285809
Training...
episode: 2043 no of steps: 153 score: 751.0 avg score: 4.9085 memorylength: 131072 epsilon: 0.15902403142951704
Training...
episode: 2044 no of steps: 141 score: 847.0 avg score: 6.0071 memorylength: 131072 epsilon: 0.15888097419564212
Training...
episode: 2045 no of steps: 143 score: 472.0 avg score: 3.3007 memorylength: 131072 epsilon: 0.15873804565535682
Training...
episode: 2046 no of steps: 146 score: 493.0 avg score: 3.3767 memorylength: 131072 epsilon: 0.15859524569288913
Training...
episode: 2047 no of steps: 147 score: 688.0 avg score: 4.6803 memorylength: 131072 epsilon: 0.15845257419257097
Training...
episode: 2048 no of steps: 155 score: 758.0 avg score: 4.8903 memorylength: 131072 epsilon: 0.15831003103883853
Training...
episode: 2049 no of steps: 164 score: 845.0 avg score: 5.1524 memorylength: 131072 epsilon: 0.15816761611623176
Training...
episode: 2050 no of steps: 171 score: 1145.0 avg score: 6.6959 memorylength: 131072 epsilon: 0.15802532930939459
saving states...
Training...
episode: 2051 no of steps: 163 score: 917.0 avg score: 5.6258 memorylength: 131072 epsilon: 0.1578831705030747
Training...
episode: 2052 no of steps: 179 score: 1093.0 avg score: 6.1061 memorylength: 131072 epsilon: 0.15774113958212344
Training...
episode: 2053 no of steps: 170 score: 763.0 avg score: 4.4882 memorylength: 131072 epsilon: 0.1575992364314958
Training...
episode: 2054 no of steps: 170 score: 688.0 avg score: 4.0471 memorylength: 131072 epsilon: 0.15745746093625013
Training...
episode: 2055 no of steps: 162 score: 300.0 avg score: 1.8519 memorylength: 131072 epsilon: 0.15731581298154837
Training...
episode: 2056 no of steps: 160 score: 549.0 avg score: 3.4312 memorylength: 131072 epsilon: 0.15717429245265557
Training...
episode: 2057 no of steps: 152 score: 498.0 avg score: 3.2763 memorylength: 131072 epsilon: 0.1570328992349402
Training...
episode: 2058 no of steps: 143 score: 744.0 avg score: 5.2028 memorylength: 131072 epsilon: 0.15689163321387373
Training...
episode: 2059 no of steps: 154 score: 778.0 avg score: 5.0519 memorylength: 131072 epsilon: 0.15675049427503057
Training...
episode: 2060 no of steps: 147 score: 538.0 avg score: 3.6599 memorylength: 131072 epsilon: 0.1566094823040883
Training...
episode: 2061 no of steps: 135 score: 562.0 avg score: 4.163 memorylength: 131072 epsilon: 0.1564685971868271
Training...
episode: 2062 no of steps: 160 score: 754.0 avg score: 4.7125 memorylength: 131072 epsilon: 0.15632783880913015
Training...
episode: 2063 no of steps: 146 score: 328.0 avg score: 2.2466 memorylength: 131072 epsilon: 0.15618720705698302
Training...
episode: 2064 no of steps: 177 score: 930.0 avg score: 5.2542 memorylength: 131072 epsilon: 0.15604670181647406
Training...
episode: 2065 no of steps: 170 score: 489.0 avg score: 2.8765 memorylength: 131072 epsilon: 0.155906322973794
Training...
episode: 2066 no of steps: 164 score: 670.0 avg score: 4.0854 memorylength: 131072 epsilon: 0.155766070415236
Training...
episode: 2067 no of steps: 174 score: 769.0 avg score: 4.4195 memorylength: 131072 epsilon: 0.15562594402719546
Training...
episode: 2068 no of steps: 151 score: 612.0 avg score: 4.053 memorylength: 131072 epsilon: 0.15548594369616994
Training...
episode: 2069 no of steps: 155 score: 722.0 avg score: 4.6581 memorylength: 131072 epsilon: 0.15534606930875927
Training...
episode: 2070 no of steps: 136 score: 457.0 avg score: 3.3603 memorylength: 131072 epsilon: 0.15520632075166507
Training...
episode: 2071 no of steps: 129 score: 303.0 avg score: 2.3488 memorylength: 131072 epsilon: 0.15506669791169114
Training...
episode: 2072 no of steps: 140 score: 756.0 avg score: 5.4 memorylength: 131072 epsilon: 0.15492720067574284
Training...
episode: 2073 no of steps: 126 score: 636.0 avg score: 5.0476 memorylength: 131072 epsilon: 0.1547878289308275
Training...
episode: 2074 no of steps: 138 score: 457.0 avg score: 3.3116 memorylength: 131072 epsilon: 0.1546485825640539
Training...
episode: 2075 no of steps: 167 score: 1011.0 avg score: 6.0539 memorylength: 131072 epsilon: 0.15450946146263259
Training...
episode: 2076 no of steps: 163 score: 721.0 avg score: 4.4233 memorylength: 131072 epsilon: 0.15437046551387537
Training...
episode: 2077 no of steps: 175 score: 619.0 avg score: 3.5371 memorylength: 131072 epsilon: 0.1542315946051956
Training...
episode: 2078 no of steps: 181 score: 882.0 avg score: 4.8729 memorylength: 131072 epsilon: 0.15409284862410774
Training...
episode: 2079 no of steps: 204 score: 847.0 avg score: 4.152 memorylength: 131072 epsilon: 0.15395422745822762
Training...
episode: 2080 no of steps: 166 score: 743.0 avg score: 4.4759 memorylength: 131072 epsilon: 0.15381573099527207
Training...
episode: 2081 no of steps: 170 score: 700.0 avg score: 4.1176 memorylength: 131072 epsilon: 0.1536773591230589
Training...
episode: 2082 no of steps: 160 score: 648.0 avg score: 4.05 memorylength: 131072 epsilon: 0.15353911172950696
Training...
episode: 2083 no of steps: 152 score: 504.0 avg score: 3.3158 memorylength: 131072 epsilon: 0.15340098870263577
Training...
episode: 2084 no of steps: 163 score: 744.0 avg score: 4.5644 memorylength: 131072 epsilon: 0.15326298993056575
Training...
episode: 2085 no of steps: 171 score: 542.0 avg score: 3.1696 memorylength: 131072 epsilon: 0.15312511530151784
Training...
episode: 2086 no of steps: 145 score: 754.0 avg score: 5.2 memorylength: 131072 epsilon: 0.15298736470381363
Training...
episode: 2087 no of steps: 153 score: 1035.0 avg score: 6.7647 memorylength: 131072 epsilon: 0.1528497380258751
Training...
episode: 2088 no of steps: 144 score: 924.0 avg score: 6.4167 memorylength: 131072 epsilon: 0.1527122351562246
Training...
episode: 2089 no of steps: 153 score: 688.0 avg score: 4.4967 memorylength: 131072 epsilon: 0.15257485598348483
Training...
episode: 2090 no of steps: 150 score: 657.0 avg score: 4.38 memorylength: 131072 epsilon: 0.1524376003963786
Training...
episode: 2091 no of steps: 179 score: 895.0 avg score: 5.0 memorylength: 131072 epsilon: 0.15230046828372898
Training...
episode: 2092 no of steps: 174 score: 229.0 avg score: 1.3161 memorylength: 131072 epsilon: 0.15216345953445887
Training...
episode: 2093 no of steps: 160 score: 112.0 avg score: 0.7 memorylength: 131072 epsilon: 0.15202657403759123
Training...
episode: 2094 no of steps: 162 score: 583.0 avg score: 3.5988 memorylength: 131072 epsilon: 0.15188981168224874
Training...
episode: 2095 no of steps: 163 score: 242.0 avg score: 1.4847 memorylength: 131072 epsilon: 0.15175317235765395
Training...
episode: 2096 no of steps: 159 score: 764.0 avg score: 4.805 memorylength: 131072 epsilon: 0.15161665595312898
Training...
episode: 2097 no of steps: 150 score: 369.0 avg score: 2.46 memorylength: 131072 epsilon: 0.1514802623580955
Training...
episode: 2098 no of steps: 131 score: 191.0 avg score: 1.458 memorylength: 131072 epsilon: 0.1513439914620747
Training...
episode: 2099 no of steps: 160 score: 548.0 avg score: 3.425 memorylength: 131072 epsilon: 0.15120784315468716
Training...
episode: 2100 no of steps: 134 score: 498.0 avg score: 3.7164 memorylength: 131072 epsilon: 0.15107181732565275
saving states...
Training...
episode: 2101 no of steps: 134 score: 566.0 avg score: 4.2239 memorylength: 131072 epsilon: 0.15093591386479052
Training...
episode: 2102 no of steps: 150 score: 715.0 avg score: 4.7667 memorylength: 131072 epsilon: 0.1508001326620187
Training...
episode: 2103 no of steps: 154 score: 543.0 avg score: 3.526 memorylength: 131072 epsilon: 0.15066447360735444
Training...
episode: 2104 no of steps: 167 score: 958.0 avg score: 5.7365 memorylength: 131072 epsilon: 0.15052893659091401
Training...
episode: 2105 no of steps: 144 score: 998.0 avg score: 6.9306 memorylength: 131072 epsilon: 0.1503935215029123
Training...
episode: 2106 no of steps: 182 score: 958.0 avg score: 5.2637 memorylength: 131072 epsilon: 0.15025822823366314
Training...
episode: 2107 no of steps: 183 score: 948.0 avg score: 5.1803 memorylength: 131072 epsilon: 0.15012305667357895
Training...
episode: 2108 no of steps: 176 score: 735.0 avg score: 4.1761 memorylength: 131072 epsilon: 0.14998800671317078
Training...
episode: 2109 no of steps: 187 score: 1077.0 avg score: 5.7594 memorylength: 131072 epsilon: 0.14985307824304817
Training...
episode: 2110 no of steps: 178 score: 733.0 avg score: 4.118 memorylength: 131072 epsilon: 0.149718271153919
Training...
episode: 2111 no of steps: 167 score: 574.0 avg score: 3.4371 memorylength: 131072 epsilon: 0.14958358533658955
Training...
episode: 2112 no of steps: 145 score: 654.0 avg score: 4.5103 memorylength: 131072 epsilon: 0.1494490206819643
Training...
episode: 2113 no of steps: 151 score: 466.0 avg score: 3.0861 memorylength: 131072 epsilon: 0.14931457708104592
Training...
episode: 2114 no of steps: 139 score: 778.0 avg score: 5.5971 memorylength: 131072 epsilon: 0.14918025442493504
Training...
episode: 2115 no of steps: 150 score: 909.0 avg score: 6.06 memorylength: 131072 epsilon: 0.14904605260483023
Training...
episode: 2116 no of steps: 151 score: 994.0 avg score: 6.5828 memorylength: 131072 epsilon: 0.14891197151202815
Training...
episode: 2117 no of steps: 145 score: 764.0 avg score: 5.269 memorylength: 131072 epsilon: 0.14877801103792296
Training...
episode: 2118 no of steps: 135 score: 528.0 avg score: 3.9111 memorylength: 131072 epsilon: 0.14864417107400682
Training...
episode: 2119 no of steps: 145 score: 678.0 avg score: 4.6759 memorylength: 131072 epsilon: 0.14851045151186923
Training...
episode: 2120 no of steps: 158 score: 280.0 avg score: 1.7722 memorylength: 131072 epsilon: 0.1483768522431974
Training...
episode: 2121 no of steps: 159 score: 741.0 avg score: 4.6604 memorylength: 131072 epsilon: 0.1482433731597759
Training...
episode: 2122 no of steps: 163 score: 899.0 avg score: 5.5153 memorylength: 131072 epsilon: 0.14811001415348665
Training...
episode: 2123 no of steps: 170 score: 729.0 avg score: 4.2882 memorylength: 131072 epsilon: 0.1479767751163089
Training...
episode: 2124 no of steps: 147 score: 1210.0 avg score: 8.2313 memorylength: 131072 epsilon: 0.14784365594031895
Training...
episode: 2125 no of steps: 160 score: 1305.0 avg score: 8.1562 memorylength: 131072 epsilon: 0.14771065651769033
Training...
episode: 2126 no of steps: 167 score: 1063.0 avg score: 6.3653 memorylength: 131072 epsilon: 0.14757777674069342
Training...
episode: 2127 no of steps: 170 score: 961.0 avg score: 5.6529 memorylength: 131072 epsilon: 0.14744501650169567
Training...
episode: 2128 no of steps: 179 score: 690.0 avg score: 3.8547 memorylength: 131072 epsilon: 0.14731237569316122
Training...
episode: 2129 no of steps: 158 score: 696.0 avg score: 4.4051 memorylength: 131072 epsilon: 0.1471798542076511
Training...
episode: 2130 no of steps: 174 score: 1050.0 avg score: 6.0345 memorylength: 131072 epsilon: 0.14704745193782276
Training...
episode: 2131 no of steps: 179 score: 770.0 avg score: 4.3017 memorylength: 131072 epsilon: 0.14691516877643046
Training...
episode: 2132 no of steps: 160 score: 736.0 avg score: 4.6 memorylength: 131072 epsilon: 0.14678300461632482
Training...
episode: 2133 no of steps: 154 score: 731.0 avg score: 4.7468 memorylength: 131072 epsilon: 0.1466509593504528
Training...
episode: 2134 no of steps: 163 score: 958.0 avg score: 5.8773 memorylength: 131072 epsilon: 0.14651903287185783
Training...
episode: 2135 no of steps: 162 score: 654.0 avg score: 4.037 memorylength: 131072 epsilon: 0.14638722507367935
Training...
episode: 2136 no of steps: 148 score: 837.0 avg score: 5.6554 memorylength: 131072 epsilon: 0.1462555358491531
Training...
episode: 2137 no of steps: 146 score: 625.0 avg score: 4.2808 memorylength: 131072 epsilon: 0.14612396509161077
Training...
episode: 2138 no of steps: 144 score: 927.0 avg score: 6.4375 memorylength: 131072 epsilon: 0.14599251269448008
Training...
episode: 2139 no of steps: 143 score: 414.0 avg score: 2.8951 memorylength: 131072 epsilon: 0.14586117855128453
Training...
episode: 2140 no of steps: 142 score: 414.0 avg score: 2.9155 memorylength: 131072 epsilon: 0.14572996255564347
Training...
episode: 2141 no of steps: 172 score: 944.0 avg score: 5.4884 memorylength: 131072 epsilon: 0.14559886460127197
Training...
episode: 2142 no of steps: 191 score: 1029.0 avg score: 5.3874 memorylength: 131072 epsilon: 0.14546788458198068
Training...
episode: 2143 no of steps: 178 score: 757.0 avg score: 4.2528 memorylength: 131072 epsilon: 0.14533702239167573
Training...
episode: 2144 no of steps: 181 score: 749.0 avg score: 4.1381 memorylength: 131072 epsilon: 0.14520627792435878
Training...
episode: 2145 no of steps: 207 score: 834.0 avg score: 4.029 memorylength: 131072 epsilon: 0.14507565107412676
Training...
episode: 2146 no of steps: 204 score: 1143.0 avg score: 5.6029 memorylength: 131072 epsilon: 0.14494514173517195
Training...
episode: 2147 no of steps: 183 score: 895.0 avg score: 4.8907 memorylength: 131072 epsilon: 0.1448147498017818
Training...
episode: 2148 no of steps: 181 score: 862.0 avg score: 4.7624 memorylength: 131072 epsilon: 0.14468447516833874
Training...
episode: 2149 no of steps: 181 score: 717.0 avg score: 3.9613 memorylength: 131072 epsilon: 0.14455431772932045
Training...
episode: 2150 no of steps: 168 score: 704.0 avg score: 4.1905 memorylength: 131072 epsilon: 0.14442427737929928
saving states...
Training...
episode: 2151 no of steps: 166 score: 1096.0 avg score: 6.6024 memorylength: 131072 epsilon: 0.1442943540129426
Training...
episode: 2152 no of steps: 136 score: 431.0 avg score: 3.1691 memorylength: 131072 epsilon: 0.14416454752501248
Training...
episode: 2153 no of steps: 138 score: 604.0 avg score: 4.3768 memorylength: 131072 epsilon: 0.1440348578103656
Training...
episode: 2154 no of steps: 153 score: 714.0 avg score: 4.6667 memorylength: 131072 epsilon: 0.14390528476395334
Training...
episode: 2155 no of steps: 141 score: 601.0 avg score: 4.2624 memorylength: 131072 epsilon: 0.14377582828082147
Training...
episode: 2156 no of steps: 145 score: 539.0 avg score: 3.7172 memorylength: 131072 epsilon: 0.14364648825611034
Training...
episode: 2157 no of steps: 137 score: 567.0 avg score: 4.1387 memorylength: 131072 epsilon: 0.1435172645850544
Training...
episode: 2158 no of steps: 136 score: 318.0 avg score: 2.3382 memorylength: 131072 epsilon: 0.14338815716298256
Training...
episode: 2159 no of steps: 150 score: 931.0 avg score: 6.2067 memorylength: 131072 epsilon: 0.1432591658853177
Training...
episode: 2160 no of steps: 152 score: 621.0 avg score: 4.0855 memorylength: 131072 epsilon: 0.14313029064757699
Training...
episode: 2161 no of steps: 164 score: 531.0 avg score: 3.2378 memorylength: 131072 epsilon: 0.1430015313453714
Training...
episode: 2162 no of steps: 171 score: 698.0 avg score: 4.0819 memorylength: 131072 epsilon: 0.14287288787440594
Training...
episode: 2163 no of steps: 163 score: 1191.0 avg score: 7.3067 memorylength: 131072 epsilon: 0.1427443601304794
Training...
episode: 2164 no of steps: 197 score: 828.0 avg score: 4.203 memorylength: 131072 epsilon: 0.14261594800948418
Training...
episode: 2165 no of steps: 192 score: 1134.0 avg score: 5.9062 memorylength: 131072 epsilon: 0.14248765140740663
Training...
episode: 2166 no of steps: 172 score: 832.0 avg score: 4.8372 memorylength: 131072 epsilon: 0.14235947022032636
Training...
episode: 2167 no of steps: 197 score: 1201.0 avg score: 6.0964 memorylength: 131072 epsilon: 0.1422314043444167
Training...
episode: 2168 no of steps: 197 score: 1012.0 avg score: 5.1371 memorylength: 131072 epsilon: 0.14210345367594418
Training...
episode: 2169 no of steps: 180 score: 646.0 avg score: 3.5889 memorylength: 131072 epsilon: 0.14197561811126885
Training...
episode: 2170 no of steps: 146 score: 381.0 avg score: 2.6096 memorylength: 131072 epsilon: 0.14184789754684385
Training...
episode: 2171 no of steps: 162 score: 1002.0 avg score: 6.1852 memorylength: 131072 epsilon: 0.1417202918792155
Training...
episode: 2172 no of steps: 148 score: 628.0 avg score: 4.2432 memorylength: 131072 epsilon: 0.14159280100502322
Training...
episode: 2173 no of steps: 143 score: 603.0 avg score: 4.2168 memorylength: 131072 epsilon: 0.14146542482099939
Training...
episode: 2174 no of steps: 144 score: 1006.0 avg score: 6.9861 memorylength: 131072 epsilon: 0.14133816322396933
Training...
episode: 2175 no of steps: 140 score: 827.0 avg score: 5.9071 memorylength: 131072 epsilon: 0.14121101611085107
Training...
episode: 2176 no of steps: 135 score: 611.0 avg score: 4.5259 memorylength: 131072 epsilon: 0.14108398337865552
Training...
episode: 2177 no of steps: 152 score: 747.0 avg score: 4.9145 memorylength: 131072 epsilon: 0.1409570649244861
Training...
episode: 2178 no of steps: 152 score: 469.0 avg score: 3.0855 memorylength: 131072 epsilon: 0.14083026064553889
Training...
episode: 2179 no of steps: 207 score: 961.0 avg score: 4.6425 memorylength: 131072 epsilon: 0.1407035704391024
Training...
episode: 2180 no of steps: 174 score: 630.0 avg score: 3.6207 memorylength: 131072 epsilon: 0.14057699420255754
Training...
episode: 2181 no of steps: 183 score: 141.0 avg score: 0.7705 memorylength: 131072 epsilon: 0.14045053183337758
Training...
episode: 2182 no of steps: 162 score: 890.0 avg score: 5.4938 memorylength: 131072 epsilon: 0.14032418322912799
Training...
episode: 2183 no of steps: 173 score: 962.0 avg score: 5.5607 memorylength: 131072 epsilon: 0.14019794828746637
Training...
episode: 2184 no of steps: 167 score: 628.0 avg score: 3.7605 memorylength: 131072 epsilon: 0.14007182690614242
Training...
episode: 2185 no of steps: 184 score: 792.0 avg score: 4.3043 memorylength: 131072 epsilon: 0.13994581898299785
Training...
episode: 2186 no of steps: 172 score: 1185.0 avg score: 6.8895 memorylength: 131072 epsilon: 0.1398199244159662
Training...
episode: 2187 no of steps: 153 score: 675.0 avg score: 4.4118 memorylength: 131072 epsilon: 0.13969414310307288
Training...
episode: 2188 no of steps: 158 score: 882.0 avg score: 5.5823 memorylength: 131072 epsilon: 0.139568474942435
Training...
episode: 2189 no of steps: 152 score: 1395.0 avg score: 9.1776 memorylength: 131072 epsilon: 0.13944291983226134
Training...
episode: 2190 no of steps: 144 score: 890.0 avg score: 6.1806 memorylength: 131072 epsilon: 0.1393174776708523
Training...
episode: 2191 no of steps: 154 score: 393.0 avg score: 2.5519 memorylength: 131072 epsilon: 0.13919214835659965
Training...
episode: 2192 no of steps: 156 score: 849.0 avg score: 5.4423 memorylength: 131072 epsilon: 0.13906693178798674
Training...
episode: 2193 no of steps: 142 score: 258.0 avg score: 1.8169 memorylength: 131072 epsilon: 0.13894182786358802
Training...
episode: 2194 no of steps: 167 score: 814.0 avg score: 4.8743 memorylength: 131072 epsilon: 0.1388168364820694
Training...
episode: 2195 no of steps: 154 score: 792.0 avg score: 5.1429 memorylength: 131072 epsilon: 0.1386919575421878
Training...
episode: 2196 no of steps: 174 score: 949.0 avg score: 5.454 memorylength: 131072 epsilon: 0.13856719094279132
Training...
episode: 2197 no of steps: 159 score: 810.0 avg score: 5.0943 memorylength: 131072 epsilon: 0.13844253658281896
Training...
episode: 2198 no of steps: 165 score: 1069.0 avg score: 6.4788 memorylength: 131072 epsilon: 0.1383179943613007
Training...
episode: 2199 no of steps: 154 score: 693.0 avg score: 4.5 memorylength: 131072 epsilon: 0.13819356417735737
Training...
episode: 2200 no of steps: 151 score: 875.0 avg score: 5.7947 memorylength: 131072 epsilon: 0.13806924593020042
saving states...
Training...
episode: 2201 no of steps: 144 score: 787.0 avg score: 5.4653 memorylength: 131072 epsilon: 0.13794503951913217
Training...
episode: 2202 no of steps: 163 score: 843.0 avg score: 5.1718 memorylength: 131072 epsilon: 0.13782094484354535
Training...
episode: 2203 no of steps: 157 score: 798.0 avg score: 5.0828 memorylength: 131072 epsilon: 0.1376969618029233
Training...
episode: 2204 no of steps: 145 score: 773.0 avg score: 5.331 memorylength: 131072 epsilon: 0.1375730902968397
Training...
episode: 2205 no of steps: 178 score: 1065.0 avg score: 5.9831 memorylength: 131072 epsilon: 0.13744933022495873
Training...
episode: 2206 no of steps: 146 score: 715.0 avg score: 4.8973 memorylength: 131072 epsilon: 0.1373256814870346
Training...
episode: 2207 no of steps: 152 score: 1070.0 avg score: 7.0395 memorylength: 131072 epsilon: 0.13720214398291192
Training...
episode: 2208 no of steps: 163 score: 1314.0 avg score: 8.0613 memorylength: 131072 epsilon: 0.13707871761252527
Training...
episode: 2209 no of steps: 177 score: 826.0 avg score: 4.6667 memorylength: 131072 epsilon: 0.13695540227589925
Training...
episode: 2210 no of steps: 186 score: 727.0 avg score: 3.9086 memorylength: 131072 epsilon: 0.1368321978731485
Training...
episode: 2211 no of steps: 160 score: 992.0 avg score: 6.2 memorylength: 131072 epsilon: 0.13670910430447736
Training...
episode: 2212 no of steps: 199 score: 729.0 avg score: 3.6633 memorylength: 131072 epsilon: 0.1365861214701801
Training...
episode: 2213 no of steps: 170 score: 1119.0 avg score: 6.5824 memorylength: 131072 epsilon: 0.1364632492706406
Training...
episode: 2214 no of steps: 181 score: 863.0 avg score: 4.768 memorylength: 131072 epsilon: 0.13634048760633238
Training...
episode: 2215 no of steps: 144 score: 1044.0 avg score: 7.25 memorylength: 131072 epsilon: 0.13621783637781845
Training...
episode: 2216 no of steps: 141 score: 1202.0 avg score: 8.5248 memorylength: 131072 epsilon: 0.13609529548575136
Training...
episode: 2217 no of steps: 127 score: 965.0 avg score: 7.5984 memorylength: 131072 epsilon: 0.13597286483087295
Training...
episode: 2218 no of steps: 151 score: 887.0 avg score: 5.8742 memorylength: 131072 epsilon: 0.1358505443140144
Training...
episode: 2219 no of steps: 128 score: 471.0 avg score: 3.6797 memorylength: 131072 epsilon: 0.13572833383609606
Training...
episode: 2220 no of steps: 145 score: 747.0 avg score: 5.1517 memorylength: 131072 epsilon: 0.13560623329812743
Training...
episode: 2221 no of steps: 147 score: 810.0 avg score: 5.5102 memorylength: 131072 epsilon: 0.13548424260120712
Training...
episode: 2222 no of steps: 137 score: 291.0 avg score: 2.1241 memorylength: 131072 epsilon: 0.13536236164652257
Training...
episode: 2223 no of steps: 152 score: 414.0 avg score: 2.7237 memorylength: 131072 epsilon: 0.1352405903353503
Training...
episode: 2224 no of steps: 154 score: 399.0 avg score: 2.5909 memorylength: 131072 epsilon: 0.13511892856905552
Training...
episode: 2225 no of steps: 166 score: 603.0 avg score: 3.6325 memorylength: 131072 epsilon: 0.1349973762490921
Training...
episode: 2226 no of steps: 182 score: 476.0 avg score: 2.6154 memorylength: 131072 epsilon: 0.13487593327700279
Training...
episode: 2227 no of steps: 164 score: 643.0 avg score: 3.9207 memorylength: 131072 epsilon: 0.1347545995544187
Training...
episode: 2228 no of steps: 169 score: 849.0 avg score: 5.0237 memorylength: 131072 epsilon: 0.13463337498305947
Training...
episode: 2229 no of steps: 210 score: 981.0 avg score: 4.6714 memorylength: 131072 epsilon: 0.13451225946473325
Training...
episode: 2230 no of steps: 198 score: 585.0 avg score: 2.9545 memorylength: 131072 epsilon: 0.13439125290133644
Training...
episode: 2231 no of steps: 239 score: 310.0 avg score: 1.2971 memorylength: 131072 epsilon: 0.13427035519485378
Training...
episode: 2232 no of steps: 197 score: 1026.0 avg score: 5.2081 memorylength: 131072 epsilon: 0.13414956624735805
Training...
episode: 2233 no of steps: 212 score: 877.0 avg score: 4.1368 memorylength: 131072 epsilon: 0.13402888596101017
Training...
episode: 2234 no of steps: 185 score: 1082.0 avg score: 5.8486 memorylength: 131072 epsilon: 0.13390831423805916
Training...
episode: 2235 no of steps: 156 score: 1051.0 avg score: 6.7372 memorylength: 131072 epsilon: 0.13378785098084198
Training...
episode: 2236 no of steps: 153 score: 718.0 avg score: 4.6928 memorylength: 131072 epsilon: 0.13366749609178322
Training...
episode: 2237 no of steps: 173 score: 686.0 avg score: 3.9653 memorylength: 131072 epsilon: 0.13354724947339552
Training...
episode: 2238 no of steps: 148 score: 612.0 avg score: 4.1351 memorylength: 131072 epsilon: 0.13342711102827917
Training...
episode: 2239 no of steps: 159 score: 589.0 avg score: 3.7044 memorylength: 131072 epsilon: 0.13330708065912186
Training...
episode: 2240 no of steps: 166 score: 390.0 avg score: 2.3494 memorylength: 131072 epsilon: 0.1331871582686991
Training...
episode: 2241 no of steps: 158 score: 426.0 avg score: 2.6962 memorylength: 131072 epsilon: 0.1330673437598737
Training...
episode: 2242 no of steps: 143 score: 421.0 avg score: 2.9441 memorylength: 131072 epsilon: 0.132947637035596
Training...
episode: 2243 no of steps: 151 score: 681.0 avg score: 4.5099 memorylength: 131072 epsilon: 0.1328280379989034
Training...
episode: 2244 no of steps: 158 score: 632.0 avg score: 4.0 memorylength: 131072 epsilon: 0.13270854655292072
Training...
episode: 2245 no of steps: 175 score: 738.0 avg score: 4.2171 memorylength: 131072 epsilon: 0.13258916260085998
Training...
episode: 2246 no of steps: 161 score: 957.0 avg score: 5.9441 memorylength: 131072 epsilon: 0.13246988604602003
Training...
episode: 2247 no of steps: 185 score: 693.0 avg score: 3.7459 memorylength: 131072 epsilon: 0.13235071679178692
Training...
episode: 2248 no of steps: 195 score: 643.0 avg score: 3.2974 memorylength: 131072 epsilon: 0.13223165474163354
Training...
episode: 2249 no of steps: 203 score: 822.0 avg score: 4.0493 memorylength: 131072 epsilon: 0.13211269979911971
Training...
episode: 2250 no of steps: 193 score: 738.0 avg score: 3.8238 memorylength: 131072 epsilon: 0.13199385186789178
saving states...
Training...
episode: 2251 no of steps: 166 score: 845.0 avg score: 5.0904 memorylength: 131072 epsilon: 0.13187511085168296
Training...
episode: 2252 no of steps: 177 score: 1080.0 avg score: 6.1017 memorylength: 131072 epsilon: 0.13175647665431306
Training...
episode: 2253 no of steps: 157 score: 1208.0 avg score: 7.6943 memorylength: 131072 epsilon: 0.1316379491796884
Training...
episode: 2254 no of steps: 148 score: 675.0 avg score: 4.5608 memorylength: 131072 epsilon: 0.13151952833180164
Training...
episode: 2255 no of steps: 151 score: 696.0 avg score: 4.6093 memorylength: 131072 epsilon: 0.1314012140147319
Training...
episode: 2256 no of steps: 135 score: 264.0 avg score: 1.9556 memorylength: 131072 epsilon: 0.13128300613264465
Training...
episode: 2257 no of steps: 139 score: 418.0 avg score: 3.0072 memorylength: 131072 epsilon: 0.1311649045897914
Training...
episode: 2258 no of steps: 142 score: 180.0 avg score: 1.2676 memorylength: 131072 epsilon: 0.1310469092905099
Training...
episode: 2259 no of steps: 141 score: 643.0 avg score: 4.5603 memorylength: 131072 epsilon: 0.13092902013922403
Training...
episode: 2260 no of steps: 151 score: 550.0 avg score: 3.6424 memorylength: 131072 epsilon: 0.1308112370404436
Training...
episode: 2261 no of steps: 154 score: 963.0 avg score: 6.2532 memorylength: 131072 epsilon: 0.13069355989876413
Training...
episode: 2262 no of steps: 159 score: 736.0 avg score: 4.6289 memorylength: 131072 epsilon: 0.13057598861886724
Training...
episode: 2263 no of steps: 163 score: 760.0 avg score: 4.6626 memorylength: 131072 epsilon: 0.13045852310552022
Training...
episode: 2264 no of steps: 165 score: 1008.0 avg score: 6.1091 memorylength: 131072 epsilon: 0.13034116326357592
Training...
episode: 2265 no of steps: 186 score: 1165.0 avg score: 6.2634 memorylength: 131072 epsilon: 0.13022390899797287
Training...
episode: 2266 no of steps: 167 score: 994.0 avg score: 5.9521 memorylength: 131072 epsilon: 0.13010676021373513
Training...
episode: 2267 no of steps: 180 score: 867.0 avg score: 4.8167 memorylength: 131072 epsilon: 0.12998971681597224
Training...
episode: 2268 no of steps: 170 score: 1382.0 avg score: 8.1294 memorylength: 131072 epsilon: 0.1298727787098789
Training...
episode: 2269 no of steps: 189 score: 1170.0 avg score: 6.1905 memorylength: 131072 epsilon: 0.12975594580073535
Training...
episode: 2270 no of steps: 175 score: 925.0 avg score: 5.2857 memorylength: 131072 epsilon: 0.12963921799390685
Training...
episode: 2271 no of steps: 166 score: 702.0 avg score: 4.2289 memorylength: 131072 epsilon: 0.129522595194844
Training...
episode: 2272 no of steps: 167 score: 1143.0 avg score: 6.8443 memorylength: 131072 epsilon: 0.12940607730908216
Training...
episode: 2273 no of steps: 153 score: 1053.0 avg score: 6.8824 memorylength: 131072 epsilon: 0.12928966424224195
Training...
episode: 2274 no of steps: 164 score: 606.0 avg score: 3.6951 memorylength: 131072 epsilon: 0.1291733559000288
Training...
episode: 2275 no of steps: 133 score: 611.0 avg score: 4.594 memorylength: 131072 epsilon: 0.1290571521882328
Training...
episode: 2276 no of steps: 130 score: 728.0 avg score: 5.6 memorylength: 131072 epsilon: 0.12894105301272904
Training...
episode: 2277 no of steps: 135 score: 835.0 avg score: 6.1852 memorylength: 131072 epsilon: 0.12882505827947716
Training...
episode: 2278 no of steps: 148 score: 1065.0 avg score: 7.1959 memorylength: 131072 epsilon: 0.12870916789452153
Training...
episode: 2279 no of steps: 123 score: 417.0 avg score: 3.3902 memorylength: 131072 epsilon: 0.1285933817639907
Training...
episode: 2280 no of steps: 147 score: 787.0 avg score: 5.3537 memorylength: 131072 epsilon: 0.1284776997940981
Training...
episode: 2281 no of steps: 177 score: 731.0 avg score: 4.1299 memorylength: 131072 epsilon: 0.12836212189114132
Training...
episode: 2282 no of steps: 165 score: 813.0 avg score: 4.9273 memorylength: 131072 epsilon: 0.12824664796150206
Training...
episode: 2283 no of steps: 180 score: 519.0 avg score: 2.8833 memorylength: 131072 epsilon: 0.12813127791164663
Training...
episode: 2284 no of steps: 163 score: 642.0 avg score: 3.9387 memorylength: 131072 epsilon: 0.1280160116481252
Training...
episode: 2285 no of steps: 196 score: 836.0 avg score: 4.2653 memorylength: 131072 epsilon: 0.12790084907757215
Training...
episode: 2286 no of steps: 187 score: 1046.0 avg score: 5.5936 memorylength: 131072 epsilon: 0.12778579010670568
Training...
episode: 2287 no of steps: 171 score: 1165.0 avg score: 6.8129 memorylength: 131072 epsilon: 0.1276708346423281
Training...
episode: 2288 no of steps: 141 score: 783.0 avg score: 5.5532 memorylength: 131072 epsilon: 0.12755598259132545
Training...
episode: 2289 no of steps: 168 score: 1083.0 avg score: 6.4464 memorylength: 131072 epsilon: 0.1274412338606676
Training...
episode: 2290 no of steps: 191 score: 1064.0 avg score: 5.5707 memorylength: 131072 epsilon: 0.12732658835740807
Training...
episode: 2291 no of steps: 163 score: 769.0 avg score: 4.7178 memorylength: 131072 epsilon: 0.1272120459886839
Training...
episode: 2292 no of steps: 186 score: 877.0 avg score: 4.7151 memorylength: 131072 epsilon: 0.1270976066617159
Training...
episode: 2293 no of steps: 142 score: 1489.0 avg score: 10.4859 memorylength: 131072 epsilon: 0.12698327028380813
Training...
episode: 2294 no of steps: 171 score: 873.0 avg score: 5.1053 memorylength: 131072 epsilon: 0.1268690367623481
Training...
episode: 2295 no of steps: 160 score: 1012.0 avg score: 6.325 memorylength: 131072 epsilon: 0.12675490600480668
Training...
episode: 2296 no of steps: 161 score: 632.0 avg score: 3.9255 memorylength: 131072 epsilon: 0.12664087791873804
Training...
episode: 2297 no of steps: 131 score: 445.0 avg score: 3.3969 memorylength: 131072 epsilon: 0.12652695241177925
Training...
episode: 2298 no of steps: 130 score: 489.0 avg score: 3.7615 memorylength: 131072 epsilon: 0.12641312939165075
Training...
episode: 2299 no of steps: 147 score: 450.0 avg score: 3.0612 memorylength: 131072 epsilon: 0.12629940876615586
Training...
episode: 2300 no of steps: 136 score: 395.0 avg score: 2.9044 memorylength: 131072 epsilon: 0.12618579044318096
saving states...
Training...
episode: 2301 no of steps: 135 score: 607.0 avg score: 4.4963 memorylength: 131072 epsilon: 0.126072274330695
Training...
episode: 2302 no of steps: 141 score: 592.0 avg score: 4.1986 memorylength: 131072 epsilon: 0.1259588603367501
Training...
episode: 2303 no of steps: 159 score: 981.0 avg score: 6.1698 memorylength: 131072 epsilon: 0.1258455483694809
Training...
episode: 2304 no of steps: 149 score: 890.0 avg score: 5.9732 memorylength: 131072 epsilon: 0.1257323383371046
Training...
episode: 2305 no of steps: 154 score: 649.0 avg score: 4.2143 memorylength: 131072 epsilon: 0.1256192301479211
Training...
episode: 2306 no of steps: 163 score: 1037.0 avg score: 6.362 memorylength: 131072 epsilon: 0.1255062237103128
Training...
episode: 2307 no of steps: 182 score: 1273.0 avg score: 6.9945 memorylength: 131072 epsilon: 0.12539331893274458
Training...
episode: 2308 no of steps: 178 score: 1449.0 avg score: 8.1404 memorylength: 131072 epsilon: 0.12528051572376334
Training...
episode: 2309 no of steps: 163 score: 1511.0 avg score: 9.2699 memorylength: 131072 epsilon: 0.12516781399199858
Training...
episode: 2310 no of steps: 160 score: 1071.0 avg score: 6.6938 memorylength: 131072 epsilon: 0.12505521364616198
Training...
episode: 2311 no of steps: 171 score: 877.0 avg score: 5.1287 memorylength: 131072 epsilon: 0.12494271459504712
Training...
episode: 2312 no of steps: 170 score: 957.0 avg score: 5.6294 memorylength: 131072 epsilon: 0.1248303167475298
Training...
episode: 2313 no of steps: 176 score: 784.0 avg score: 4.4545 memorylength: 131072 epsilon: 0.12471802001256777
Training...
episode: 2314 no of steps: 181 score: 895.0 avg score: 4.9448 memorylength: 131072 epsilon: 0.12460582429920072
Training...
episode: 2315 no of steps: 173 score: 969.0 avg score: 5.6012 memorylength: 131072 epsilon: 0.12449372951655002
Training...
episode: 2316 no of steps: 145 score: 738.0 avg score: 5.0897 memorylength: 131072 epsilon: 0.12438173557381893
Training...
episode: 2317 no of steps: 156 score: 891.0 avg score: 5.7115 memorylength: 131072 epsilon: 0.12426984238029234
Training...
episode: 2318 no of steps: 144 score: 468.0 avg score: 3.25 memorylength: 131072 epsilon: 0.12415804984533685
Training...
episode: 2319 no of steps: 132 score: 767.0 avg score: 5.8106 memorylength: 131072 epsilon: 0.12404635787840036
Training...
episode: 2320 no of steps: 143 score: 837.0 avg score: 5.8531 memorylength: 131072 epsilon: 0.12393476638901244
Training...
episode: 2321 no of steps: 136 score: 693.0 avg score: 5.0956 memorylength: 131072 epsilon: 0.12382327528678402
Training...
episode: 2322 no of steps: 129 score: 175.0 avg score: 1.3566 memorylength: 131072 epsilon: 0.12371188448140719
Training...
episode: 2323 no of steps: 144 score: 512.0 avg score: 3.5556 memorylength: 131072 epsilon: 0.12360059388265547
Training...
episode: 2324 no of steps: 149 score: 584.0 avg score: 3.9195 memorylength: 131072 epsilon: 0.12348940340038345
Training...
episode: 2325 no of steps: 172 score: 620.0 avg score: 3.6047 memorylength: 131072 epsilon: 0.12337831294452688
Training...
episode: 2326 no of steps: 185 score: 1334.0 avg score: 7.2108 memorylength: 131072 epsilon: 0.12326732242510238
Training...
episode: 2327 no of steps: 195 score: 993.0 avg score: 5.0923 memorylength: 131072 epsilon: 0.1231564317522077
Training...
episode: 2328 no of steps: 198 score: 603.0 avg score: 3.0455 memorylength: 131072 epsilon: 0.12304564083602143
Training...
episode: 2329 no of steps: 199 score: 567.0 avg score: 2.8492 memorylength: 131072 epsilon: 0.1229349495868028
Training...
episode: 2330 no of steps: 189 score: 771.0 avg score: 4.0794 memorylength: 131072 epsilon: 0.12282435791489196
Training...
episode: 2331 no of steps: 159 score: 783.0 avg score: 4.9245 memorylength: 131072 epsilon: 0.12271386573070965
Training...
episode: 2332 no of steps: 180 score: 671.0 avg score: 3.7278 memorylength: 131072 epsilon: 0.12260347294475724
Training...
episode: 2333 no of steps: 151 score: 793.0 avg score: 5.2517 memorylength: 131072 epsilon: 0.12249317946761647
Training...
episode: 2334 no of steps: 145 score: 697.0 avg score: 4.8069 memorylength: 131072 epsilon: 0.12238298520994965
Training...
episode: 2335 no of steps: 137 score: 599.0 avg score: 4.3723 memorylength: 131072 epsilon: 0.12227289008249946
Training...
episode: 2336 no of steps: 141 score: 837.0 avg score: 5.9362 memorylength: 131072 epsilon: 0.12216289399608887
Training...
episode: 2337 no of steps: 137 score: 787.0 avg score: 5.7445 memorylength: 131072 epsilon: 0.12205299686162095
Training...
episode: 2338 no of steps: 140 score: 378.0 avg score: 2.7 memorylength: 131072 epsilon: 0.12194319859007904
Training...
episode: 2339 no of steps: 161 score: 233.0 avg score: 1.4472 memorylength: 131072 epsilon: 0.12183349909252664
Training...
episode: 2340 no of steps: 150 score: 530.0 avg score: 3.5333 memorylength: 131072 epsilon: 0.12172389828010698
Training...
episode: 2341 no of steps: 186 score: 544.0 avg score: 2.9247 memorylength: 131072 epsilon: 0.1216143960640435
Training...
episode: 2342 no of steps: 185 score: 792.0 avg score: 4.2811 memorylength: 131072 epsilon: 0.12150499235563939
Training...
episode: 2343 no of steps: 172 score: 967.0 avg score: 5.6221 memorylength: 131072 epsilon: 0.12139568706627767
Training...
episode: 2344 no of steps: 183 score: 971.0 avg score: 5.306 memorylength: 131072 epsilon: 0.12128648010742095
Training...
episode: 2345 no of steps: 177 score: 981.0 avg score: 5.5424 memorylength: 131072 epsilon: 0.12117737139061167
Training...
episode: 2346 no of steps: 176 score: 1047.0 avg score: 5.9489 memorylength: 131072 epsilon: 0.12106836082747177
Training...
episode: 2347 no of steps: 200 score: 900.0 avg score: 4.5 memorylength: 131072 epsilon: 0.12095944832970264
Training...
episode: 2348 no of steps: 169 score: 560.0 avg score: 3.3136 memorylength: 131072 epsilon: 0.12085063380908515
Training...
episode: 2349 no of steps: 167 score: 850.0 avg score: 5.0898 memorylength: 131072 epsilon: 0.12074191717747954
Training...
episode: 2350 no of steps: 176 score: 1037.0 avg score: 5.892 memorylength: 131072 epsilon: 0.12063329834682542
saving states...
Training...
episode: 2351 no of steps: 151 score: 1234.0 avg score: 8.1722 memorylength: 131072 epsilon: 0.12052477722914139
Training...
episode: 2352 no of steps: 177 score: 1062.0 avg score: 6.0 memorylength: 131072 epsilon: 0.12041635373652541
Training...
episode: 2353 no of steps: 149 score: 336.0 avg score: 2.255 memorylength: 131072 epsilon: 0.12030802778115444
Training...
episode: 2354 no of steps: 162 score: 655.0 avg score: 4.0432 memorylength: 131072 epsilon: 0.12019979927528451
Training...
episode: 2355 no of steps: 163 score: 684.0 avg score: 4.1963 memorylength: 131072 epsilon: 0.1200916681312504
Training...
episode: 2356 no of steps: 146 score: 579.0 avg score: 3.9658 memorylength: 131072 epsilon: 0.11998363426146595
Training...
episode: 2357 no of steps: 149 score: 701.0 avg score: 4.7047 memorylength: 131072 epsilon: 0.11987569757842376
Training...
episode: 2358 no of steps: 176 score: 930.0 avg score: 5.2841 memorylength: 131072 epsilon: 0.11976785799469501
Training...
episode: 2359 no of steps: 166 score: 765.0 avg score: 4.6084 memorylength: 131072 epsilon: 0.1196601154229297
Training...
episode: 2360 no of steps: 176 score: 1043.0 avg score: 5.9261 memorylength: 131072 epsilon: 0.11955246977585632
Training...
episode: 2361 no of steps: 160 score: 814.0 avg score: 5.0875 memorylength: 131072 epsilon: 0.11944492096628194
Training...
episode: 2362 no of steps: 158 score: 571.0 avg score: 3.6139 memorylength: 131072 epsilon: 0.1193374689070919
Training...
episode: 2363 no of steps: 150 score: 819.0 avg score: 5.46 memorylength: 131072 epsilon: 0.11923011351125014
Training...
episode: 2364 no of steps: 152 score: 216.0 avg score: 1.4211 memorylength: 131072 epsilon: 0.11912285469179872
Training...
episode: 2365 no of steps: 133 score: 450.0 avg score: 3.3835 memorylength: 131072 epsilon: 0.11901569236185806
Training...
episode: 2366 no of steps: 147 score: 817.0 avg score: 5.5578 memorylength: 131072 epsilon: 0.11890862643462659
Training...
episode: 2367 no of steps: 143 score: 715.0 avg score: 5.0 memorylength: 131072 epsilon: 0.11880165682338091
Training...
episode: 2368 no of steps: 140 score: 552.0 avg score: 3.9429 memorylength: 131072 epsilon: 0.11869478344147572
Training...
episode: 2369 no of steps: 123 score: 450.0 avg score: 3.6585 memorylength: 131072 epsilon: 0.11858800620234346
Training...
episode: 2370 no of steps: 165 score: 670.0 avg score: 4.0606 memorylength: 131072 epsilon: 0.11848132501949458
Training...
episode: 2371 no of steps: 156 score: 455.0 avg score: 2.9167 memorylength: 131072 epsilon: 0.11837473980651736
Training...
episode: 2372 no of steps: 189 score: 846.0 avg score: 4.4762 memorylength: 131072 epsilon: 0.11826825047707781
Training...
episode: 2373 no of steps: 173 score: 628.0 avg score: 3.6301 memorylength: 131072 epsilon: 0.11816185694491947
Training...
episode: 2374 no of steps: 191 score: 515.0 avg score: 2.6963 memorylength: 131072 epsilon: 0.1180555591238636
Training...
episode: 2375 no of steps: 177 score: 965.0 avg score: 5.452 memorylength: 131072 epsilon: 0.11794935692780903
Training...
episode: 2376 no of steps: 165 score: 753.0 avg score: 4.5636 memorylength: 131072 epsilon: 0.11784325027073188
Training...
episode: 2377 no of steps: 188 score: 676.0 avg score: 3.5957 memorylength: 131072 epsilon: 0.11773723906668578
Training...
episode: 2378 no of steps: 182 score: 657.0 avg score: 3.6099 memorylength: 131072 epsilon: 0.11763132322980167
Training...
episode: 2379 no of steps: 153 score: 677.0 avg score: 4.4248 memorylength: 131072 epsilon: 0.11752550267428775
Training...
episode: 2380 no of steps: 133 score: 967.0 avg score: 7.2707 memorylength: 131072 epsilon: 0.11741977731442928
Training...
episode: 2381 no of steps: 142 score: 432.0 avg score: 3.0423 memorylength: 131072 epsilon: 0.11731414706458874
Training...
episode: 2382 no of steps: 158 score: 1273.0 avg score: 8.057 memorylength: 131072 epsilon: 0.11720861183920565
Training...
episode: 2383 no of steps: 147 score: 751.0 avg score: 5.1088 memorylength: 131072 epsilon: 0.11710317155279651
Training...
episode: 2384 no of steps: 156 score: 773.0 avg score: 4.9551 memorylength: 131072 epsilon: 0.11699782611995457
Training...
episode: 2385 no of steps: 189 score: 562.0 avg score: 2.9735 memorylength: 131072 epsilon: 0.11689257545535009
Training...
episode: 2386 no of steps: 160 score: 729.0 avg score: 4.5562 memorylength: 131072 epsilon: 0.11678741947373007
Training...
episode: 2387 no of steps: 199 score: 729.0 avg score: 3.6633 memorylength: 131072 epsilon: 0.11668235808991806
Training...
episode: 2388 no of steps: 182 score: 925.0 avg score: 5.0824 memorylength: 131072 epsilon: 0.11657739121881439
Training...
episode: 2389 no of steps: 188 score: 666.0 avg score: 3.5426 memorylength: 131072 epsilon: 0.11647251877539586
Training...
episode: 2390 no of steps: 200 score: 778.0 avg score: 3.89 memorylength: 131072 epsilon: 0.11636774067471586
Training...
episode: 2391 no of steps: 163 score: 873.0 avg score: 5.3558 memorylength: 131072 epsilon: 0.11626305683190402
Training...
episode: 2392 no of steps: 160 score: 301.0 avg score: 1.8812 memorylength: 131072 epsilon: 0.11615846716216649
Training...
episode: 2393 no of steps: 149 score: 620.0 avg score: 4.1611 memorylength: 131072 epsilon: 0.11605397158078565
Training...
episode: 2394 no of steps: 142 score: 520.0 avg score: 3.662 memorylength: 131072 epsilon: 0.11594957000311999
Training...
episode: 2395 no of steps: 135 score: 691.0 avg score: 5.1185 memorylength: 131072 epsilon: 0.11584526234460427
Training...
episode: 2396 no of steps: 133 score: 574.0 avg score: 4.3158 memorylength: 131072 epsilon: 0.11574104852074928
Training...
episode: 2397 no of steps: 132 score: 645.0 avg score: 4.8864 memorylength: 131072 epsilon: 0.11563692844714185
Training...
episode: 2398 no of steps: 135 score: 342.0 avg score: 2.5333 memorylength: 131072 epsilon: 0.11553290203944466
Training...
episode: 2399 no of steps: 142 score: 283.0 avg score: 1.993 memorylength: 131072 epsilon: 0.11542896921339633
Training...
episode: 2400 no of steps: 150 score: 496.0 avg score: 3.3067 memorylength: 131072 epsilon: 0.11532512988481129
saving states...
Training...
episode: 2401 no of steps: 166 score: 588.0 avg score: 3.5422 memorylength: 131072 epsilon: 0.1152213839695797
Training...
episode: 2402 no of steps: 208 score: 1030.0 avg score: 4.9519 memorylength: 131072 epsilon: 0.11511773138366727
Training...
episode: 2403 no of steps: 193 score: 886.0 avg score: 4.5907 memorylength: 131072 epsilon: 0.11501417204311547
Training...
episode: 2404 no of steps: 182 score: 831.0 avg score: 4.5659 memorylength: 131072 epsilon: 0.11491070586404124
Training...
episode: 2405 no of steps: 180 score: 763.0 avg score: 4.2389 memorylength: 131072 epsilon: 0.11480733276263691
Training...
episode: 2406 no of steps: 191 score: 990.0 avg score: 5.1832 memorylength: 131072 epsilon: 0.11470405265517028
Training...
episode: 2407 no of steps: 170 score: 1044.0 avg score: 6.1412 memorylength: 131072 epsilon: 0.1146008654579845
Training...
episode: 2408 no of steps: 143 score: 837.0 avg score: 5.8531 memorylength: 131072 epsilon: 0.11449777108749794
Training...
episode: 2409 no of steps: 146 score: 1006.0 avg score: 6.8904 memorylength: 131072 epsilon: 0.11439476946020405
Training...
episode: 2410 no of steps: 152 score: 863.0 avg score: 5.6776 memorylength: 131072 epsilon: 0.11429186049267161
Training...
episode: 2411 no of steps: 151 score: 927.0 avg score: 6.1391 memorylength: 131072 epsilon: 0.1141890441015443
Training...
episode: 2412 no of steps: 146 score: 576.0 avg score: 3.9452 memorylength: 131072 epsilon: 0.11408632020354093
Training...
episode: 2413 no of steps: 144 score: 778.0 avg score: 5.4028 memorylength: 131072 epsilon: 0.11398368871545497
Training...
episode: 2414 no of steps: 152 score: 992.0 avg score: 6.5263 memorylength: 131072 epsilon: 0.11388114955415504
Training...
episode: 2415 no of steps: 153 score: 664.0 avg score: 4.3399 memorylength: 131072 epsilon: 0.11377870263658439
Training...
episode: 2416 no of steps: 163 score: 1308.0 avg score: 8.0245 memorylength: 131072 epsilon: 0.11367634787976098
Training...
episode: 2417 no of steps: 196 score: 1105.0 avg score: 5.6378 memorylength: 131072 epsilon: 0.11357408520077746
Training...
episode: 2418 no of steps: 162 score: 967.0 avg score: 5.9691 memorylength: 131072 epsilon: 0.11347191451680104
Training...
episode: 2419 no of steps: 160 score: 859.0 avg score: 5.3688 memorylength: 131072 epsilon: 0.11336983574507356
Training...
episode: 2420 no of steps: 162 score: 945.0 avg score: 5.8333 memorylength: 131072 epsilon: 0.11326784880291106
Training...
episode: 2421 no of steps: 179 score: 718.0 avg score: 4.0112 memorylength: 131072 epsilon: 0.1131659536077042
Training...
episode: 2422 no of steps: 162 score: 830.0 avg score: 5.1235 memorylength: 131072 epsilon: 0.1130641500769179
Training...
episode: 2423 no of steps: 145 score: 686.0 avg score: 4.731 memorylength: 131072 epsilon: 0.11296243812809119
Training...
episode: 2424 no of steps: 164 score: 850.0 avg score: 5.1829 memorylength: 131072 epsilon: 0.11286081767883743
Training...
episode: 2425 no of steps: 131 score: 633.0 avg score: 4.8321 memorylength: 131072 epsilon: 0.11275928864684408
Training...
episode: 2426 no of steps: 163 score: 1078.0 avg score: 6.6135 memorylength: 131072 epsilon: 0.11265785094987263
Training...
episode: 2427 no of steps: 149 score: 692.0 avg score: 4.6443 memorylength: 131072 epsilon: 0.11255650450575848
Training...
episode: 2428 no of steps: 149 score: 490.0 avg score: 3.2886 memorylength: 131072 epsilon: 0.11245524923241101
Training...
episode: 2429 no of steps: 146 score: 738.0 avg score: 5.0548 memorylength: 131072 epsilon: 0.11235408504781348
Training...
episode: 2430 no of steps: 157 score: 516.0 avg score: 3.2866 memorylength: 131072 epsilon: 0.11225301187002293
Training...
episode: 2431 no of steps: 156 score: 1152.0 avg score: 7.3846 memorylength: 131072 epsilon: 0.11215202961716998
Training...
episode: 2432 no of steps: 175 score: 816.0 avg score: 4.6629 memorylength: 131072 epsilon: 0.11205113820745906
Training...
episode: 2433 no of steps: 166 score: 954.0 avg score: 5.747 memorylength: 131072 epsilon: 0.11195033755916815
Training...
episode: 2434 no of steps: 179 score: 1116.0 avg score: 6.2346 memorylength: 131072 epsilon: 0.11184962759064863
Training...
episode: 2435 no of steps: 172 score: 1078.0 avg score: 6.2674 memorylength: 131072 epsilon: 0.11174900822032549
Training...
episode: 2436 no of steps: 182 score: 1092.0 avg score: 6.0 memorylength: 131072 epsilon: 0.11164847936669701
Training...
episode: 2437 no of steps: 161 score: 792.0 avg score: 4.9193 memorylength: 131072 epsilon: 0.11154804094833488
Training...
episode: 2438 no of steps: 137 score: 704.0 avg score: 5.1387 memorylength: 131072 epsilon: 0.11144769288388387
Training...
episode: 2439 no of steps: 137 score: 621.0 avg score: 4.5328 memorylength: 131072 epsilon: 0.11134743509206207
Training...
episode: 2440 no of steps: 140 score: 746.0 avg score: 5.3286 memorylength: 131072 epsilon: 0.11124726749166076
Training...
episode: 2441 no of steps: 138 score: 882.0 avg score: 6.3913 memorylength: 131072 epsilon: 0.11114719000154402
Training...
episode: 2442 no of steps: 142 score: 652.0 avg score: 4.5915 memorylength: 131072 epsilon: 0.11104720254064919
Training...
episode: 2443 no of steps: 118 score: 422.0 avg score: 3.5763 memorylength: 131072 epsilon: 0.11094730502798636
Training...
episode: 2444 no of steps: 154 score: 747.0 avg score: 4.8506 memorylength: 131072 epsilon: 0.11084749738263863
Training...
episode: 2445 no of steps: 163 score: 1060.0 avg score: 6.5031 memorylength: 131072 epsilon: 0.1107477795237617
Training...
episode: 2446 no of steps: 175 score: 873.0 avg score: 4.9886 memorylength: 131072 epsilon: 0.11064815137058412
Training...
episode: 2447 no of steps: 192 score: 1189.0 avg score: 6.1927 memorylength: 131072 epsilon: 0.1105486128424071
Training...
episode: 2448 no of steps: 181 score: 935.0 avg score: 5.1657 memorylength: 131072 epsilon: 0.11044916385860451
Training...
episode: 2449 no of steps: 176 score: 552.0 avg score: 3.1364 memorylength: 131072 epsilon: 0.1103498043386225
Training...
episode: 2450 no of steps: 199 score: 1035.0 avg score: 5.201 memorylength: 131072 epsilon: 0.11025053420197996
saving states...
Training...
episode: 2451 no of steps: 160 score: 628.0 avg score: 3.925 memorylength: 131072 epsilon: 0.11015135336826809
Training...
episode: 2452 no of steps: 160 score: 859.0 avg score: 5.3688 memorylength: 131072 epsilon: 0.11005226175715031
Training...
episode: 2453 no of steps: 162 score: 985.0 avg score: 6.0802 memorylength: 131072 epsilon: 0.1099532592883625
Training...
episode: 2454 no of steps: 148 score: 540.0 avg score: 3.6486 memorylength: 131072 epsilon: 0.10985434588171258
Training...
episode: 2455 no of steps: 147 score: 794.0 avg score: 5.4014 memorylength: 131072 epsilon: 0.10975552145708083
Training...
episode: 2456 no of steps: 146 score: 1018.0 avg score: 6.9726 memorylength: 131072 epsilon: 0.10965678593441927
Training...
episode: 2457 no of steps: 141 score: 747.0 avg score: 5.2979 memorylength: 131072 epsilon: 0.10955813923375225
Training...
episode: 2458 no of steps: 149 score: 499.0 avg score: 3.349 memorylength: 131072 epsilon: 0.10945958127517592
Training...
episode: 2459 no of steps: 141 score: 381.0 avg score: 2.7021 memorylength: 131072 epsilon: 0.10936111197885827
Training...
episode: 2460 no of steps: 154 score: 816.0 avg score: 5.2987 memorylength: 131072 epsilon: 0.1092627312650392
Training...
episode: 2461 no of steps: 168 score: 885.0 avg score: 5.2679 memorylength: 131072 epsilon: 0.10916443905403034
Training...
episode: 2462 no of steps: 181 score: 967.0 avg score: 5.3425 memorylength: 131072 epsilon: 0.109066235266215
Training...
episode: 2463 no of steps: 206 score: 1235.0 avg score: 5.9951 memorylength: 131072 epsilon: 0.10896811982204808
Training...
episode: 2464 no of steps: 183 score: 945.0 avg score: 5.1639 memorylength: 131072 epsilon: 0.10887009264205605
Training...
episode: 2465 no of steps: 164 score: 839.0 avg score: 5.1159 memorylength: 131072 epsilon: 0.10877215364683691
Training...
episode: 2466 no of steps: 179 score: 944.0 avg score: 5.2737 memorylength: 131072 epsilon: 0.10867430275706012
Training...
episode: 2467 no of steps: 158 score: 589.0 avg score: 3.7278 memorylength: 131072 epsilon: 0.10857653989346638
Training...
episode: 2468 no of steps: 146 score: 542.0 avg score: 3.7123 memorylength: 131072 epsilon: 0.10847886497686776
Training...
episode: 2469 no of steps: 148 score: 738.0 avg score: 4.9865 memorylength: 131072 epsilon: 0.10838127792814767
Training...
episode: 2470 no of steps: 123 score: 614.0 avg score: 4.9919 memorylength: 131072 epsilon: 0.10828377866826047
Training...
episode: 2471 no of steps: 156 score: 1125.0 avg score: 7.2115 memorylength: 131072 epsilon: 0.10818636711823182
Training...
episode: 2472 no of steps: 137 score: 1170.0 avg score: 8.5401 memorylength: 131072 epsilon: 0.10808904319915834
Training...
episode: 2473 no of steps: 162 score: 976.0 avg score: 6.0247 memorylength: 131072 epsilon: 0.10799180683220772
Training...
episode: 2474 no of steps: 167 score: 1280.0 avg score: 7.6647 memorylength: 131072 epsilon: 0.10789465793861838
Training...
episode: 2475 no of steps: 165 score: 1053.0 avg score: 6.3818 memorylength: 131072 epsilon: 0.10779759643969979
Training...
episode: 2476 no of steps: 178 score: 913.0 avg score: 5.1292 memorylength: 131072 epsilon: 0.10770062225683208
Training...
episode: 2477 no of steps: 167 score: 1120.0 avg score: 6.7066 memorylength: 131072 epsilon: 0.10760373531146625
Training...
episode: 2478 no of steps: 175 score: 1170.0 avg score: 6.6857 memorylength: 131072 epsilon: 0.10750693552512376
Training...
episode: 2479 no of steps: 176 score: 391.0 avg score: 2.2216 memorylength: 131072 epsilon: 0.10741022281939683
Training...
episode: 2480 no of steps: 158 score: 860.0 avg score: 5.443 memorylength: 131072 epsilon: 0.10731359711594818
Training...
episode: 2481 no of steps: 158 score: 599.0 avg score: 3.7911 memorylength: 131072 epsilon: 0.10721705833651092
Training...
episode: 2482 no of steps: 151 score: 938.0 avg score: 6.2119 memorylength: 131072 epsilon: 0.10712060640288869
Training...
episode: 2483 no of steps: 143 score: 621.0 avg score: 4.3427 memorylength: 131072 epsilon: 0.1070242412369554
Training...
episode: 2484 no of steps: 141 score: 728.0 avg score: 5.1631 memorylength: 131072 epsilon: 0.1069279627606553
Training...
episode: 2485 no of steps: 183 score: 1132.0 avg score: 6.1858 memorylength: 131072 epsilon: 0.10683177089600274
Training...
episode: 2486 no of steps: 170 score: 1072.0 avg score: 6.3059 memorylength: 131072 epsilon: 0.10673566556508235
Training...
episode: 2487 no of steps: 151 score: 656.0 avg score: 4.3444 memorylength: 131072 epsilon: 0.10663964669004884
Training...
episode: 2488 no of steps: 174 score: 1168.0 avg score: 6.7126 memorylength: 131072 epsilon: 0.10654371419312686
Training...
episode: 2489 no of steps: 162 score: 884.0 avg score: 5.4568 memorylength: 131072 epsilon: 0.10644786799661107
Training...
episode: 2490 no of steps: 147 score: 1025.0 avg score: 6.9728 memorylength: 131072 epsilon: 0.1063521080228661
Training...
episode: 2491 no of steps: 149 score: 765.0 avg score: 5.1342 memorylength: 131072 epsilon: 0.10625643419432639
Training...
episode: 2492 no of steps: 171 score: 682.0 avg score: 3.9883 memorylength: 131072 epsilon: 0.10616084643349602
Training...
episode: 2493 no of steps: 146 score: 638.0 avg score: 4.3699 memorylength: 131072 epsilon: 0.10606534466294898
Training...
episode: 2494 no of steps: 163 score: 935.0 avg score: 5.7362 memorylength: 131072 epsilon: 0.10596992880532881
Training...
episode: 2495 no of steps: 154 score: 1142.0 avg score: 7.4156 memorylength: 131072 epsilon: 0.1058745987833487
Training...
episode: 2496 no of steps: 165 score: 972.0 avg score: 5.8909 memorylength: 131072 epsilon: 0.10577935451979127
Training...
episode: 2497 no of steps: 174 score: 873.0 avg score: 5.0172 memorylength: 131072 epsilon: 0.10568419593750868
Training...
episode: 2498 no of steps: 155 score: 1264.0 avg score: 8.1548 memorylength: 131072 epsilon: 0.10558912295942252
Training...
episode: 2499 no of steps: 169 score: 873.0 avg score: 5.1657 memorylength: 131072 epsilon: 0.10549413550852359
Training...
episode: 2500 no of steps: 160 score: 1088.0 avg score: 6.8 memorylength: 131072 epsilon: 0.10539923350787207
saving states...
Training...
episode: 2501 no of steps: 166 score: 1183.0 avg score: 7.1265 memorylength: 131072 epsilon: 0.10530441688059738
Training...
episode: 2502 no of steps: 153 score: 1141.0 avg score: 7.4575 memorylength: 131072 epsilon: 0.10520968554989805
Training...
episode: 2503 no of steps: 154 score: 861.0 avg score: 5.5909 memorylength: 131072 epsilon: 0.10511503943904163
Training...
episode: 2504 no of steps: 144 score: 877.0 avg score: 6.0903 memorylength: 131072 epsilon: 0.1050204784713648
Training...
episode: 2505 no of steps: 154 score: 758.0 avg score: 4.9221 memorylength: 131072 epsilon: 0.10492600257027322
Training...
episode: 2506 no of steps: 165 score: 1015.0 avg score: 6.1515 memorylength: 131072 epsilon: 0.10483161165924132
Training...
episode: 2507 no of steps: 148 score: 618.0 avg score: 4.1757 memorylength: 131072 epsilon: 0.10473730566181248
Training...
episode: 2508 no of steps: 153 score: 1042.0 avg score: 6.8105 memorylength: 131072 epsilon: 0.10464308450159886
Training...
episode: 2509 no of steps: 153 score: 720.0 avg score: 4.7059 memorylength: 131072 epsilon: 0.10454894810228135
Training...
episode: 2510 no of steps: 157 score: 873.0 avg score: 5.5605 memorylength: 131072 epsilon: 0.10445489638760938
Training...
episode: 2511 no of steps: 157 score: 607.0 avg score: 3.8662 memorylength: 131072 epsilon: 0.10436092928140109
Training...
episode: 2512 no of steps: 165 score: 862.0 avg score: 5.2242 memorylength: 131072 epsilon: 0.10426704670754314
Training...
episode: 2513 no of steps: 164 score: 999.0 avg score: 6.0915 memorylength: 131072 epsilon: 0.10417324858999065
Training...
episode: 2514 no of steps: 180 score: 800.0 avg score: 4.4444 memorylength: 131072 epsilon: 0.10407953485276707
Training...
episode: 2515 no of steps: 168 score: 889.0 avg score: 5.2917 memorylength: 131072 epsilon: 0.1039859054199643
Training...
episode: 2516 no of steps: 170 score: 1035.0 avg score: 6.0882 memorylength: 131072 epsilon: 0.10389236021574258
Training...
episode: 2517 no of steps: 164 score: 952.0 avg score: 5.8049 memorylength: 131072 epsilon: 0.10379889916433016
Training...
episode: 2518 no of steps: 159 score: 803.0 avg score: 5.0503 memorylength: 131072 epsilon: 0.10370552219002363
Training...
episode: 2519 no of steps: 146 score: 670.0 avg score: 4.589 memorylength: 131072 epsilon: 0.10361222921718766
Training...
episode: 2520 no of steps: 147 score: 666.0 avg score: 4.5306 memorylength: 131072 epsilon: 0.10351902017025494
Training...
episode: 2521 no of steps: 144 score: 665.0 avg score: 4.6181 memorylength: 131072 epsilon: 0.10342589497372609
Training...
episode: 2522 no of steps: 146 score: 421.0 avg score: 2.8836 memorylength: 131072 epsilon: 0.10333285355216972
Training...
episode: 2523 no of steps: 142 score: 391.0 avg score: 2.7535 memorylength: 131072 epsilon: 0.10323989583022232
Training...
episode: 2524 no of steps: 138 score: 795.0 avg score: 5.7609 memorylength: 131072 epsilon: 0.10314702173258805
Training...
episode: 2525 no of steps: 160 score: 736.0 avg score: 4.6 memorylength: 131072 epsilon: 0.10305423118403892
Training...
episode: 2526 no of steps: 165 score: 846.0 avg score: 5.1273 memorylength: 131072 epsilon: 0.10296152410941457
Training...
episode: 2527 no of steps: 169 score: 1089.0 avg score: 6.4438 memorylength: 131072 epsilon: 0.10286890043362233
Training...
episode: 2528 no of steps: 189 score: 1226.0 avg score: 6.4868 memorylength: 131072 epsilon: 0.10277636008163693
Training...
episode: 2529 no of steps: 167 score: 1263.0 avg score: 7.5629 memorylength: 131072 epsilon: 0.1026839029785007
Training...
episode: 2530 no of steps: 184 score: 1035.0 avg score: 5.625 memorylength: 131072 epsilon: 0.10259152904932342
Training...
episode: 2531 no of steps: 177 score: 992.0 avg score: 5.6045 memorylength: 131072 epsilon: 0.10249923821928221
Training...
episode: 2532 no of steps: 162 score: 692.0 avg score: 4.2716 memorylength: 131072 epsilon: 0.10240703041362142
Training...
episode: 2533 no of steps: 165 score: 1170.0 avg score: 7.0909 memorylength: 131072 epsilon: 0.10231490555765275
Training...
episode: 2534 no of steps: 151 score: 1201.0 avg score: 7.9536 memorylength: 131072 epsilon: 0.10222286357675514
Training...
episode: 2535 no of steps: 153 score: 721.0 avg score: 4.7124 memorylength: 131072 epsilon: 0.10213090439637447
Training...
episode: 2536 no of steps: 148 score: 579.0 avg score: 3.9122 memorylength: 131072 epsilon: 0.10203902794202384
Training...
episode: 2537 no of steps: 150 score: 936.0 avg score: 6.24 memorylength: 131072 epsilon: 0.10194723413928332
Training...
episode: 2538 no of steps: 153 score: 756.0 avg score: 4.9412 memorylength: 131072 epsilon: 0.10185552291379997
Training...
episode: 2539 no of steps: 153 score: 835.0 avg score: 5.4575 memorylength: 131072 epsilon: 0.1017638941912876
Training...
episode: 2540 no of steps: 150 score: 507.0 avg score: 3.38 memorylength: 131072 epsilon: 0.101672347897527
Training...
episode: 2541 no of steps: 149 score: 495.0 avg score: 3.3221 memorylength: 131072 epsilon: 0.10158088395836565
Training...
episode: 2542 no of steps: 160 score: 706.0 avg score: 4.4125 memorylength: 131072 epsilon: 0.10148950229971782
Training...
episode: 2543 no of steps: 176 score: 958.0 avg score: 5.4432 memorylength: 131072 epsilon: 0.10139820284756423
Training...
episode: 2544 no of steps: 170 score: 693.0 avg score: 4.0765 memorylength: 131072 epsilon: 0.1013069855279524
Training...
episode: 2545 no of steps: 212 score: 1273.0 avg score: 6.0047 memorylength: 131072 epsilon: 0.10121585026699635
Training...
episode: 2546 no of steps: 154 score: 932.0 avg score: 6.0519 memorylength: 131072 epsilon: 0.10112479699087638
Training...
episode: 2547 no of steps: 186 score: 1044.0 avg score: 5.6129 memorylength: 131072 epsilon: 0.10103382562583942
Training...
episode: 2548 no of steps: 169 score: 998.0 avg score: 5.9053 memorylength: 131072 epsilon: 0.10094293609819863
Training...
episode: 2549 no of steps: 150 score: 1032.0 avg score: 6.88 memorylength: 131072 epsilon: 0.10085212833433355
Training...
episode: 2550 no of steps: 145 score: 615.0 avg score: 4.2414 memorylength: 131072 epsilon: 0.10076140226068979
saving states...
Training...
episode: 2551 no of steps: 148 score: 801.0 avg score: 5.4122 memorylength: 131072 epsilon: 0.10067075780377926
Training...
episode: 2552 no of steps: 140 score: 690.0 avg score: 4.9286 memorylength: 131072 epsilon: 0.10058019489018001
Training...
episode: 2553 no of steps: 143 score: 675.0 avg score: 4.7203 memorylength: 131072 epsilon: 0.10048971344653597
Training...
episode: 2554 no of steps: 150 score: 998.0 avg score: 6.6533 memorylength: 131072 epsilon: 0.10039931339955721
Training...
episode: 2555 no of steps: 162 score: 863.0 avg score: 5.3272 memorylength: 131072 epsilon: 0.10030899467601971
Training...
episode: 2556 no of steps: 156 score: 324.0 avg score: 2.0769 memorylength: 131072 epsilon: 0.10021875720276532
Training...
episode: 2557 no of steps: 168 score: 904.0 avg score: 5.381 memorylength: 131072 epsilon: 0.10012860090670159
Training...
episode: 2558 no of steps: 161 score: 1050.0 avg score: 6.5217 memorylength: 131072 epsilon: 0.10003852571480198
Training...
episode: 2559 no of steps: 179 score: 786.0 avg score: 4.3911 memorylength: 131072 epsilon: 0.09994853155410557
Training...
episode: 2560 no of steps: 165 score: 1139.0 avg score: 6.903 memorylength: 131072 epsilon: 0.09985861835171712
Training...
episode: 2561 no of steps: 181 score: 976.0 avg score: 5.3923 memorylength: 131072 epsilon: 0.09976878603480685
Training...
episode: 2562 no of steps: 174 score: 772.0 avg score: 4.4368 memorylength: 131072 epsilon: 0.09967903453061062
Training...
episode: 2563 no of steps: 158 score: 751.0 avg score: 4.7532 memorylength: 131072 epsilon: 0.09958936376642978
Training...
episode: 2564 no of steps: 162 score: 739.0 avg score: 4.5617 memorylength: 131072 epsilon: 0.09949977366963086
Training...
episode: 2565 no of steps: 148 score: 733.0 avg score: 4.9527 memorylength: 131072 epsilon: 0.09941026416764598
Training...
episode: 2566 no of steps: 157 score: 786.0 avg score: 5.0064 memorylength: 131072 epsilon: 0.09932083518797238
Training...
episode: 2567 no of steps: 137 score: 1052.0 avg score: 7.6788 memorylength: 131072 epsilon: 0.09923148665817268
Training...
episode: 2568 no of steps: 136 score: 700.0 avg score: 5.1471 memorylength: 131072 epsilon: 0.09914221850587444
Training...
episode: 2569 no of steps: 138 score: 855.0 avg score: 6.1957 memorylength: 131072 epsilon: 0.09905303065877051
Training...
episode: 2570 no of steps: 150 score: 436.0 avg score: 2.9067 memorylength: 131072 epsilon: 0.09896392304461879
Training...
episode: 2571 no of steps: 157 score: 674.0 avg score: 4.293 memorylength: 131072 epsilon: 0.09887489559124199
Training...
episode: 2572 no of steps: 174 score: 566.0 avg score: 3.2529 memorylength: 131072 epsilon: 0.09878594822652793
Training...
episode: 2573 no of steps: 170 score: 693.0 avg score: 4.0765 memorylength: 131072 epsilon: 0.09869708087842922
Training...
episode: 2574 no of steps: 171 score: 385.0 avg score: 2.2515 memorylength: 131072 epsilon: 0.09860829347496339
Training...
episode: 2575 no of steps: 202 score: 872.0 avg score: 4.3168 memorylength: 131072 epsilon: 0.0985195859442125
Training...
episode: 2576 no of steps: 186 score: 799.0 avg score: 4.2957 memorylength: 131072 epsilon: 0.09843095821432353
Training...
episode: 2577 no of steps: 162 score: 1182.0 avg score: 7.2963 memorylength: 131072 epsilon: 0.09834241021350797
Training...
episode: 2578 no of steps: 153 score: 508.0 avg score: 3.3203 memorylength: 131072 epsilon: 0.09825394187004204
Training...
episode: 2579 no of steps: 175 score: 781.0 avg score: 4.4629 memorylength: 131072 epsilon: 0.09816555311226621
Training...
episode: 2580 no of steps: 167 score: 849.0 avg score: 5.0838 memorylength: 131072 epsilon: 0.0980772438685857
Training...
episode: 2581 no of steps: 169 score: 931.0 avg score: 5.5089 memorylength: 131072 epsilon: 0.09798901406747001
Training...
episode: 2582 no of steps: 143 score: 881.0 avg score: 6.1608 memorylength: 131072 epsilon: 0.09790086363745293
Training...
episode: 2583 no of steps: 141 score: 922.0 avg score: 6.539 memorylength: 131072 epsilon: 0.09781279250713266
Training...
episode: 2584 no of steps: 161 score: 957.0 avg score: 5.9441 memorylength: 131072 epsilon: 0.09772480060517157
Training...
episode: 2585 no of steps: 152 score: 516.0 avg score: 3.3947 memorylength: 131072 epsilon: 0.09763688786029626
Training...
episode: 2586 no of steps: 164 score: 927.0 avg score: 5.6524 memorylength: 131072 epsilon: 0.0975490542012973
Training...
episode: 2587 no of steps: 154 score: 900.0 avg score: 5.8442 memorylength: 131072 epsilon: 0.09746129955702948
Training...
episode: 2588 no of steps: 195 score: 918.0 avg score: 4.7077 memorylength: 131072 epsilon: 0.09737362385641157
Training...
episode: 2589 no of steps: 172 score: 1085.0 avg score: 6.3081 memorylength: 131072 epsilon: 0.09728602702842616
Training...
episode: 2590 no of steps: 159 score: 916.0 avg score: 5.761 memorylength: 131072 epsilon: 0.09719850900211986
Training...
episode: 2591 no of steps: 169 score: 1143.0 avg score: 6.7633 memorylength: 131072 epsilon: 0.09711106970660309
Training...
episode: 2592 no of steps: 164 score: 769.0 avg score: 4.689 memorylength: 131072 epsilon: 0.09702370907105001
Training...
episode: 2593 no of steps: 174 score: 944.0 avg score: 5.4253 memorylength: 131072 epsilon: 0.09693642702469846
Training...
episode: 2594 no of steps: 172 score: 1043.0 avg score: 6.064 memorylength: 131072 epsilon: 0.09684922349684999
Training...
episode: 2595 no of steps: 156 score: 935.0 avg score: 5.9936 memorylength: 131072 epsilon: 0.09676209841686974
Training...
episode: 2596 no of steps: 134 score: 561.0 avg score: 4.1866 memorylength: 131072 epsilon: 0.09667505171418646
Training...
episode: 2597 no of steps: 144 score: 899.0 avg score: 6.2431 memorylength: 131072 epsilon: 0.09658808331829219
Training...
episode: 2598 no of steps: 141 score: 629.0 avg score: 4.461 memorylength: 131072 epsilon: 0.0965011931587426
Training...
episode: 2599 no of steps: 153 score: 1063.0 avg score: 6.9477 memorylength: 131072 epsilon: 0.09641438116515669
Training...
episode: 2600 no of steps: 160 score: 738.0 avg score: 4.6125 memorylength: 131072 epsilon: 0.09632764726721664
saving states...
Training...
episode: 2601 no of steps: 134 score: 533.0 avg score: 3.9776 memorylength: 131072 epsilon: 0.09624099139466805
Training...
episode: 2602 no of steps: 171 score: 719.0 avg score: 4.2047 memorylength: 131072 epsilon: 0.09615441347731965
Training...
episode: 2603 no of steps: 157 score: 309.0 avg score: 1.9682 memorylength: 131072 epsilon: 0.09606791344504337
Training...
episode: 2604 no of steps: 188 score: 798.0 avg score: 4.2447 memorylength: 131072 epsilon: 0.0959814912277741
Training...
episode: 2605 no of steps: 167 score: 765.0 avg score: 4.5808 memorylength: 131072 epsilon: 0.09589514675550986
Training...
episode: 2606 no of steps: 182 score: 859.0 avg score: 4.7198 memorylength: 131072 epsilon: 0.09580887995831162
Training...
episode: 2607 no of steps: 176 score: 946.0 avg score: 5.375 memorylength: 131072 epsilon: 0.09572269076630335
Training...
episode: 2608 no of steps: 172 score: 1170.0 avg score: 6.8023 memorylength: 131072 epsilon: 0.09563657910967169
Training...
episode: 2609 no of steps: 177 score: 1002.0 avg score: 5.661 memorylength: 131072 epsilon: 0.09555054491866623
Training...
episode: 2610 no of steps: 169 score: 1015.0 avg score: 6.0059 memorylength: 131072 epsilon: 0.09546458812359934
Training...
episode: 2611 no of steps: 163 score: 970.0 avg score: 5.9509 memorylength: 131072 epsilon: 0.09537870865484588
Training...
episode: 2612 no of steps: 145 score: 827.0 avg score: 5.7034 memorylength: 131072 epsilon: 0.09529290644284356
Training...
episode: 2613 no of steps: 142 score: 754.0 avg score: 5.3099 memorylength: 131072 epsilon: 0.09520718141809258
Training...
episode: 2614 no of steps: 137 score: 657.0 avg score: 4.7956 memorylength: 131072 epsilon: 0.09512153351115568
Training...
episode: 2615 no of steps: 145 score: 908.0 avg score: 6.2621 memorylength: 131072 epsilon: 0.09503596265265797
Training...
episode: 2616 no of steps: 131 score: 603.0 avg score: 4.6031 memorylength: 131072 epsilon: 0.09495046877328712
Training...
episode: 2617 no of steps: 154 score: 913.0 avg score: 5.9286 memorylength: 131072 epsilon: 0.09486505180379311
Training...
episode: 2618 no of steps: 154 score: 624.0 avg score: 4.0519 memorylength: 131072 epsilon: 0.09477971167498811
Training...
episode: 2619 no of steps: 189 score: 834.0 avg score: 4.4127 memorylength: 131072 epsilon: 0.09469444831774665
Training...
episode: 2620 no of steps: 169 score: 668.0 avg score: 3.9527 memorylength: 131072 epsilon: 0.09460926166300539
Training...
episode: 2621 no of steps: 150 score: 699.0 avg score: 4.66 memorylength: 131072 epsilon: 0.09452415164176321
Training...
episode: 2622 no of steps: 147 score: 776.0 avg score: 5.2789 memorylength: 131072 epsilon: 0.09443911818508087
Training...
episode: 2623 no of steps: 164 score: 835.0 avg score: 5.0915 memorylength: 131072 epsilon: 0.09435416122408134
Training...
episode: 2624 no of steps: 149 score: 868.0 avg score: 5.8255 memorylength: 131072 epsilon: 0.09426928068994946
Training...
episode: 2625 no of steps: 169 score: 481.0 avg score: 2.8462 memorylength: 131072 epsilon: 0.094184476513932
Training...
episode: 2626 no of steps: 161 score: 1384.0 avg score: 8.5963 memorylength: 131072 epsilon: 0.09409974862733755
Training...
episode: 2627 no of steps: 163 score: 1397.0 avg score: 8.5706 memorylength: 131072 epsilon: 0.09401509696153654
Training...
episode: 2628 no of steps: 147 score: 918.0 avg score: 6.2449 memorylength: 131072 epsilon: 0.09393052144796114
Training...
episode: 2629 no of steps: 142 score: 958.0 avg score: 6.7465 memorylength: 131072 epsilon: 0.09384602201810512
Training...
episode: 2630 no of steps: 133 score: 949.0 avg score: 7.1353 memorylength: 131072 epsilon: 0.09376159860352395
Training...
episode: 2631 no of steps: 157 score: 924.0 avg score: 5.8854 memorylength: 131072 epsilon: 0.09367725113583468
Training...
episode: 2632 no of steps: 155 score: 571.0 avg score: 3.6839 memorylength: 131072 epsilon: 0.0935929795467159
Training...
episode: 2633 no of steps: 172 score: 1137.0 avg score: 6.6105 memorylength: 131072 epsilon: 0.09350878376790751
Training...
episode: 2634 no of steps: 179 score: 1320.0 avg score: 7.3743 memorylength: 131072 epsilon: 0.093424663731211
Training...
episode: 2635 no of steps: 164 score: 1000.0 avg score: 6.0976 memorylength: 131072 epsilon: 0.09334061936848917
Training...
episode: 2636 no of steps: 171 score: 1066.0 avg score: 6.2339 memorylength: 131072 epsilon: 0.09325665061166596
Training...
episode: 2637 no of steps: 165 score: 648.0 avg score: 3.9273 memorylength: 131072 epsilon: 0.09317275739272678
Training...
episode: 2638 no of steps: 170 score: 868.0 avg score: 5.1059 memorylength: 131072 epsilon: 0.09308893964371806
Training...
episode: 2639 no of steps: 165 score: 1064.0 avg score: 6.4485 memorylength: 131072 epsilon: 0.0930051972967475
Training...
episode: 2640 no of steps: 166 score: 965.0 avg score: 5.8133 memorylength: 131072 epsilon: 0.09292153028398367
Training...
episode: 2641 no of steps: 173 score: 911.0 avg score: 5.2659 memorylength: 131072 epsilon: 0.09283793853765636
Training...
episode: 2642 no of steps: 151 score: 1007.0 avg score: 6.6689 memorylength: 131072 epsilon: 0.09275442199005625
Training...
episode: 2643 no of steps: 148 score: 1244.0 avg score: 8.4054 memorylength: 131072 epsilon: 0.09267098057353496
Training...
episode: 2644 no of steps: 148 score: 866.0 avg score: 5.8514 memorylength: 131072 epsilon: 0.09258761422050486
Training...
episode: 2645 no of steps: 159 score: 439.0 avg score: 2.761 memorylength: 131072 epsilon: 0.09250432286343925
Training...
episode: 2646 no of steps: 143 score: 967.0 avg score: 6.7622 memorylength: 131072 epsilon: 0.09242110643487216
Training...
episode: 2647 no of steps: 165 score: 471.0 avg score: 2.8545 memorylength: 131072 epsilon: 0.09233796486739816
Training...
episode: 2648 no of steps: 169 score: 472.0 avg score: 2.7929 memorylength: 131072 epsilon: 0.09225489809367267
Training...
episode: 2649 no of steps: 159 score: 701.0 avg score: 4.4088 memorylength: 131072 epsilon: 0.0921719060464116
Training...
episode: 2650 no of steps: 154 score: 774.0 avg score: 5.026 memorylength: 131072 epsilon: 0.0920889886583914
saving states...
Training...
episode: 2651 no of steps: 176 score: 961.0 avg score: 5.4602 memorylength: 131072 epsilon: 0.09200614586244889
Training...
episode: 2652 no of steps: 175 score: 841.0 avg score: 4.8057 memorylength: 131072 epsilon: 0.09192337759148146
Training...
episode: 2653 no of steps: 151 score: 1215.0 avg score: 8.0464 memorylength: 131072 epsilon: 0.09184068377844681
Training...
episode: 2654 no of steps: 183 score: 1191.0 avg score: 6.5082 memorylength: 131072 epsilon: 0.091758064356363
Training...
episode: 2655 no of steps: 174 score: 1260.0 avg score: 7.2414 memorylength: 131072 epsilon: 0.09167551925830818
Training...
episode: 2656 no of steps: 164 score: 1056.0 avg score: 6.439 memorylength: 131072 epsilon: 0.09159304841742086
Training...
episode: 2657 no of steps: 140 score: 1070.0 avg score: 7.6429 memorylength: 131072 epsilon: 0.09151065176689972
Training...
episode: 2658 no of steps: 154 score: 901.0 avg score: 5.8506 memorylength: 131072 epsilon: 0.09142832924000338
Training...
episode: 2659 no of steps: 132 score: 871.0 avg score: 6.5985 memorylength: 131072 epsilon: 0.09134608077005062
Training...
episode: 2660 no of steps: 136 score: 546.0 avg score: 4.0147 memorylength: 131072 epsilon: 0.09126390629042017
Training...
episode: 2661 no of steps: 158 score: 782.0 avg score: 4.9494 memorylength: 131072 epsilon: 0.09118180573455074
Training...
episode: 2662 no of steps: 159 score: 682.0 avg score: 4.2893 memorylength: 131072 epsilon: 0.09109977903594081
Training...
episode: 2663 no of steps: 147 score: 583.0 avg score: 3.966 memorylength: 131072 epsilon: 0.0910178261281488
Training...
episode: 2664 no of steps: 175 score: 733.0 avg score: 4.1886 memorylength: 131072 epsilon: 0.09093594694479284
Training...
episode: 2665 no of steps: 169 score: 669.0 avg score: 3.9586 memorylength: 131072 epsilon: 0.09085414141955074
Training...
episode: 2666 no of steps: 182 score: 718.0 avg score: 3.9451 memorylength: 131072 epsilon: 0.09077240948616007
Training...
episode: 2667 no of steps: 181 score: 630.0 avg score: 3.4807 memorylength: 131072 epsilon: 0.09069075107841794
Training...
episode: 2668 no of steps: 177 score: 945.0 avg score: 5.339 memorylength: 131072 epsilon: 0.09060916613018108
Training...
episode: 2669 no of steps: 172 score: 852.0 avg score: 4.9535 memorylength: 131072 epsilon: 0.0905276545753656
Training...
episode: 2670 no of steps: 153 score: 882.0 avg score: 5.7647 memorylength: 131072 epsilon: 0.09044621634794718
Training...
episode: 2671 no of steps: 172 score: 765.0 avg score: 4.4477 memorylength: 131072 epsilon: 0.09036485138196085
Training...
episode: 2672 no of steps: 174 score: 1340.0 avg score: 7.7011 memorylength: 131072 epsilon: 0.09028355961150102
Training...
episode: 2673 no of steps: 188 score: 899.0 avg score: 4.7819 memorylength: 131072 epsilon: 0.09020234097072127
Training...
episode: 2674 no of steps: 164 score: 1170.0 avg score: 7.1341 memorylength: 131072 epsilon: 0.09012119539383452
Training...
episode: 2675 no of steps: 146 score: 920.0 avg score: 6.3014 memorylength: 131072 epsilon: 0.09004012281511292
Training...
episode: 2676 no of steps: 148 score: 849.0 avg score: 5.7365 memorylength: 131072 epsilon: 0.08995912316888759
Training...
episode: 2677 no of steps: 167 score: 877.0 avg score: 5.2515 memorylength: 131072 epsilon: 0.08987819638954883
Training...
episode: 2678 no of steps: 152 score: 1061.0 avg score: 6.9803 memorylength: 131072 epsilon: 0.08979734241154598
Training...
episode: 2679 no of steps: 154 score: 682.0 avg score: 4.4286 memorylength: 131072 epsilon: 0.08971656116938732
Training...
episode: 2680 no of steps: 134 score: 560.0 avg score: 4.1791 memorylength: 131072 epsilon: 0.08963585259763997
Training...
episode: 2681 no of steps: 141 score: 378.0 avg score: 2.6809 memorylength: 131072 epsilon: 0.08955521663093004
Training...
episode: 2682 no of steps: 131 score: 628.0 avg score: 4.7939 memorylength: 131072 epsilon: 0.0894746532039424
Training...
episode: 2683 no of steps: 139 score: 566.0 avg score: 4.0719 memorylength: 131072 epsilon: 0.08939416225142063
Training...
episode: 2684 no of steps: 155 score: 953.0 avg score: 6.1484 memorylength: 131072 epsilon: 0.08931374370816704
Training...
episode: 2685 no of steps: 172 score: 762.0 avg score: 4.4302 memorylength: 131072 epsilon: 0.08923339750904266
Training...
episode: 2686 no of steps: 175 score: 1376.0 avg score: 7.8629 memorylength: 131072 epsilon: 0.08915312358896707
Training...
episode: 2687 no of steps: 171 score: 911.0 avg score: 5.3275 memorylength: 131072 epsilon: 0.08907292188291834
Training...
episode: 2688 no of steps: 178 score: 1109.0 avg score: 6.2303 memorylength: 131072 epsilon: 0.08899279232593307
Training...
episode: 2689 no of steps: 181 score: 1384.0 avg score: 7.6464 memorylength: 131072 epsilon: 0.08891273485310638
Training...
episode: 2690 no of steps: 209 score: 1251.0 avg score: 5.9856 memorylength: 131072 epsilon: 0.08883274939959171
Training...
episode: 2691 no of steps: 188 score: 1043.0 avg score: 5.5479 memorylength: 131072 epsilon: 0.08875283590060078
Training...
episode: 2692 no of steps: 171 score: 684.0 avg score: 4.0 memorylength: 131072 epsilon: 0.08867299429140367
Training...
episode: 2693 no of steps: 154 score: 782.0 avg score: 5.0779 memorylength: 131072 epsilon: 0.08859322450732873
Training...
episode: 2694 no of steps: 165 score: 868.0 avg score: 5.2606 memorylength: 131072 epsilon: 0.08851352648376236
Training...
episode: 2695 no of steps: 142 score: 783.0 avg score: 5.5141 memorylength: 131072 epsilon: 0.08843390015614915
Training...
episode: 2696 no of steps: 153 score: 981.0 avg score: 6.4118 memorylength: 131072 epsilon: 0.08835434545999182
Training...
episode: 2697 no of steps: 138 score: 384.0 avg score: 2.7826 memorylength: 131072 epsilon: 0.08827486233085108
Training...
episode: 2698 no of steps: 131 score: 733.0 avg score: 5.5954 memorylength: 131072 epsilon: 0.08819545070434551
Training...
episode: 2699 no of steps: 138 score: 832.0 avg score: 6.029 memorylength: 131072 epsilon: 0.08811611051615174
Training...
episode: 2700 no of steps: 144 score: 512.0 avg score: 3.5556 memorylength: 131072 epsilon: 0.08803684170200425
saving states...
Training...
episode: 2701 no of steps: 149 score: 843.0 avg score: 5.6577 memorylength: 131072 epsilon: 0.08795764419769521
Training...
episode: 2702 no of steps: 191 score: 804.0 avg score: 4.2094 memorylength: 131072 epsilon: 0.08787851793907468
Training...
episode: 2703 no of steps: 179 score: 632.0 avg score: 3.5307 memorylength: 131072 epsilon: 0.08779946286205037
Training...
episode: 2704 no of steps: 168 score: 1116.0 avg score: 6.6429 memorylength: 131072 epsilon: 0.08772047890258773
Training...
episode: 2705 no of steps: 170 score: 934.0 avg score: 5.4941 memorylength: 131072 epsilon: 0.08764156599670965
Training...
episode: 2706 no of steps: 159 score: 767.0 avg score: 4.8239 memorylength: 131072 epsilon: 0.08756272408049673
Training...
episode: 2707 no of steps: 146 score: 674.0 avg score: 4.6164 memorylength: 131072 epsilon: 0.087483953090087
Training...
episode: 2708 no of steps: 153 score: 594.0 avg score: 3.8824 memorylength: 131072 epsilon: 0.08740525296167599
Training...
episode: 2709 no of steps: 148 score: 1093.0 avg score: 7.3851 memorylength: 131072 epsilon: 0.08732662363151653
Training...
episode: 2710 no of steps: 138 score: 801.0 avg score: 5.8043 memorylength: 131072 epsilon: 0.08724806503591888
Training...
episode: 2711 no of steps: 152 score: 385.0 avg score: 2.5329 memorylength: 131072 epsilon: 0.0871695771112506
Training...
episode: 2712 no of steps: 136 score: 719.0 avg score: 5.2868 memorylength: 131072 epsilon: 0.08709115979393643
Training...
episode: 2713 no of steps: 167 score: 804.0 avg score: 4.8144 memorylength: 131072 epsilon: 0.08701281302045835
Training...
episode: 2714 no of steps: 172 score: 666.0 avg score: 3.8721 memorylength: 131072 epsilon: 0.08693453672735547
Training...
episode: 2715 no of steps: 171 score: 718.0 avg score: 4.1988 memorylength: 131072 epsilon: 0.08685633085122405
Training...
episode: 2716 no of steps: 171 score: 601.0 avg score: 3.5146 memorylength: 131072 epsilon: 0.08677819532871721
Training...
episode: 2717 no of steps: 177 score: 666.0 avg score: 3.7627 memorylength: 131072 epsilon: 0.08670013009654522
Training...
episode: 2718 no of steps: 171 score: 629.0 avg score: 3.6784 memorylength: 131072 epsilon: 0.08662213509147527
Training...
episode: 2719 no of steps: 165 score: 719.0 avg score: 4.3576 memorylength: 131072 epsilon: 0.08654421025033142
Training...
episode: 2720 no of steps: 178 score: 802.0 avg score: 4.5056 memorylength: 131072 epsilon: 0.08646635550999444
Training...
episode: 2721 no of steps: 131 score: 687.0 avg score: 5.2443 memorylength: 131072 epsilon: 0.08638857080740209
Training...
episode: 2722 no of steps: 136 score: 854.0 avg score: 6.2794 memorylength: 131072 epsilon: 0.08631085607954872
Training...
episode: 2723 no of steps: 148 score: 857.0 avg score: 5.7905 memorylength: 131072 epsilon: 0.08623321126348538
Training...
episode: 2724 no of steps: 170 score: 984.0 avg score: 5.7882 memorylength: 131072 epsilon: 0.08615563629631977
Training...
episode: 2725 no of steps: 163 score: 1066.0 avg score: 6.5399 memorylength: 131072 epsilon: 0.08607813111521616
Training...
episode: 2726 no of steps: 144 score: 791.0 avg score: 5.4931 memorylength: 131072 epsilon: 0.0860006956573954
Training...
episode: 2727 no of steps: 167 score: 1008.0 avg score: 6.0359 memorylength: 131072 epsilon: 0.08592332986013469
Training...
episode: 2728 no of steps: 166 score: 972.0 avg score: 5.8554 memorylength: 131072 epsilon: 0.08584603366076778
Training...
episode: 2729 no of steps: 163 score: 1073.0 avg score: 6.5828 memorylength: 131072 epsilon: 0.08576880699668475
Training...
episode: 2730 no of steps: 165 score: 1020.0 avg score: 6.1818 memorylength: 131072 epsilon: 0.08569164980533193
Training...
episode: 2731 no of steps: 148 score: 702.0 avg score: 4.7432 memorylength: 131072 epsilon: 0.08561456202421205
Training...
episode: 2732 no of steps: 155 score: 728.0 avg score: 4.6968 memorylength: 131072 epsilon: 0.08553754359088399
Training...
episode: 2733 no of steps: 176 score: 751.0 avg score: 4.267 memorylength: 131072 epsilon: 0.08546059444296286
Training...
episode: 2734 no of steps: 163 score: 822.0 avg score: 5.0429 memorylength: 131072 epsilon: 0.08538371451811975
Training...
episode: 2735 no of steps: 159 score: 695.0 avg score: 4.3711 memorylength: 131072 epsilon: 0.08530690375408198
Training...
episode: 2736 no of steps: 188 score: 1249.0 avg score: 6.6436 memorylength: 131072 epsilon: 0.08523016208863281
Training...
episode: 2737 no of steps: 151 score: 917.0 avg score: 6.0728 memorylength: 131072 epsilon: 0.08515348945961154
Training...
episode: 2738 no of steps: 176 score: 935.0 avg score: 5.3125 memorylength: 131072 epsilon: 0.08507688580491322
Training...
episode: 2739 no of steps: 170 score: 1019.0 avg score: 5.9941 memorylength: 131072 epsilon: 0.08500035106248897
Training...
episode: 2740 no of steps: 152 score: 801.0 avg score: 5.2697 memorylength: 131072 epsilon: 0.08492388517034569
Training...
episode: 2741 no of steps: 165 score: 814.0 avg score: 4.9333 memorylength: 131072 epsilon: 0.08484748806654588
Training...
episode: 2742 no of steps: 149 score: 750.0 avg score: 5.0336 memorylength: 131072 epsilon: 0.08477115968920794
Training...
episode: 2743 no of steps: 148 score: 669.0 avg score: 4.5203 memorylength: 131072 epsilon: 0.0846948999765059
Training...
episode: 2744 no of steps: 155 score: 658.0 avg score: 4.2452 memorylength: 131072 epsilon: 0.08461870886666939
Training...
episode: 2745 no of steps: 147 score: 939.0 avg score: 6.3878 memorylength: 131072 epsilon: 0.08454258629798357
Training...
episode: 2746 no of steps: 147 score: 1401.0 avg score: 9.5306 memorylength: 131072 epsilon: 0.08446653220878915
Training...
episode: 2747 no of steps: 170 score: 1020.0 avg score: 6.0 memorylength: 131072 epsilon: 0.08439054653748239
Training...
episode: 2748 no of steps: 146 score: 935.0 avg score: 6.4041 memorylength: 131072 epsilon: 0.0843146292225148
Training...
episode: 2749 no of steps: 168 score: 966.0 avg score: 5.75 memorylength: 131072 epsilon: 0.08423878020239339
Training...
episode: 2750 no of steps: 161 score: 859.0 avg score: 5.3354 memorylength: 131072 epsilon: 0.08416299941568045
saving states...
Training...
episode: 2751 no of steps: 162 score: 1021.0 avg score: 6.3025 memorylength: 131072 epsilon: 0.08408728680099357
Training...
episode: 2752 no of steps: 174 score: 1014.0 avg score: 5.8276 memorylength: 131072 epsilon: 0.08401164229700546
Training...
episode: 2753 no of steps: 175 score: 962.0 avg score: 5.4971 memorylength: 131072 epsilon: 0.08393606584244412
Training...
episode: 2754 no of steps: 156 score: 1102.0 avg score: 7.0641 memorylength: 131072 epsilon: 0.08386055737609258
Training...
episode: 2755 no of steps: 168 score: 820.0 avg score: 4.881 memorylength: 131072 epsilon: 0.08378511683678905
Training...
episode: 2756 no of steps: 161 score: 985.0 avg score: 6.118 memorylength: 131072 epsilon: 0.08370974416342661
Training...
episode: 2757 no of steps: 161 score: 425.0 avg score: 2.6398 memorylength: 131072 epsilon: 0.0836344392949534
Training...
episode: 2758 no of steps: 153 score: 811.0 avg score: 5.3007 memorylength: 131072 epsilon: 0.08355920217037253
Training...
episode: 2759 no of steps: 148 score: 911.0 avg score: 6.1554 memorylength: 131072 epsilon: 0.08348403272874186
Training...
episode: 2760 no of steps: 162 score: 849.0 avg score: 5.2407 memorylength: 131072 epsilon: 0.08340893090917416
Training...
episode: 2761 no of steps: 143 score: 885.0 avg score: 6.1888 memorylength: 131072 epsilon: 0.08333389665083696
Training...
episode: 2762 no of steps: 151 score: 1121.0 avg score: 7.4238 memorylength: 131072 epsilon: 0.08325892989295254
Training...
episode: 2763 no of steps: 169 score: 1296.0 avg score: 7.6686 memorylength: 131072 epsilon: 0.08318403057479774
Training...
episode: 2764 no of steps: 168 score: 1390.0 avg score: 8.2738 memorylength: 131072 epsilon: 0.08310919863570415
Training...
episode: 2765 no of steps: 175 score: 1093.0 avg score: 6.2457 memorylength: 131072 epsilon: 0.08303443401505796
Training...
episode: 2766 no of steps: 154 score: 990.0 avg score: 6.4286 memorylength: 131072 epsilon: 0.0829597366522997
Training...
episode: 2767 no of steps: 169 score: 818.0 avg score: 4.8402 memorylength: 131072 epsilon: 0.08288510648692458
Training...
episode: 2768 no of steps: 151 score: 925.0 avg score: 6.1258 memorylength: 131072 epsilon: 0.08281054345848214
Training...
episode: 2769 no of steps: 158 score: 808.0 avg score: 5.1139 memorylength: 131072 epsilon: 0.08273604750657637
Training...
episode: 2770 no of steps: 173 score: 718.0 avg score: 4.1503 memorylength: 131072 epsilon: 0.08266161857086547
Training...
episode: 2771 no of steps: 161 score: 927.0 avg score: 5.7578 memorylength: 131072 epsilon: 0.08258725659106202
Training...
episode: 2772 no of steps: 150 score: 898.0 avg score: 5.9867 memorylength: 131072 epsilon: 0.08251296150693282
Training...
episode: 2773 no of steps: 154 score: 989.0 avg score: 6.4221 memorylength: 131072 epsilon: 0.08243873325829891
Training...
episode: 2774 no of steps: 152 score: 1020.0 avg score: 6.7105 memorylength: 131072 epsilon: 0.0823645717850353
Training...
episode: 2775 no of steps: 164 score: 1078.0 avg score: 6.5732 memorylength: 131072 epsilon: 0.08229047702707123
Training...
episode: 2776 no of steps: 134 score: 654.0 avg score: 4.8806 memorylength: 131072 epsilon: 0.08221644892438999
Training...
episode: 2777 no of steps: 144 score: 818.0 avg score: 5.6806 memorylength: 131072 epsilon: 0.08214248741702875
Training...
episode: 2778 no of steps: 155 score: 749.0 avg score: 4.8323 memorylength: 131072 epsilon: 0.0820685924450787
Training...
episode: 2779 no of steps: 155 score: 576.0 avg score: 3.7161 memorylength: 131072 epsilon: 0.08199476394868492
Training...
episode: 2780 no of steps: 169 score: 1179.0 avg score: 6.9763 memorylength: 131072 epsilon: 0.08192100186804636
Training...
episode: 2781 no of steps: 147 score: 1179.0 avg score: 8.0204 memorylength: 131072 epsilon: 0.08184730614341566
Training...
episode: 2782 no of steps: 154 score: 779.0 avg score: 5.0584 memorylength: 131072 epsilon: 0.0817736767150993
Training...
episode: 2783 no of steps: 163 score: 1281.0 avg score: 7.8589 memorylength: 131072 epsilon: 0.08170011352345745
Training...
episode: 2784 no of steps: 150 score: 742.0 avg score: 4.9467 memorylength: 131072 epsilon: 0.08162661650890396
Training...
episode: 2785 no of steps: 155 score: 1035.0 avg score: 6.6774 memorylength: 131072 epsilon: 0.08155318561190618
Training...
episode: 2786 no of steps: 172 score: 1412.0 avg score: 8.2093 memorylength: 131072 epsilon: 0.0814798207729851
Training...
episode: 2787 no of steps: 152 score: 972.0 avg score: 6.3947 memorylength: 131072 epsilon: 0.08140652193271522
Training...
episode: 2788 no of steps: 147 score: 735.0 avg score: 5.0 memorylength: 131072 epsilon: 0.08133328903172445
Training...
episode: 2789 no of steps: 157 score: 1016.0 avg score: 6.4713 memorylength: 131072 epsilon: 0.0812601220106941
Training...
episode: 2790 no of steps: 154 score: 951.0 avg score: 6.1753 memorylength: 131072 epsilon: 0.08118702081035896
Training...
episode: 2791 no of steps: 139 score: 749.0 avg score: 5.3885 memorylength: 131072 epsilon: 0.08111398537150705
Training...
episode: 2792 no of steps: 160 score: 908.0 avg score: 5.675 memorylength: 131072 epsilon: 0.08104101563497956
Training...
episode: 2793 no of steps: 139 score: 362.0 avg score: 2.6043 memorylength: 131072 epsilon: 0.08096811154167109
Training...
episode: 2794 no of steps: 169 score: 1025.0 avg score: 6.0651 memorylength: 131072 epsilon: 0.08089527303252933
Training...
episode: 2795 no of steps: 184 score: 958.0 avg score: 5.2065 memorylength: 131072 epsilon: 0.080822500048555
Training...
episode: 2796 no of steps: 174 score: 884.0 avg score: 5.0805 memorylength: 131072 epsilon: 0.08074979253080204
Training...
episode: 2797 no of steps: 202 score: 756.0 avg score: 3.7426 memorylength: 131072 epsilon: 0.08067715042037735
Training...
episode: 2798 no of steps: 187 score: 1201.0 avg score: 6.4225 memorylength: 131072 epsilon: 0.08060457365844084
Training...
episode: 2799 no of steps: 183 score: 935.0 avg score: 5.1093 memorylength: 131072 epsilon: 0.08053206218620526
Training...
episode: 2800 no of steps: 172 score: 661.0 avg score: 3.843 memorylength: 131072 epsilon: 0.08045961594493636
saving states...
Training...
episode: 2801 no of steps: 162 score: 780.0 avg score: 4.8148 memorylength: 131072 epsilon: 0.08038723487595267
Training...
episode: 2802 no of steps: 161 score: 953.0 avg score: 5.9193 memorylength: 131072 epsilon: 0.08031491892062556
Training...
episode: 2803 no of steps: 156 score: 561.0 avg score: 3.5962 memorylength: 131072 epsilon: 0.08024266802037903
Training...
episode: 2804 no of steps: 135 score: 621.0 avg score: 4.6 memorylength: 131072 epsilon: 0.0801704821166899
Training...
episode: 2805 no of steps: 163 score: 1096.0 avg score: 6.7239 memorylength: 131072 epsilon: 0.08009836115108758
Training...
episode: 2806 no of steps: 129 score: 721.0 avg score: 5.5891 memorylength: 131072 epsilon: 0.08002630506515404
Training...
episode: 2807 no of steps: 140 score: 647.0 avg score: 4.6214 memorylength: 131072 epsilon: 0.07995431380052388
Training...
episode: 2808 no of steps: 144 score: 729.0 avg score: 5.0625 memorylength: 131072 epsilon: 0.0798823872988842
Training...
episode: 2809 no of steps: 155 score: 1101.0 avg score: 7.1032 memorylength: 131072 epsilon: 0.0798105255019745
Training...
episode: 2810 no of steps: 155 score: 685.0 avg score: 4.4194 memorylength: 131072 epsilon: 0.0797387283515867
Training...
episode: 2811 no of steps: 153 score: 586.0 avg score: 3.8301 memorylength: 131072 epsilon: 0.07966699578956511
Training...
episode: 2812 no of steps: 151 score: 877.0 avg score: 5.8079 memorylength: 131072 epsilon: 0.07959532775780641
Training...
episode: 2813 no of steps: 155 score: 1119.0 avg score: 7.2194 memorylength: 131072 epsilon: 0.07952372419825941
Training...
episode: 2814 no of steps: 162 score: 769.0 avg score: 4.7469 memorylength: 131072 epsilon: 0.07945218505292526
Training...
episode: 2815 no of steps: 177 score: 1080.0 avg score: 6.1017 memorylength: 131072 epsilon: 0.07938071026385725
Training...
episode: 2816 no of steps: 172 score: 895.0 avg score: 5.2035 memorylength: 131072 epsilon: 0.07930929977316083
Training...
episode: 2817 no of steps: 160 score: 1145.0 avg score: 7.1562 memorylength: 131072 epsilon: 0.07923795352299341
Training...
episode: 2818 no of steps: 201 score: 1231.0 avg score: 6.1244 memorylength: 131072 epsilon: 0.07916667145556461
Training...
episode: 2819 no of steps: 174 score: 1445.0 avg score: 8.3046 memorylength: 131072 epsilon: 0.07909545351313589
Training...
episode: 2820 no of steps: 177 score: 988.0 avg score: 5.5819 memorylength: 131072 epsilon: 0.07902429963802077
Training...
episode: 2821 no of steps: 168 score: 1343.0 avg score: 7.994 memorylength: 131072 epsilon: 0.07895320977258456
Training...
episode: 2822 no of steps: 168 score: 1361.0 avg score: 8.1012 memorylength: 131072 epsilon: 0.07888218385924449
Training...
episode: 2823 no of steps: 191 score: 1187.0 avg score: 6.2147 memorylength: 131072 epsilon: 0.07881122184046957
Training...
episode: 2824 no of steps: 151 score: 1044.0 avg score: 6.9139 memorylength: 131072 epsilon: 0.07874032365878053
Training...
episode: 2825 no of steps: 162 score: 862.0 avg score: 5.321 memorylength: 131072 epsilon: 0.07866948925674984
Training...
episode: 2826 no of steps: 140 score: 839.0 avg score: 5.9929 memorylength: 131072 epsilon: 0.07859871857700167
Training...
episode: 2827 no of steps: 166 score: 888.0 avg score: 5.3494 memorylength: 131072 epsilon: 0.07852801156221177
Training...
episode: 2828 no of steps: 148 score: 516.0 avg score: 3.4865 memorylength: 131072 epsilon: 0.0784573681551074
Training...
episode: 2829 no of steps: 162 score: 985.0 avg score: 6.0802 memorylength: 131072 epsilon: 0.07838678829846743
Training...
episode: 2830 no of steps: 159 score: 670.0 avg score: 4.2138 memorylength: 131072 epsilon: 0.07831627193512218
Training...
episode: 2831 no of steps: 153 score: 669.0 avg score: 4.3725 memorylength: 131072 epsilon: 0.07824581900795337
Training...
episode: 2832 no of steps: 139 score: 454.0 avg score: 3.2662 memorylength: 131072 epsilon: 0.07817542945989411
Training...
episode: 2833 no of steps: 165 score: 652.0 avg score: 3.9515 memorylength: 131072 epsilon: 0.0781051032339289
Training...
episode: 2834 no of steps: 149 score: 634.0 avg score: 4.255 memorylength: 131072 epsilon: 0.07803484027309353
Training...
episode: 2835 no of steps: 162 score: 694.0 avg score: 4.284 memorylength: 131072 epsilon: 0.07796464052047489
Training...
episode: 2836 no of steps: 158 score: 990.0 avg score: 6.2658 memorylength: 131072 epsilon: 0.07789450391921124
Training...
episode: 2837 no of steps: 137 score: 675.0 avg score: 4.927 memorylength: 131072 epsilon: 0.07782443041249193
Training...
episode: 2838 no of steps: 168 score: 917.0 avg score: 5.4583 memorylength: 131072 epsilon: 0.07775441994355743
Training...
episode: 2839 no of steps: 154 score: 771.0 avg score: 5.0065 memorylength: 131072 epsilon: 0.07768447245569922
Training...
episode: 2840 no of steps: 171 score: 633.0 avg score: 3.7018 memorylength: 131072 epsilon: 0.07761458789225983
Training...
episode: 2841 no of steps: 184 score: 1008.0 avg score: 5.4783 memorylength: 131072 epsilon: 0.07754476619663282
Training...
episode: 2842 no of steps: 172 score: 1051.0 avg score: 6.1105 memorylength: 131072 epsilon: 0.07747500731226253
Training...
episode: 2843 no of steps: 167 score: 1255.0 avg score: 7.515 memorylength: 131072 epsilon: 0.07740531118264429
Training...
episode: 2844 no of steps: 157 score: 697.0 avg score: 4.4395 memorylength: 131072 epsilon: 0.07733567775132427
Training...
episode: 2845 no of steps: 169 score: 647.0 avg score: 3.8284 memorylength: 131072 epsilon: 0.07726610696189937
Training...
episode: 2846 no of steps: 178 score: 1326.0 avg score: 7.4494 memorylength: 131072 epsilon: 0.07719659875801721
Training...
episode: 2847 no of steps: 176 score: 829.0 avg score: 4.7102 memorylength: 131072 epsilon: 0.07712715308337616
Training...
episode: 2848 no of steps: 154 score: 1053.0 avg score: 6.8377 memorylength: 131072 epsilon: 0.0770577698817252
Training...
episode: 2849 no of steps: 158 score: 883.0 avg score: 5.5886 memorylength: 131072 epsilon: 0.07698844909686402
Training...
episode: 2850 no of steps: 144 score: 963.0 avg score: 6.6875 memorylength: 131072 epsilon: 0.07691919067264268
saving states...
Training...
episode: 2851 no of steps: 152 score: 832.0 avg score: 5.4737 memorylength: 131072 epsilon: 0.07684999455296188
Training...
episode: 2852 no of steps: 152 score: 748.0 avg score: 4.9211 memorylength: 131072 epsilon: 0.07678086068177281
Training...
episode: 2853 no of steps: 148 score: 1021.0 avg score: 6.8986 memorylength: 131072 epsilon: 0.07671178900307696
Training...
episode: 2854 no of steps: 161 score: 983.0 avg score: 6.1056 memorylength: 131072 epsilon: 0.07664277946092629
Training...
episode: 2855 no of steps: 158 score: 1158.0 avg score: 7.3291 memorylength: 131072 epsilon: 0.07657383199942308
Training...
episode: 2856 no of steps: 154 score: 1161.0 avg score: 7.539 memorylength: 131072 epsilon: 0.07650494656271992
Training...
episode: 2857 no of steps: 161 score: 716.0 avg score: 4.4472 memorylength: 131072 epsilon: 0.0764361230950195
Training...
episode: 2858 no of steps: 161 score: 970.0 avg score: 6.0248 memorylength: 131072 epsilon: 0.07636736154057487
Training...
episode: 2859 no of steps: 162 score: 792.0 avg score: 4.8889 memorylength: 131072 epsilon: 0.0762986618436892
Training...
episode: 2860 no of steps: 161 score: 1068.0 avg score: 6.6335 memorylength: 131072 epsilon: 0.07623002394871567
Training...
episode: 2861 no of steps: 162 score: 1354.0 avg score: 8.358 memorylength: 131072 epsilon: 0.07616144780005761
Training...
episode: 2862 no of steps: 137 score: 273.0 avg score: 1.9927 memorylength: 131072 epsilon: 0.07609293334216832
Training...
episode: 2863 no of steps: 168 score: 999.0 avg score: 5.9464 memorylength: 131072 epsilon: 0.07602448051955114
Training...
episode: 2864 no of steps: 143 score: 985.0 avg score: 6.8881 memorylength: 131072 epsilon: 0.0759560892767592
Training...
episode: 2865 no of steps: 140 score: 1011.0 avg score: 7.2214 memorylength: 131072 epsilon: 0.07588775955839563
Training...
episode: 2866 no of steps: 154 score: 679.0 avg score: 4.4091 memorylength: 131072 epsilon: 0.07581949130911335
Training...
episode: 2867 no of steps: 149 score: 1075.0 avg score: 7.2148 memorylength: 131072 epsilon: 0.0757512844736151
Training...
episode: 2868 no of steps: 160 score: 787.0 avg score: 4.9188 memorylength: 131072 epsilon: 0.07568313899665328
Training...
episode: 2869 no of steps: 161 score: 787.0 avg score: 4.8882 memorylength: 131072 epsilon: 0.0756150548230301
Training...
episode: 2870 no of steps: 159 score: 669.0 avg score: 4.2075 memorylength: 131072 epsilon: 0.0755470318975974
Training...
episode: 2871 no of steps: 172 score: 495.0 avg score: 2.8779 memorylength: 131072 epsilon: 0.07547907016525651
Training...
episode: 2872 no of steps: 168 score: 511.0 avg score: 3.0417 memorylength: 131072 epsilon: 0.0754111695709585
Training...
episode: 2873 no of steps: 179 score: 1299.0 avg score: 7.257 memorylength: 131072 epsilon: 0.07534333005970385
Training...
episode: 2874 no of steps: 176 score: 670.0 avg score: 3.8068 memorylength: 131072 epsilon: 0.07527555157654263
Training...
episode: 2875 no of steps: 164 score: 909.0 avg score: 5.5427 memorylength: 131072 epsilon: 0.07520783406657415
Training...
episode: 2876 no of steps: 174 score: 945.0 avg score: 5.431 memorylength: 131072 epsilon: 0.07514017747494726
Training...
episode: 2877 no of steps: 146 score: 960.0 avg score: 6.5753 memorylength: 131072 epsilon: 0.0750725817468602
Training...
episode: 2878 no of steps: 155 score: 621.0 avg score: 4.0065 memorylength: 131072 epsilon: 0.0750050468275603
Training...
episode: 2879 no of steps: 144 score: 814.0 avg score: 5.6528 memorylength: 131072 epsilon: 0.07493757266234435
Training...
episode: 2880 no of steps: 139 score: 786.0 avg score: 5.6547 memorylength: 131072 epsilon: 0.07487015919655823
Training...
episode: 2881 no of steps: 147 score: 765.0 avg score: 5.2041 memorylength: 131072 epsilon: 0.07480280637559711
Training...
episode: 2882 no of steps: 146 score: 652.0 avg score: 4.4658 memorylength: 131072 epsilon: 0.07473551414490509
Training...
episode: 2883 no of steps: 138 score: 453.0 avg score: 3.2826 memorylength: 131072 epsilon: 0.07466828244997553
Training...
episode: 2884 no of steps: 154 score: 813.0 avg score: 5.2792 memorylength: 131072 epsilon: 0.07460111123635074
Training...
episode: 2885 no of steps: 148 score: 667.0 avg score: 4.5068 memorylength: 131072 epsilon: 0.07453400044962205
Training...
episode: 2886 no of steps: 151 score: 593.0 avg score: 3.9272 memorylength: 131072 epsilon: 0.07446695003542966
Training...
episode: 2887 no of steps: 149 score: 562.0 avg score: 3.7718 memorylength: 131072 epsilon: 0.07439995993946279
Training...
episode: 2888 no of steps: 159 score: 737.0 avg score: 4.6352 memorylength: 131072 epsilon: 0.07433303010745945
Training...
episode: 2889 no of steps: 144 score: 670.0 avg score: 4.6528 memorylength: 131072 epsilon: 0.07426616048520646
Training...
episode: 2890 no of steps: 148 score: 693.0 avg score: 4.6824 memorylength: 131072 epsilon: 0.07419935101853939
Training...
episode: 2891 no of steps: 158 score: 710.0 avg score: 4.4937 memorylength: 131072 epsilon: 0.07413260165334262
Training...
episode: 2892 no of steps: 158 score: 1023.0 avg score: 6.4747 memorylength: 131072 epsilon: 0.07406591233554917
Training...
episode: 2893 no of steps: 171 score: 513.0 avg score: 3.0 memorylength: 131072 epsilon: 0.07399928301114063
Training...
episode: 2894 no of steps: 187 score: 1215.0 avg score: 6.4973 memorylength: 131072 epsilon: 0.07393271362614728
Training...
episode: 2895 no of steps: 162 score: 1061.0 avg score: 6.5494 memorylength: 131072 epsilon: 0.0738662041266479
Training...
episode: 2896 no of steps: 148 score: 1109.0 avg score: 7.4932 memorylength: 131072 epsilon: 0.07379975445876984
Training...
episode: 2897 no of steps: 149 score: 1129.0 avg score: 7.5772 memorylength: 131072 epsilon: 0.07373336456868879
Training...
episode: 2898 no of steps: 140 score: 493.0 avg score: 3.5214 memorylength: 131072 epsilon: 0.07366703440262898
Training...
episode: 2899 no of steps: 134 score: 721.0 avg score: 5.3806 memorylength: 131072 epsilon: 0.07360076390686299
Training...
episode: 2900 no of steps: 139 score: 488.0 avg score: 3.5108 memorylength: 131072 epsilon: 0.07353455302771165
saving states...
Training...
episode: 2901 no of steps: 132 score: 858.0 avg score: 6.5 memorylength: 131072 epsilon: 0.07346840171154419
Training...
episode: 2902 no of steps: 131 score: 289.0 avg score: 2.2061 memorylength: 131072 epsilon: 0.07340230990477803
Training...
episode: 2903 no of steps: 148 score: 886.0 avg score: 5.9865 memorylength: 131072 epsilon: 0.07333627755387884
Training...
episode: 2904 no of steps: 184 score: 1119.0 avg score: 6.0815 memorylength: 131072 epsilon: 0.07327030460536035
Training...
episode: 2905 no of steps: 182 score: 967.0 avg score: 5.3132 memorylength: 131072 epsilon: 0.0732043910057845
Training...
episode: 2906 no of steps: 193 score: 584.0 avg score: 3.0259 memorylength: 131072 epsilon: 0.07313853670176129
Training...
episode: 2907 no of steps: 187 score: 927.0 avg score: 4.9572 memorylength: 131072 epsilon: 0.07307274163994867
Training...
episode: 2908 no of steps: 221 score: 1134.0 avg score: 5.1312 memorylength: 131072 epsilon: 0.0730070057670527
Training...
episode: 2909 no of steps: 179 score: 890.0 avg score: 4.9721 memorylength: 131072 epsilon: 0.07294132902982726
Training...
episode: 2910 no of steps: 154 score: 704.0 avg score: 4.5714 memorylength: 131072 epsilon: 0.07287571137507427
Training...
episode: 2911 no of steps: 153 score: 707.0 avg score: 4.6209 memorylength: 131072 epsilon: 0.07281015274964335
Training...
episode: 2912 no of steps: 153 score: 477.0 avg score: 3.1176 memorylength: 131072 epsilon: 0.07274465310043204
Training...
episode: 2913 no of steps: 135 score: 768.0 avg score: 5.6889 memorylength: 131072 epsilon: 0.07267921237438561
Training...
episode: 2914 no of steps: 136 score: 513.0 avg score: 3.7721 memorylength: 131072 epsilon: 0.0726138305184971
Training...
episode: 2915 no of steps: 143 score: 571.0 avg score: 3.993 memorylength: 131072 epsilon: 0.07254850747980716
Training...
episode: 2916 no of steps: 130 score: 328.0 avg score: 2.5231 memorylength: 131072 epsilon: 0.07248324320540414
Training...
episode: 2917 no of steps: 158 score: 404.0 avg score: 2.557 memorylength: 131072 epsilon: 0.07241803764242402
Training...
episode: 2918 no of steps: 124 score: 353.0 avg score: 2.8468 memorylength: 131072 epsilon: 0.07235289073805022
Training...
episode: 2919 no of steps: 160 score: 1001.0 avg score: 6.2562 memorylength: 131072 epsilon: 0.07228780243951376
Training...
episode: 2920 no of steps: 178 score: 904.0 avg score: 5.0787 memorylength: 131072 epsilon: 0.07222277269409313
Training...
episode: 2921 no of steps: 158 score: 895.0 avg score: 5.6646 memorylength: 131072 epsilon: 0.07215780144911428
Training...
episode: 2922 no of steps: 199 score: 963.0 avg score: 4.8392 memorylength: 131072 epsilon: 0.0720928886519504
Training...
episode: 2923 no of steps: 180 score: 405.0 avg score: 2.25 memorylength: 131072 epsilon: 0.07202803425002219
Training...
episode: 2924 no of steps: 169 score: 683.0 avg score: 4.0414 memorylength: 131072 epsilon: 0.07196323819079757
Training...
episode: 2925 no of steps: 188 score: 305.0 avg score: 1.6223 memorylength: 131072 epsilon: 0.0718985004217917
Training...
episode: 2926 no of steps: 148 score: 751.0 avg score: 5.0743 memorylength: 131072 epsilon: 0.07183382089056699
Training...
episode: 2927 no of steps: 134 score: 783.0 avg score: 5.8433 memorylength: 131072 epsilon: 0.07176919954473304
Training...
episode: 2928 no of steps: 131 score: 988.0 avg score: 7.542 memorylength: 131072 epsilon: 0.07170463633194658
Training...
episode: 2929 no of steps: 133 score: 378.0 avg score: 2.8421 memorylength: 131072 epsilon: 0.07164013119991133
Training...
episode: 2930 no of steps: 117 score: 755.0 avg score: 6.453 memorylength: 131072 epsilon: 0.07157568409637817
Training...
episode: 2931 no of steps: 124 score: 565.0 avg score: 4.5565 memorylength: 131072 epsilon: 0.07151129496914495
Training...
episode: 2932 no of steps: 127 score: 661.0 avg score: 5.2047 memorylength: 131072 epsilon: 0.07144696376605647
Training...
episode: 2933 no of steps: 142 score: 679.0 avg score: 4.7817 memorylength: 131072 epsilon: 0.07138269043500443
Training...
episode: 2934 no of steps: 162 score: 773.0 avg score: 4.7716 memorylength: 131072 epsilon: 0.07131847492392746
Training...
episode: 2935 no of steps: 176 score: 420.0 avg score: 2.3864 memorylength: 131072 epsilon: 0.071254317180811
Training...
episode: 2936 no of steps: 208 score: 711.0 avg score: 3.4183 memorylength: 131072 epsilon: 0.07119021715368722
Training...
episode: 2937 no of steps: 218 score: 810.0 avg score: 3.7156 memorylength: 131072 epsilon: 0.07112617479063511
Training...
episode: 2938 no of steps: 259 score: -3.0 avg score: -0.0116 memorylength: 131072 epsilon: 0.0710621900397804
Training...
episode: 2939 no of steps: 176 score: 830.0 avg score: 4.7159 memorylength: 131072 epsilon: 0.07099826284929542
Training...
episode: 2940 no of steps: 132 score: 1111.0 avg score: 8.4167 memorylength: 131072 epsilon: 0.07093439316739909
Training...
episode: 2941 no of steps: 158 score: 809.0 avg score: 5.1203 memorylength: 131072 epsilon: 0.07087058094235703
Training...
episode: 2942 no of steps: 134 score: 534.0 avg score: 3.9851 memorylength: 131072 epsilon: 0.07080682612248132
Training...
episode: 2943 no of steps: 145 score: 747.0 avg score: 5.1517 memorylength: 131072 epsilon: 0.07074312865613051
Training...
episode: 2944 no of steps: 153 score: 549.0 avg score: 3.5882 memorylength: 131072 epsilon: 0.0706794884917097
Training...
episode: 2945 no of steps: 180 score: 666.0 avg score: 3.7 memorylength: 131072 epsilon: 0.07061590557767031
Training...
episode: 2946 no of steps: 179 score: 241.0 avg score: 1.3464 memorylength: 131072 epsilon: 0.07055237986251024
Training...
episode: 2947 no of steps: 157 score: 332.0 avg score: 2.1146 memorylength: 131072 epsilon: 0.07048891129477358
Training...
episode: 2948 no of steps: 145 score: 37.0 avg score: 0.2552 memorylength: 131072 epsilon: 0.07042549982305082
Training...
episode: 2949 no of steps: 151 score: 307.0 avg score: 2.0331 memorylength: 131072 epsilon: 0.07036214539597867
Training...
episode: 2950 no of steps: 163 score: 593.0 avg score: 3.638 memorylength: 131072 epsilon: 0.07029884796224008
saving states...
Training...
episode: 2951 no of steps: 175 score: 958.0 avg score: 5.4743 memorylength: 131072 epsilon: 0.07023560747056405
Training...
episode: 2952 no of steps: 187 score: 829.0 avg score: 4.4332 memorylength: 131072 epsilon: 0.07017242386972579
Training...
episode: 2953 no of steps: 172 score: 1323.0 avg score: 7.6919 memorylength: 131072 epsilon: 0.07010929710854666
Training...
episode: 2954 no of steps: 176 score: 792.0 avg score: 4.5 memorylength: 131072 epsilon: 0.07004622713589385
Training...
episode: 2955 no of steps: 161 score: 947.0 avg score: 5.882 memorylength: 131072 epsilon: 0.06998321390068078
Training...
episode: 2956 no of steps: 156 score: 630.0 avg score: 4.0385 memorylength: 131072 epsilon: 0.0699202573518667
Training...
episode: 2957 no of steps: 178 score: 810.0 avg score: 4.5506 memorylength: 131072 epsilon: 0.06985735743845682
Training...
episode: 2958 no of steps: 162 score: 534.0 avg score: 3.2963 memorylength: 131072 epsilon: 0.06979451410950216
Training...
episode: 2959 no of steps: 142 score: 602.0 avg score: 4.2394 memorylength: 131072 epsilon: 0.06973172731409963
Training...
episode: 2960 no of steps: 159 score: 814.0 avg score: 5.1195 memorylength: 131072 epsilon: 0.06966899700139195
Training...
episode: 2961 no of steps: 142 score: 279.0 avg score: 1.9648 memorylength: 131072 epsilon: 0.06960632312056758
Training...
episode: 2962 no of steps: 125 score: 459.0 avg score: 3.672 memorylength: 131072 epsilon: 0.06954370562086061
Training...
episode: 2963 no of steps: 136 score: 593.0 avg score: 4.3603 memorylength: 131072 epsilon: 0.06948114445155089
Training...
episode: 2964 no of steps: 139 score: 518.0 avg score: 3.7266 memorylength: 131072 epsilon: 0.06941863956196392
Training...
episode: 2965 no of steps: 138 score: 922.0 avg score: 6.6812 memorylength: 131072 epsilon: 0.06935619090147065
Training...
episode: 2966 no of steps: 140 score: 772.0 avg score: 5.5143 memorylength: 131072 epsilon: 0.0692937984194877
Training...
episode: 2967 no of steps: 149 score: 1355.0 avg score: 9.094 memorylength: 131072 epsilon: 0.06923146206547717
Training...
episode: 2968 no of steps: 165 score: 836.0 avg score: 5.0667 memorylength: 131072 epsilon: 0.06916918178894661
Training...
episode: 2969 no of steps: 164 score: 516.0 avg score: 3.1463 memorylength: 131072 epsilon: 0.06910695753944897
Training...
episode: 2970 no of steps: 162 score: 954.0 avg score: 5.8889 memorylength: 131072 epsilon: 0.06904478926658261
Training...
episode: 2971 no of steps: 160 score: 1138.0 avg score: 7.1125 memorylength: 131072 epsilon: 0.06898267691999124
Training...
episode: 2972 no of steps: 159 score: 489.0 avg score: 3.0755 memorylength: 131072 epsilon: 0.06892062044936384
Training...
episode: 2973 no of steps: 156 score: 824.0 avg score: 5.2821 memorylength: 131072 epsilon: 0.06885861980443467
Training...
episode: 2974 no of steps: 146 score: 1039.0 avg score: 7.1164 memorylength: 131072 epsilon: 0.0687966749349832
Training...
episode: 2975 no of steps: 144 score: 786.0 avg score: 5.4583 memorylength: 131072 epsilon: 0.06873478579083413
Training...
episode: 2976 no of steps: 125 score: 657.0 avg score: 5.256 memorylength: 131072 epsilon: 0.06867295232185716
Training...
episode: 2977 no of steps: 125 score: 587.0 avg score: 4.696 memorylength: 131072 epsilon: 0.06861117447796723
Training...
episode: 2978 no of steps: 146 score: 710.0 avg score: 4.863 memorylength: 131072 epsilon: 0.06854945220912428
Training...
episode: 2979 no of steps: 141 score: 729.0 avg score: 5.1702 memorylength: 131072 epsilon: 0.06848778546533331
Training...
episode: 2980 no of steps: 149 score: 1020.0 avg score: 6.8456 memorylength: 131072 epsilon: 0.06842617419664418
Training...
episode: 2981 no of steps: 165 score: 942.0 avg score: 5.7091 memorylength: 131072 epsilon: 0.06836461835315177
Training...
episode: 2982 no of steps: 175 score: 1138.0 avg score: 6.5029 memorylength: 131072 epsilon: 0.0683031178849959
Training...
episode: 2983 no of steps: 185 score: 995.0 avg score: 5.3784 memorylength: 131072 epsilon: 0.06824167274236113
Training...
episode: 2984 no of steps: 174 score: 1155.0 avg score: 6.6379 memorylength: 131072 epsilon: 0.06818028287547692
Training...
episode: 2985 no of steps: 179 score: 864.0 avg score: 4.8268 memorylength: 131072 epsilon: 0.06811894823461745
Training...
episode: 2986 no of steps: 160 score: 900.0 avg score: 5.625 memorylength: 131072 epsilon: 0.06805766877010172
Training...
episode: 2987 no of steps: 150 score: 638.0 avg score: 4.2533 memorylength: 131072 epsilon: 0.06799644443229327
Training...
episode: 2988 no of steps: 160 score: 998.0 avg score: 6.2375 memorylength: 131072 epsilon: 0.06793527517160045
Training...
episode: 2989 no of steps: 167 score: 926.0 avg score: 5.5449 memorylength: 131072 epsilon: 0.06787416093847613
Training...
episode: 2990 no of steps: 149 score: 779.0 avg score: 5.2282 memorylength: 131072 epsilon: 0.06781310168341778
Training...
episode: 2991 no of steps: 163 score: 468.0 avg score: 2.8712 memorylength: 131072 epsilon: 0.06775209735696738
Training...
episode: 2992 no of steps: 175 score: 348.0 avg score: 1.9886 memorylength: 131072 epsilon: 0.06769114790971147
Training...
episode: 2993 no of steps: 175 score: 396.0 avg score: 2.2629 memorylength: 131072 epsilon: 0.06763025329228096
Training...
episode: 2994 no of steps: 154 score: 334.0 avg score: 2.1688 memorylength: 131072 epsilon: 0.06756941345535122
Training...
episode: 2995 no of steps: 180 score: 344.0 avg score: 1.9111 memorylength: 131072 epsilon: 0.06750862834964196
Training...
episode: 2996 no of steps: 164 score: 351.0 avg score: 2.1402 memorylength: 131072 epsilon: 0.06744789792591725
Training...
episode: 2997 no of steps: 157 score: 477.0 avg score: 3.0382 memorylength: 131072 epsilon: 0.06738722213498549
Training...
episode: 2998 no of steps: 155 score: 684.0 avg score: 4.4129 memorylength: 131072 epsilon: 0.0673266009276992
Training...
episode: 2999 no of steps: 135 score: 548.0 avg score: 4.0593 memorylength: 131072 epsilon: 0.06726603425495525
Training...
episode: 3000 no of steps: 156 score: 558.0 avg score: 3.5769 memorylength: 131072 epsilon: 0.06720552206769465
saving states...
Training...
episode: 3001 no of steps: 159 score: 922.0 avg score: 5.7987 memorylength: 131072 epsilon: 0.06714506431690247
Training...
episode: 3002 no of steps: 158 score: 444.0 avg score: 2.8101 memorylength: 131072 epsilon: 0.06708466095360796
Training...
episode: 3003 no of steps: 138 score: 683.0 avg score: 4.9493 memorylength: 131072 epsilon: 0.06702431192888439
Training...
episode: 3004 no of steps: 167 score: 522.0 avg score: 3.1257 memorylength: 131072 epsilon: 0.06696401719384908
Training...
episode: 3005 no of steps: 178 score: 524.0 avg score: 2.9438 memorylength: 131072 epsilon: 0.06690377669966323
Training...
episode: 3006 no of steps: 179 score: 384.0 avg score: 2.1453 memorylength: 131072 epsilon: 0.06684359039753204
Training...
episode: 3007 no of steps: 179 score: 130.0 avg score: 0.7263 memorylength: 131072 epsilon: 0.06678345823870468
Training...
episode: 3008 no of steps: 149 score: 399.0 avg score: 2.6779 memorylength: 131072 epsilon: 0.06672338017447402
Training...
episode: 3009 no of steps: 150 score: 798.0 avg score: 5.32 memorylength: 131072 epsilon: 0.06666335615617683
Training...
episode: 3010 no of steps: 144 score: 696.0 avg score: 4.8333 memorylength: 131072 epsilon: 0.06660338613519369
Training...
episode: 3011 no of steps: 142 score: 1110.0 avg score: 7.8169 memorylength: 131072 epsilon: 0.06654347006294888
Training...
episode: 3012 no of steps: 130 score: 1189.0 avg score: 9.1462 memorylength: 131072 epsilon: 0.06648360789091033
Training...
episode: 3013 no of steps: 170 score: 926.0 avg score: 5.4471 memorylength: 131072 epsilon: 0.0664237995705897
Training...
episode: 3014 no of steps: 162 score: 1178.0 avg score: 7.2716 memorylength: 131072 epsilon: 0.06636404505354226
Training...
episode: 3015 no of steps: 192 score: 871.0 avg score: 4.5365 memorylength: 131072 epsilon: 0.06630434429136688
Training...
episode: 3016 no of steps: 164 score: 1233.0 avg score: 7.5183 memorylength: 131072 epsilon: 0.06624469723570586
Training...
episode: 3017 no of steps: 176 score: 1196.0 avg score: 6.7955 memorylength: 131072 epsilon: 0.06618510383824514
Training...
episode: 3018 no of steps: 147 score: 1170.0 avg score: 7.9592 memorylength: 131072 epsilon: 0.06612556405071406
Training...
episode: 3019 no of steps: 144 score: 995.0 avg score: 6.9097 memorylength: 131072 epsilon: 0.06606607782488536
Training...
episode: 3020 no of steps: 148 score: 988.0 avg score: 6.6757 memorylength: 131072 epsilon: 0.06600664511257519
Training...
episode: 3021 no of steps: 151 score: 1444.0 avg score: 9.5629 memorylength: 131072 epsilon: 0.06594726586564309
Training...
episode: 3022 no of steps: 138 score: 908.0 avg score: 6.5797 memorylength: 131072 epsilon: 0.06588794003599187
Training...
episode: 3023 no of steps: 137 score: 486.0 avg score: 3.5474 memorylength: 131072 epsilon: 0.06582866757556755
Training...
episode: 3024 no of steps: 143 score: 1035.0 avg score: 7.2378 memorylength: 131072 epsilon: 0.06576944843635946
Training...
episode: 3025 no of steps: 168 score: 1188.0 avg score: 7.0714 memorylength: 131072 epsilon: 0.06571028257040011
Training...
episode: 3026 no of steps: 147 score: 562.0 avg score: 3.8231 memorylength: 131072 epsilon: 0.06565116992976516
Training...
episode: 3027 no of steps: 183 score: 1019.0 avg score: 5.5683 memorylength: 131072 epsilon: 0.06559211046657332
Training...
episode: 3028 no of steps: 187 score: 645.0 avg score: 3.4492 memorylength: 131072 epsilon: 0.06553310413298642
Training...
episode: 3029 no of steps: 179 score: 616.0 avg score: 3.4413 memorylength: 131072 epsilon: 0.06547415088120942
Training...
episode: 3030 no of steps: 161 score: 825.0 avg score: 5.1242 memorylength: 131072 epsilon: 0.06541525066349005
Training...
episode: 3031 no of steps: 204 score: 818.0 avg score: 4.0098 memorylength: 131072 epsilon: 0.06535640343211921
Training...
episode: 3032 no of steps: 162 score: 718.0 avg score: 4.4321 memorylength: 131072 epsilon: 0.06529760913943061
Training...
episode: 3033 no of steps: 158 score: 733.0 avg score: 4.6392 memorylength: 131072 epsilon: 0.06523886773780092
Training...
episode: 3034 no of steps: 155 score: 859.0 avg score: 5.5419 memorylength: 131072 epsilon: 0.06518017917964955
Training...
episode: 3035 no of steps: 175 score: 1120.0 avg score: 6.4 memorylength: 131072 epsilon: 0.06512154341743875
Training...
episode: 3036 no of steps: 174 score: 793.0 avg score: 4.5575 memorylength: 131072 epsilon: 0.06506296040367364
Training...
episode: 3037 no of steps: 156 score: 837.0 avg score: 5.3654 memorylength: 131072 epsilon: 0.06500443009090186
Training...
episode: 3038 no of steps: 153 score: 270.0 avg score: 1.7647 memorylength: 131072 epsilon: 0.06494595243171393
Training...
episode: 3039 no of steps: 166 score: 652.0 avg score: 3.9277 memorylength: 131072 epsilon: 0.06488752737874288
Training...
episode: 3040 no of steps: 162 score: 490.0 avg score: 3.0247 memorylength: 131072 epsilon: 0.06482915488466452
Training...
episode: 3041 no of steps: 161 score: 638.0 avg score: 3.9627 memorylength: 131072 epsilon: 0.06477083490219702
Training...
episode: 3042 no of steps: 151 score: 1077.0 avg score: 7.1325 memorylength: 131072 epsilon: 0.06471256738410124
Training...
episode: 3043 no of steps: 174 score: 376.0 avg score: 2.1609 memorylength: 131072 epsilon: 0.06465435228318048
Training...
episode: 3044 no of steps: 158 score: 1120.0 avg score: 7.0886 memorylength: 131072 epsilon: 0.06459618955228053
Training...
episode: 3045 no of steps: 162 score: 666.0 avg score: 4.1111 memorylength: 131072 epsilon: 0.06453807914428951
Training...
episode: 3046 no of steps: 171 score: 965.0 avg score: 5.6433 memorylength: 131072 epsilon: 0.06448002101213804
Training...
episode: 3047 no of steps: 146 score: 1090.0 avg score: 7.4658 memorylength: 131072 epsilon: 0.06442201510879904
Training...
episode: 3048 no of steps: 168 score: 841.0 avg score: 5.006 memorylength: 131072 epsilon: 0.06436406138728766
Training...
episode: 3049 no of steps: 165 score: 774.0 avg score: 4.6909 memorylength: 131072 epsilon: 0.06430615980066144
Training...
episode: 3050 no of steps: 179 score: 763.0 avg score: 4.2626 memorylength: 131072 epsilon: 0.06424831030202006
saving states...
Training...
episode: 3051 no of steps: 171 score: 578.0 avg score: 3.3801 memorylength: 131072 epsilon: 0.06419051284450547
Training...
episode: 3052 no of steps: 185 score: 716.0 avg score: 3.8703 memorylength: 131072 epsilon: 0.06413276738130166
Training...
episode: 3053 no of steps: 178 score: 617.0 avg score: 3.4663 memorylength: 131072 epsilon: 0.06407507386563487
Training...
episode: 3054 no of steps: 185 score: 1021.0 avg score: 5.5189 memorylength: 131072 epsilon: 0.0640174322507733
Training...
episode: 3055 no of steps: 169 score: 1020.0 avg score: 6.0355 memorylength: 131072 epsilon: 0.06395984249002724
Training...
episode: 3056 no of steps: 158 score: 888.0 avg score: 5.6203 memorylength: 131072 epsilon: 0.063902304536749
Training...
episode: 3057 no of steps: 159 score: 841.0 avg score: 5.2893 memorylength: 131072 epsilon: 0.06384481834433281
Training...
episode: 3058 no of steps: 157 score: 1012.0 avg score: 6.4459 memorylength: 131072 epsilon: 0.06378738386621492
Training...
episode: 3059 no of steps: 143 score: 772.0 avg score: 5.3986 memorylength: 131072 epsilon: 0.06373000105587331
Training...
episode: 3060 no of steps: 139 score: 608.0 avg score: 4.3741 memorylength: 131072 epsilon: 0.06367266986682796
Training...
episode: 3061 no of steps: 154 score: 1026.0 avg score: 6.6623 memorylength: 131072 epsilon: 0.06361539025264056
Training...
episode: 3062 no of steps: 129 score: 529.0 avg score: 4.1008 memorylength: 131072 epsilon: 0.06355816216691466
Training...
episode: 3063 no of steps: 129 score: 484.0 avg score: 3.7519 memorylength: 131072 epsilon: 0.06350098556329549
Training...
episode: 3064 no of steps: 135 score: 755.0 avg score: 5.5926 memorylength: 131072 epsilon: 0.06344386039546998
Training...
episode: 3065 no of steps: 149 score: 881.0 avg score: 5.9128 memorylength: 131072 epsilon: 0.06338678661716679
Training...
episode: 3066 no of steps: 155 score: 769.0 avg score: 4.9613 memorylength: 131072 epsilon: 0.0633297641821561
Training...
episode: 3067 no of steps: 151 score: 908.0 avg score: 6.0132 memorylength: 131072 epsilon: 0.06327279304424976
Training...
episode: 3068 no of steps: 138 score: 904.0 avg score: 6.5507 memorylength: 131072 epsilon: 0.06321587315730115
Training...
episode: 3069 no of steps: 157 score: 1133.0 avg score: 7.2166 memorylength: 131072 epsilon: 0.06315900447520519
Training...
episode: 3070 no of steps: 180 score: 1016.0 avg score: 5.6444 memorylength: 131072 epsilon: 0.06310218695189816
Training...
episode: 3071 no of steps: 194 score: 840.0 avg score: 4.3299 memorylength: 131072 epsilon: 0.06304542054135792
Training...
episode: 3072 no of steps: 209 score: 1035.0 avg score: 4.9522 memorylength: 131072 epsilon: 0.06298870519760368
Training...
episode: 3073 no of steps: 209 score: 988.0 avg score: 4.7273 memorylength: 131072 epsilon: 0.06293204087469599
Training...
episode: 3074 no of steps: 200 score: 1079.0 avg score: 5.395 memorylength: 131072 epsilon: 0.06287542752673674
Training...
episode: 3075 no of steps: 209 score: 1076.0 avg score: 5.1483 memorylength: 131072 epsilon: 0.06281886510786913
Training...
episode: 3076 no of steps: 201 score: 1213.0 avg score: 6.0348 memorylength: 131072 epsilon: 0.06276235357227762
Training...
episode: 3077 no of steps: 212 score: 1342.0 avg score: 6.3302 memorylength: 131072 epsilon: 0.06270589287418779
Training...
episode: 3078 no of steps: 200 score: 895.0 avg score: 4.475 memorylength: 131072 epsilon: 0.06264948296786652
Training...
episode: 3079 no of steps: 173 score: 562.0 avg score: 3.2486 memorylength: 131072 epsilon: 0.06259312380762179
Training...
episode: 3080 no of steps: 170 score: 468.0 avg score: 2.7529 memorylength: 131072 epsilon: 0.0625368153478027
Training...
episode: 3081 no of steps: 146 score: 415.0 avg score: 2.8425 memorylength: 131072 epsilon: 0.062480557542799325
Training...
episode: 3082 no of steps: 148 score: 263.0 avg score: 1.777 memorylength: 131072 epsilon: 0.06242435034704287
Training...
episode: 3083 no of steps: 135 score: 293.0 avg score: 2.1704 memorylength: 131072 epsilon: 0.06236819371500554
Training...
episode: 3084 no of steps: 146 score: 452.0 avg score: 3.0959 memorylength: 131072 epsilon: 0.062312087601200404
Training...
episode: 3085 no of steps: 136 score: 422.0 avg score: 3.1029 memorylength: 131072 epsilon: 0.062256031960181535
Training...
episode: 3086 no of steps: 141 score: 469.0 avg score: 3.3262 memorylength: 131072 epsilon: 0.06220002674654385
Training...
episode: 3087 no of steps: 136 score: 279.0 avg score: 2.0515 memorylength: 131072 epsilon: 0.06214407191492316
Training...
episode: 3088 no of steps: 143 score: 797.0 avg score: 5.5734 memorylength: 131072 epsilon: 0.062088167419995996
Training...
episode: 3089 no of steps: 138 score: 522.0 avg score: 3.7826 memorylength: 131072 epsilon: 0.06203231321647973
Training...
episode: 3090 no of steps: 155 score: 1071.0 avg score: 6.9097 memorylength: 131072 epsilon: 0.061976509259132465
Training...
episode: 3091 no of steps: 141 score: 890.0 avg score: 6.3121 memorylength: 131072 epsilon: 0.061920755502753014
Training...
episode: 3092 no of steps: 156 score: 954.0 avg score: 6.1154 memorylength: 131072 epsilon: 0.06186505190218078
Training...
episode: 3093 no of steps: 144 score: 327.0 avg score: 2.2708 memorylength: 131072 epsilon: 0.061809398412295866
Training...
episode: 3094 no of steps: 161 score: 756.0 avg score: 4.6957 memorylength: 131072 epsilon: 0.06175379498801897
Training...
episode: 3095 no of steps: 184 score: 801.0 avg score: 4.3533 memorylength: 131072 epsilon: 0.061698241584311274
Training...
episode: 3096 no of steps: 185 score: 628.0 avg score: 3.3946 memorylength: 131072 epsilon: 0.06164273815617453
Training...
episode: 3097 no of steps: 181 score: 648.0 avg score: 3.5801 memorylength: 131072 epsilon: 0.06158728465865096
Training...
episode: 3098 no of steps: 194 score: 1098.0 avg score: 5.6598 memorylength: 131072 epsilon: 0.061531881046823264
Training...
episode: 3099 no of steps: 182 score: 1132.0 avg score: 6.2198 memorylength: 131072 epsilon: 0.061476527275814444
Training...
episode: 3100 no of steps: 167 score: 1012.0 avg score: 6.0599 memorylength: 131072 epsilon: 0.06142122330078799
saving states...
Training...
episode: 3101 no of steps: 183 score: 1032.0 avg score: 5.6393 memorylength: 131072 epsilon: 0.061365969076947684
Training...
episode: 3102 no of steps: 155 score: 1218.0 avg score: 7.8581 memorylength: 131072 epsilon: 0.06131076455953756
Training...
episode: 3103 no of steps: 144 score: 940.0 avg score: 6.5278 memorylength: 131072 epsilon: 0.06125560970384199
Training...
episode: 3104 no of steps: 161 score: 1212.0 avg score: 7.528 memorylength: 131072 epsilon: 0.061200504465185525
Training...
episode: 3105 no of steps: 158 score: 953.0 avg score: 6.0316 memorylength: 131072 epsilon: 0.061145448798932946
Training...
episode: 3106 no of steps: 147 score: 654.0 avg score: 4.449 memorylength: 131072 epsilon: 0.06109044266048912
Training...
episode: 3107 no of steps: 143 score: 648.0 avg score: 4.5315 memorylength: 131072 epsilon: 0.061035486005299074
Training...
episode: 3108 no of steps: 146 score: 758.0 avg score: 5.1918 memorylength: 131072 epsilon: 0.06098057878884794
Training...
episode: 3109 no of steps: 152 score: 692.0 avg score: 4.5526 memorylength: 131072 epsilon: 0.060925720966660886
Training...
episode: 3110 no of steps: 151 score: 707.0 avg score: 4.6821 memorylength: 131072 epsilon: 0.060870912494303014
Training...
episode: 3111 no of steps: 154 score: 818.0 avg score: 5.3117 memorylength: 131072 epsilon: 0.06081615332737949
Training...
episode: 3112 no of steps: 165 score: 1090.0 avg score: 6.6061 memorylength: 131072 epsilon: 0.06076144342153542
Training...
episode: 3113 no of steps: 156 score: 1085.0 avg score: 6.9551 memorylength: 131072 epsilon: 0.06070678273245571
Training...
episode: 3114 no of steps: 162 score: 1687.0 avg score: 10.4136 memorylength: 131072 epsilon: 0.06065217121586523
Training...
episode: 3115 no of steps: 176 score: 1133.0 avg score: 6.4375 memorylength: 131072 epsilon: 0.06059760882752866
Training...
episode: 3116 no of steps: 141 score: 880.0 avg score: 6.2411 memorylength: 131072 epsilon: 0.060543095523250476
Training...
episode: 3117 no of steps: 168 score: 971.0 avg score: 5.7798 memorylength: 131072 epsilon: 0.06048863125887485
Training...
episode: 3118 no of steps: 191 score: 715.0 avg score: 3.7435 memorylength: 131072 epsilon: 0.060434215990285756
Training...
episode: 3119 no of steps: 192 score: 1102.0 avg score: 5.7396 memorylength: 131072 epsilon: 0.06037984967340684
Training...
episode: 3120 no of steps: 180 score: 1350.0 avg score: 7.5 memorylength: 131072 epsilon: 0.060325532264201336
Training...
episode: 3121 no of steps: 159 score: 976.0 avg score: 6.1384 memorylength: 131072 epsilon: 0.060271263718672155
Training...
episode: 3122 no of steps: 135 score: 872.0 avg score: 6.4593 memorylength: 131072 epsilon: 0.06021704399286179
Training...
episode: 3123 no of steps: 148 score: 818.0 avg score: 5.527 memorylength: 131072 epsilon: 0.060162873042852276
Training...
episode: 3124 no of steps: 132 score: 517.0 avg score: 3.9167 memorylength: 131072 epsilon: 0.06010875082476509
Training...
episode: 3125 no of steps: 133 score: 585.0 avg score: 4.3985 memorylength: 131072 epsilon: 0.060054677294761265
Training...
episode: 3126 no of steps: 141 score: 935.0 avg score: 6.6312 memorylength: 131072 epsilon: 0.060000652409041226
Training...
episode: 3127 no of steps: 167 score: 905.0 avg score: 5.4192 memorylength: 131072 epsilon: 0.05994667612384484
Training...
episode: 3128 no of steps: 136 score: 333.0 avg score: 2.4485 memorylength: 131072 epsilon: 0.05989274839545127
Training...
episode: 3129 no of steps: 158 score: 638.0 avg score: 4.038 memorylength: 131072 epsilon: 0.059838869180179076
Training...
episode: 3130 no of steps: 156 score: 837.0 avg score: 5.3654 memorylength: 131072 epsilon: 0.05978503843438612
Training...
episode: 3131 no of steps: 175 score: 1460.0 avg score: 8.3429 memorylength: 131072 epsilon: 0.05973125611446944
Training...
episode: 3132 no of steps: 166 score: 1098.0 avg score: 6.6145 memorylength: 131072 epsilon: 0.059677522176865366
Training...
episode: 3133 no of steps: 176 score: 793.0 avg score: 4.5057 memorylength: 131072 epsilon: 0.05962383657804943
Training...
episode: 3134 no of steps: 162 score: 598.0 avg score: 3.6914 memorylength: 131072 epsilon: 0.0595701992745363
Training...
episode: 3135 no of steps: 167 score: 953.0 avg score: 5.7066 memorylength: 131072 epsilon: 0.05951661022287971
Training...
episode: 3136 no of steps: 174 score: 683.0 avg score: 3.9253 memorylength: 131072 epsilon: 0.05946306937967257
Training...
episode: 3137 no of steps: 178 score: 1363.0 avg score: 7.6573 memorylength: 131072 epsilon: 0.05940957670154677
Training...
episode: 3138 no of steps: 150 score: 477.0 avg score: 3.18 memorylength: 131072 epsilon: 0.059356132145173275
Training...
episode: 3139 no of steps: 153 score: 1017.0 avg score: 6.6471 memorylength: 131072 epsilon: 0.05930273566726193
Training...
episode: 3140 no of steps: 146 score: 841.0 avg score: 5.7603 memorylength: 131072 epsilon: 0.05924938722456162
Training...
episode: 3141 no of steps: 135 score: 396.0 avg score: 2.9333 memorylength: 131072 epsilon: 0.05919608677386013
Training...
episode: 3142 no of steps: 155 score: 625.0 avg score: 4.0323 memorylength: 131072 epsilon: 0.05914283427198404
Training...
episode: 3143 no of steps: 163 score: 301.0 avg score: 1.8466 memorylength: 131072 epsilon: 0.05908962967579884
Training...
episode: 3144 no of steps: 165 score: 529.0 avg score: 3.2061 memorylength: 131072 epsilon: 0.059036472942208804
Training...
episode: 3145 no of steps: 161 score: 480.0 avg score: 2.9814 memorylength: 131072 epsilon: 0.058983364028157015
Training...
episode: 3146 no of steps: 155 score: 480.0 avg score: 3.0968 memorylength: 131072 epsilon: 0.058930302890625175
Training...
episode: 3147 no of steps: 177 score: 558.0 avg score: 3.1525 memorylength: 131072 epsilon: 0.058877289486633816
Training...
episode: 3148 no of steps: 185 score: 768.0 avg score: 4.1514 memorylength: 131072 epsilon: 0.05882432377324207
Training...
episode: 3149 no of steps: 191 score: 774.0 avg score: 4.0524 memorylength: 131072 epsilon: 0.05877140570754768
Training...
episode: 3150 no of steps: 172 score: 747.0 avg score: 4.343 memorylength: 131072 epsilon: 0.05871853524668703
saving states...
Training...
episode: 3151 no of steps: 166 score: 755.0 avg score: 4.5482 memorylength: 131072 epsilon: 0.05866571234783502
Training...
episode: 3152 no of steps: 189 score: 661.0 avg score: 3.4974 memorylength: 131072 epsilon: 0.058612936968205166
Training...
episode: 3153 no of steps: 174 score: 1093.0 avg score: 6.2816 memorylength: 131072 epsilon: 0.05856020906504933
Training...
episode: 3154 no of steps: 163 score: 621.0 avg score: 3.8098 memorylength: 131072 epsilon: 0.05850752859565793
Training...
episode: 3155 no of steps: 163 score: 952.0 avg score: 5.8405 memorylength: 131072 epsilon: 0.0584548955173598
Training...
episode: 3156 no of steps: 165 score: 768.0 avg score: 4.6545 memorylength: 131072 epsilon: 0.05840230978752216
Training...
episode: 3157 no of steps: 133 score: 409.0 avg score: 3.0752 memorylength: 131072 epsilon: 0.05834977136355051
Training...
episode: 3158 no of steps: 149 score: 502.0 avg score: 3.3691 memorylength: 131072 epsilon: 0.05829728020288876
Training...
episode: 3159 no of steps: 153 score: 678.0 avg score: 4.4314 memorylength: 131072 epsilon: 0.05824483626301909
Training...
episode: 3160 no of steps: 143 score: 792.0 avg score: 5.5385 memorylength: 131072 epsilon: 0.05819243950146185
Training...
episode: 3161 no of steps: 131 score: 744.0 avg score: 5.6794 memorylength: 131072 epsilon: 0.05814008987577568
Training...
episode: 3162 no of steps: 152 score: 903.0 avg score: 5.9408 memorylength: 131072 epsilon: 0.05808778734355739
Training...
episode: 3163 no of steps: 136 score: 756.0 avg score: 5.5588 memorylength: 131072 epsilon: 0.05803553186244195
Training...
episode: 3164 no of steps: 146 score: 622.0 avg score: 4.2603 memorylength: 131072 epsilon: 0.05798332339010238
Training...
episode: 3165 no of steps: 141 score: 984.0 avg score: 6.9787 memorylength: 131072 epsilon: 0.057931161884249814
Training...
episode: 3166 no of steps: 127 score: 728.0 avg score: 5.7323 memorylength: 131072 epsilon: 0.05787904730263346
Training...
episode: 3167 no of steps: 143 score: 972.0 avg score: 6.7972 memorylength: 131072 epsilon: 0.05782697960304048
Training...
episode: 3168 no of steps: 163 score: 1057.0 avg score: 6.4847 memorylength: 131072 epsilon: 0.05777495874329603
Training...
episode: 3169 no of steps: 149 score: 854.0 avg score: 5.7315 memorylength: 131072 epsilon: 0.05772298468126322
Training...
episode: 3170 no of steps: 172 score: 1031.0 avg score: 5.9942 memorylength: 131072 epsilon: 0.05767105737484308
Training...
episode: 3171 no of steps: 175 score: 1424.0 avg score: 8.1371 memorylength: 131072 epsilon: 0.057619176781974445
Training...
episode: 3172 no of steps: 178 score: 1498.0 avg score: 8.4157 memorylength: 131072 epsilon: 0.05756734286063406
Training...
episode: 3173 no of steps: 158 score: 961.0 avg score: 6.0823 memorylength: 131072 epsilon: 0.057515555568836425
Training...
episode: 3174 no of steps: 162 score: 1164.0 avg score: 7.1852 memorylength: 131072 epsilon: 0.05746381486463388
Training...
episode: 3175 no of steps: 167 score: 918.0 avg score: 5.497 memorylength: 131072 epsilon: 0.05741212070611639
Training...
episode: 3176 no of steps: 161 score: 736.0 avg score: 4.5714 memorylength: 131072 epsilon: 0.05736047305141172
Training...
episode: 3177 no of steps: 144 score: 856.0 avg score: 5.9444 memorylength: 131072 epsilon: 0.05730887185868527
Training...
episode: 3178 no of steps: 132 score: 979.0 avg score: 7.4167 memorylength: 131072 epsilon: 0.05725731708614004
Training...
episode: 3179 no of steps: 157 score: 1012.0 avg score: 6.4459 memorylength: 131072 epsilon: 0.05720580869201668
Training...
episode: 3180 no of steps: 142 score: 454.0 avg score: 3.1972 memorylength: 131072 epsilon: 0.057154346634593386
Training...
episode: 3181 no of steps: 159 score: 893.0 avg score: 5.6164 memorylength: 131072 epsilon: 0.05710293087218592
Training...
episode: 3182 no of steps: 165 score: 827.0 avg score: 5.0121 memorylength: 131072 epsilon: 0.05705156136314745
Training...
episode: 3183 no of steps: 158 score: 453.0 avg score: 2.8671 memorylength: 131072 epsilon: 0.05700023806586871
Training...
episode: 3184 no of steps: 150 score: 978.0 avg score: 6.52 memorylength: 131072 epsilon: 0.05694896093877784
Training...
episode: 3185 no of steps: 149 score: 432.0 avg score: 2.8993 memorylength: 131072 epsilon: 0.05689772994034033
Training...
episode: 3186 no of steps: 159 score: 1141.0 avg score: 7.1761 memorylength: 131072 epsilon: 0.05684654502905907
Training...
episode: 3187 no of steps: 154 score: 1101.0 avg score: 7.1494 memorylength: 131072 epsilon: 0.056795406163474296
Training...
episode: 3188 no of steps: 153 score: 711.0 avg score: 4.6471 memorylength: 131072 epsilon: 0.05674431330216354
Training...
episode: 3189 no of steps: 157 score: 1118.0 avg score: 7.121 memorylength: 131072 epsilon: 0.05669326640374155
Training...
episode: 3190 no of steps: 160 score: 1340.0 avg score: 8.375 memorylength: 131072 epsilon: 0.056642265426860336
Training...
episode: 3191 no of steps: 170 score: 623.0 avg score: 3.6647 memorylength: 131072 epsilon: 0.056591310330209116
Training...
episode: 3192 no of steps: 151 score: 503.0 avg score: 3.3311 memorylength: 131072 epsilon: 0.05654040107251428
Training...
episode: 3193 no of steps: 141 score: 278.0 avg score: 1.9716 memorylength: 131072 epsilon: 0.05648953761253929
Training...
episode: 3194 no of steps: 143 score: 566.0 avg score: 3.958 memorylength: 131072 epsilon: 0.05643871990908474
Training...
episode: 3195 no of steps: 145 score: 502.0 avg score: 3.4621 memorylength: 131072 epsilon: 0.056387947920988335
Training...
episode: 3196 no of steps: 145 score: 369.0 avg score: 2.5448 memorylength: 131072 epsilon: 0.056337221607124705
Training...
episode: 3197 no of steps: 151 score: 767.0 avg score: 5.0795 memorylength: 131072 epsilon: 0.05628654092640556
Training...
episode: 3198 no of steps: 164 score: 1174.0 avg score: 7.1585 memorylength: 131072 epsilon: 0.056235905837779536
Training...
episode: 3199 no of steps: 159 score: 871.0 avg score: 5.478 memorylength: 131072 epsilon: 0.05618531630023224
Training...
episode: 3200 no of steps: 172 score: 802.0 avg score: 4.6628 memorylength: 131072 epsilon: 0.0561347722727861
saving states...
Training...
episode: 3201 no of steps: 170 score: 1099.0 avg score: 6.4647 memorylength: 131072 epsilon: 0.05608427371450047
Training...
episode: 3202 no of steps: 169 score: 792.0 avg score: 4.6864 memorylength: 131072 epsilon: 0.056033820584471504
Training...
episode: 3203 no of steps: 165 score: 1150.0 avg score: 6.9697 memorylength: 131072 epsilon: 0.055983412841832204
Training...
episode: 3204 no of steps: 174 score: 591.0 avg score: 3.3966 memorylength: 131072 epsilon: 0.05593305044575225
Training...
episode: 3205 no of steps: 140 score: 795.0 avg score: 5.6786 memorylength: 131072 epsilon: 0.05588273335543811
Training...
episode: 3206 no of steps: 178 score: 966.0 avg score: 5.427 memorylength: 131072 epsilon: 0.05583246153013297
Training...
episode: 3207 no of steps: 150 score: 975.0 avg score: 6.5 memorylength: 131072 epsilon: 0.055782234929116596
Training...
episode: 3208 no of steps: 159 score: 972.0 avg score: 6.1132 memorylength: 131072 epsilon: 0.055732053511705466
Training...
episode: 3209 no of steps: 144 score: 962.0 avg score: 6.6806 memorylength: 131072 epsilon: 0.055681917237252625
Training...
episode: 3210 no of steps: 142 score: 193.0 avg score: 1.3592 memorylength: 131072 epsilon: 0.055631826065147716
Training...
episode: 3211 no of steps: 143 score: 1040.0 avg score: 7.2727 memorylength: 131072 epsilon: 0.05558177995481684
Training...
episode: 3212 no of steps: 127 score: 508.0 avg score: 4.0 memorylength: 131072 epsilon: 0.05553177886572267
Training...
episode: 3213 no of steps: 144 score: 730.0 avg score: 5.0694 memorylength: 131072 epsilon: 0.05548182275736433
Training...
episode: 3214 no of steps: 142 score: 773.0 avg score: 5.4437 memorylength: 131072 epsilon: 0.05543191158927734
Training...
episode: 3215 no of steps: 148 score: 682.0 avg score: 4.6081 memorylength: 131072 epsilon: 0.05538204532103366
Training...
episode: 3216 no of steps: 155 score: 1012.0 avg score: 6.529 memorylength: 131072 epsilon: 0.05533222391224163
Training...
episode: 3217 no of steps: 161 score: 1434.0 avg score: 8.9068 memorylength: 131072 epsilon: 0.05528244732254591
Training...
episode: 3218 no of steps: 174 score: 932.0 avg score: 5.3563 memorylength: 131072 epsilon: 0.05523271551162742
Training...
episode: 3219 no of steps: 166 score: 957.0 avg score: 5.7651 memorylength: 131072 epsilon: 0.055183028439203426
Training...
episode: 3220 no of steps: 177 score: 880.0 avg score: 4.9718 memorylength: 131072 epsilon: 0.05513338606502737
Training...
episode: 3221 no of steps: 194 score: 898.0 avg score: 4.6289 memorylength: 131072 epsilon: 0.055083788348888975
Training...
episode: 3222 no of steps: 212 score: 1190.0 avg score: 5.6132 memorylength: 131072 epsilon: 0.05503423525061403
Training...
episode: 3223 no of steps: 180 score: 591.0 avg score: 3.2833 memorylength: 131072 epsilon: 0.05498472673006454
Training...
episode: 3224 no of steps: 170 score: 828.0 avg score: 4.8706 memorylength: 131072 epsilon: 0.054935262747138634
Training...
episode: 3225 no of steps: 200 score: 765.0 avg score: 3.825 memorylength: 131072 epsilon: 0.05488584326177043
Training...
episode: 3226 no of steps: 153 score: 1146.0 avg score: 7.4902 memorylength: 131072 epsilon: 0.05483646823393017
Training...
episode: 3227 no of steps: 142 score: 1028.0 avg score: 7.2394 memorylength: 131072 epsilon: 0.05478713762362408
Training...
episode: 3228 no of steps: 142 score: 967.0 avg score: 6.8099 memorylength: 131072 epsilon: 0.05473785139089439
Training...
episode: 3229 no of steps: 130 score: 841.0 avg score: 6.4692 memorylength: 131072 epsilon: 0.05468860949581919
Training...
episode: 3230 no of steps: 139 score: 450.0 avg score: 3.2374 memorylength: 131072 epsilon: 0.05463941189851257
Training...
episode: 3231 no of steps: 142 score: 925.0 avg score: 6.5141 memorylength: 131072 epsilon: 0.0545902585591245
Training...
episode: 3232 no of steps: 152 score: 657.0 avg score: 4.3224 memorylength: 131072 epsilon: 0.054541149437840726
Training...
episode: 3233 no of steps: 147 score: 1014.0 avg score: 6.898 memorylength: 131072 epsilon: 0.054492084494882874
Training...
episode: 3234 no of steps: 162 score: 226.0 avg score: 1.3951 memorylength: 131072 epsilon: 0.05444306369050835
Training...
episode: 3235 no of steps: 149 score: 369.0 avg score: 2.4765 memorylength: 131072 epsilon: 0.05439408698501031
Training...
episode: 3236 no of steps: 147 score: 476.0 avg score: 3.2381 memorylength: 131072 epsilon: 0.05434515433871758
Training...
episode: 3237 no of steps: 154 score: 816.0 avg score: 5.2987 memorylength: 131072 epsilon: 0.05429626571199474
Training...
episode: 3238 no of steps: 188 score: 1050.0 avg score: 5.5851 memorylength: 131072 epsilon: 0.05424742106524198
Training...
episode: 3239 no of steps: 188 score: 786.0 avg score: 4.1809 memorylength: 131072 epsilon: 0.054198620358895194
Training...
episode: 3240 no of steps: 173 score: 813.0 avg score: 4.6994 memorylength: 131072 epsilon: 0.05414986355342573
Training...
episode: 3241 no of steps: 186 score: 1005.0 avg score: 5.4032 memorylength: 131072 epsilon: 0.05410115060934059
Training...
episode: 3242 no of steps: 225 score: 976.0 avg score: 4.3378 memorylength: 131072 epsilon: 0.05405248148718234
Training...
episode: 3243 no of steps: 202 score: 1134.0 avg score: 5.6139 memorylength: 131072 epsilon: 0.05400385614752892
Training...
episode: 3244 no of steps: 186 score: 696.0 avg score: 3.7419 memorylength: 131072 epsilon: 0.053955274550993845
Training...
episode: 3245 no of steps: 179 score: 480.0 avg score: 2.6816 memorylength: 131072 epsilon: 0.05390673665822599
Training...
episode: 3246 no of steps: 155 score: 565.0 avg score: 3.6452 memorylength: 131072 epsilon: 0.05385824242990971
Training...
episode: 3247 no of steps: 161 score: 274.0 avg score: 1.7019 memorylength: 131072 epsilon: 0.05380979182676462
Training...
episode: 3248 no of steps: 137 score: 427.0 avg score: 3.1168 memorylength: 131072 epsilon: 0.05376138480954574
Training...
episode: 3249 no of steps: 147 score: 313.0 avg score: 2.1293 memorylength: 131072 epsilon: 0.05371302133904343
Training...
episode: 3250 no of steps: 133 score: 230.0 avg score: 1.7293 memorylength: 131072 epsilon: 0.053664701376083215
saving states...
Training...
episode: 3251 no of steps: 143 score: 562.0 avg score: 3.9301 memorylength: 131072 epsilon: 0.053616424881525945
Training...
episode: 3252 no of steps: 144 score: 139.0 avg score: 0.9653 memorylength: 131072 epsilon: 0.053568191816267666
Training...
episode: 3253 no of steps: 158 score: 854.0 avg score: 5.4051 memorylength: 131072 epsilon: 0.05352000214123961
Training...
episode: 3254 no of steps: 145 score: 911.0 avg score: 6.2828 memorylength: 131072 epsilon: 0.053471855817408084
Training...
episode: 3255 no of steps: 163 score: 1035.0 avg score: 6.3497 memorylength: 131072 epsilon: 0.0534237528057746
Training...
episode: 3256 no of steps: 162 score: 993.0 avg score: 6.1296 memorylength: 131072 epsilon: 0.05337569306737571
Training...
episode: 3257 no of steps: 160 score: 926.0 avg score: 5.7875 memorylength: 131072 epsilon: 0.05332767656328304
Training...
episode: 3258 no of steps: 177 score: 945.0 avg score: 5.339 memorylength: 131072 epsilon: 0.05327970325460319
Training...
episode: 3259 no of steps: 167 score: 1064.0 avg score: 6.3713 memorylength: 131072 epsilon: 0.05323177310247777
Training...
episode: 3260 no of steps: 177 score: 772.0 avg score: 4.3616 memorylength: 131072 epsilon: 0.05318388606808342
Training...
episode: 3261 no of steps: 170 score: 829.0 avg score: 4.8765 memorylength: 131072 epsilon: 0.05313604211263155
Training...
episode: 3262 no of steps: 151 score: 998.0 avg score: 6.6093 memorylength: 131072 epsilon: 0.053088241197368616
Training...
episode: 3263 no of steps: 148 score: 629.0 avg score: 4.25 memorylength: 131072 epsilon: 0.053040483283575836
Training...
episode: 3264 no of steps: 127 score: 503.0 avg score: 3.9606 memorylength: 131072 epsilon: 0.05299276833256935
Training...
episode: 3265 no of steps: 139 score: 652.0 avg score: 4.6906 memorylength: 131072 epsilon: 0.05294509630569998
Training...
episode: 3266 no of steps: 137 score: 930.0 avg score: 6.7883 memorylength: 131072 epsilon: 0.052897467164353416
Training...
episode: 3267 no of steps: 154 score: 814.0 avg score: 5.2857 memorylength: 131072 epsilon: 0.05284988086995005
Training...
episode: 3268 no of steps: 134 score: 728.0 avg score: 5.4328 memorylength: 131072 epsilon: 0.052802337383945
Training...
episode: 3269 no of steps: 160 score: 620.0 avg score: 3.875 memorylength: 131072 epsilon: 0.052754836667827994
Training...
episode: 3270 no of steps: 172 score: 868.0 avg score: 5.0465 memorylength: 131072 epsilon: 0.052707378683123474
Training...
episode: 3271 no of steps: 169 score: 952.0 avg score: 5.6331 memorylength: 131072 epsilon: 0.052659963391390494
Training...
episode: 3272 no of steps: 161 score: 944.0 avg score: 5.8634 memorylength: 131072 epsilon: 0.05261259075422261
Training...
episode: 3273 no of steps: 164 score: 999.0 avg score: 6.0915 memorylength: 131072 epsilon: 0.05256526073324802
Training...
episode: 3274 no of steps: 169 score: 575.0 avg score: 3.4024 memorylength: 131072 epsilon: 0.052517973290129395
Training...
episode: 3275 no of steps: 162 score: 1011.0 avg score: 6.2407 memorylength: 131072 epsilon: 0.05247072838656393
Training...
episode: 3276 no of steps: 163 score: 776.0 avg score: 4.7607 memorylength: 131072 epsilon: 0.0524235259842832
Training...
episode: 3277 no of steps: 164 score: 897.0 avg score: 5.4695 memorylength: 131072 epsilon: 0.052376366045053295
Training...
episode: 3278 no of steps: 147 score: 754.0 avg score: 5.1293 memorylength: 131072 epsilon: 0.052329248530674666
Training...
episode: 3279 no of steps: 153 score: 1056.0 avg score: 6.902 memorylength: 131072 epsilon: 0.052282173402982086
Training...
episode: 3280 no of steps: 140 score: 821.0 avg score: 5.8643 memorylength: 131072 epsilon: 0.05223514062384472
Training...
episode: 3281 no of steps: 135 score: 737.0 avg score: 5.4593 memorylength: 131072 epsilon: 0.05218815015516602
Training...
episode: 3282 no of steps: 120 score: 809.0 avg score: 6.7417 memorylength: 131072 epsilon: 0.052141201958883714
Training...
episode: 3283 no of steps: 135 score: 748.0 avg score: 5.5407 memorylength: 131072 epsilon: 0.05209429599696973
Training...
episode: 3284 no of steps: 134 score: 384.0 avg score: 2.8657 memorylength: 131072 epsilon: 0.05204743223143024
Training...
episode: 3285 no of steps: 147 score: 878.0 avg score: 5.9728 memorylength: 131072 epsilon: 0.05200061062430561
Training...
episode: 3286 no of steps: 164 score: 621.0 avg score: 3.7866 memorylength: 131072 epsilon: 0.05195383113767036
Training...
episode: 3287 no of steps: 156 score: 634.0 avg score: 4.0641 memorylength: 131072 epsilon: 0.05190709373363304
Training...
episode: 3288 no of steps: 189 score: 996.0 avg score: 5.2698 memorylength: 131072 epsilon: 0.05186039837433638
Training...
episode: 3289 no of steps: 220 score: 1321.0 avg score: 6.0045 memorylength: 131072 epsilon: 0.05181374502195717
Training...
episode: 3290 no of steps: 184 score: 845.0 avg score: 4.5924 memorylength: 131072 epsilon: 0.05176713363870613
Training...
episode: 3291 no of steps: 168 score: 1192.0 avg score: 7.0952 memorylength: 131072 epsilon: 0.05172056418682807
Training...
episode: 3292 no of steps: 173 score: 1367.0 avg score: 7.9017 memorylength: 131072 epsilon: 0.05167403662860173
Training...
episode: 3293 no of steps: 156 score: 953.0 avg score: 6.109 memorylength: 131072 epsilon: 0.05162755092633981
Training...
episode: 3294 no of steps: 165 score: 764.0 avg score: 4.6303 memorylength: 131072 epsilon: 0.05158110704238884
Training...
episode: 3295 no of steps: 142 score: 1219.0 avg score: 8.5845 memorylength: 131072 epsilon: 0.05153470493912929
Training...
episode: 3296 no of steps: 129 score: 812.0 avg score: 6.2946 memorylength: 131072 epsilon: 0.051488344578975484
Training...
episode: 3297 no of steps: 131 score: 665.0 avg score: 5.0763 memorylength: 131072 epsilon: 0.05144202592437548
Training...
episode: 3298 no of steps: 136 score: 1080.0 avg score: 7.9412 memorylength: 131072 epsilon: 0.05139574893781119
Training...
episode: 3299 no of steps: 141 score: 710.0 avg score: 5.0355 memorylength: 131072 epsilon: 0.05134951358179824
Training...
episode: 3300 no of steps: 154 score: 827.0 avg score: 5.3701 memorylength: 131072 epsilon: 0.05130331981888603
saving states...
Training...
episode: 3301 no of steps: 140 score: 450.0 avg score: 3.2143 memorylength: 131072 epsilon: 0.05125716761165755
Training...
episode: 3302 no of steps: 143 score: 386.0 avg score: 2.6993 memorylength: 131072 epsilon: 0.05121105692272954
Training...
episode: 3303 no of steps: 142 score: 318.0 avg score: 2.2394 memorylength: 131072 epsilon: 0.05116498771475234
Training...
episode: 3304 no of steps: 163 score: 460.0 avg score: 2.8221 memorylength: 131072 epsilon: 0.05111895995040991
Training...
episode: 3305 no of steps: 141 score: 468.0 avg score: 3.3191 memorylength: 131072 epsilon: 0.051072973592419704
Training...
episode: 3306 no of steps: 176 score: 773.0 avg score: 4.392 memorylength: 131072 epsilon: 0.05102702860353281
Training...
episode: 3307 no of steps: 162 score: 1133.0 avg score: 6.9938 memorylength: 131072 epsilon: 0.05098112494653379
Training...
episode: 3308 no of steps: 167 score: 685.0 avg score: 4.1018 memorylength: 131072 epsilon: 0.05093526258424065
Training...
episode: 3309 no of steps: 197 score: 909.0 avg score: 4.6142 memorylength: 131072 epsilon: 0.05088944147950488
Training...
episode: 3310 no of steps: 168 score: 911.0 avg score: 5.4226 memorylength: 131072 epsilon: 0.0508436615952114
Training...
episode: 3311 no of steps: 190 score: 1255.0 avg score: 6.6053 memorylength: 131072 epsilon: 0.0507979228942785
Training...
episode: 3312 no of steps: 200 score: 1205.0 avg score: 6.025 memorylength: 131072 epsilon: 0.05075222533965781
Training...
episode: 3313 no of steps: 195 score: 747.0 avg score: 3.8308 memorylength: 131072 epsilon: 0.050706568894334315
Training...
episode: 3314 no of steps: 191 score: 589.0 avg score: 3.0838 memorylength: 131072 epsilon: 0.0506609535213263
Training...
episode: 3315 no of steps: 167 score: 647.0 avg score: 3.8743 memorylength: 131072 epsilon: 0.050615379183685326
Training...
episode: 3316 no of steps: 152 score: 225.0 avg score: 1.4803 memorylength: 131072 epsilon: 0.05056984584449614
Training...
episode: 3317 no of steps: 157 score: 585.0 avg score: 3.7261 memorylength: 131072 epsilon: 0.050524353466876754
Training...
episode: 3318 no of steps: 148 score: 798.0 avg score: 5.3919 memorylength: 131072 epsilon: 0.05047890201397836
Training...
episode: 3319 no of steps: 129 score: 295.0 avg score: 2.2868 memorylength: 131072 epsilon: 0.05043349144898523
Training...
episode: 3320 no of steps: 146 score: 575.0 avg score: 3.9384 memorylength: 131072 epsilon: 0.05038812173511484
Training...
episode: 3321 no of steps: 138 score: 396.0 avg score: 2.8696 memorylength: 131072 epsilon: 0.050342792835617704
Training...
episode: 3322 no of steps: 135 score: 840.0 avg score: 6.2222 memorylength: 131072 epsilon: 0.05029750471377744
Training...
episode: 3323 no of steps: 143 score: 719.0 avg score: 5.028 memorylength: 131072 epsilon: 0.05025225733291062
Training...
episode: 3324 no of steps: 132 score: 657.0 avg score: 4.9773 memorylength: 131072 epsilon: 0.05020705065636689
Training...
episode: 3325 no of steps: 156 score: 1080.0 avg score: 6.9231 memorylength: 131072 epsilon: 0.05016188464752886
Training...
episode: 3326 no of steps: 158 score: 1200.0 avg score: 7.5949 memorylength: 131072 epsilon: 0.05011675926981201
Training...
episode: 3327 no of steps: 181 score: 1532.0 avg score: 8.4641 memorylength: 131072 epsilon: 0.05007167448666481
Training...
episode: 3328 no of steps: 180 score: 1143.0 avg score: 6.35 memorylength: 131072 epsilon: 0.05002663026156859
Training...
episode: 3329 no of steps: 202 score: 929.0 avg score: 4.599 memorylength: 131072 epsilon: 0.04998162655803753
Training...
episode: 3330 no of steps: 176 score: 1057.0 avg score: 6.0057 memorylength: 131072 epsilon: 0.049936663339618596
Training...
episode: 3331 no of steps: 180 score: 1066.0 avg score: 5.9222 memorylength: 131072 epsilon: 0.0498917405698916
Training...
episode: 3332 no of steps: 191 score: 1008.0 avg score: 5.2775 memorylength: 131072 epsilon: 0.04984685821246909
Training...
episode: 3333 no of steps: 153 score: 886.0 avg score: 5.7908 memorylength: 131072 epsilon: 0.04980201623099638
Training...
episode: 3334 no of steps: 150 score: 630.0 avg score: 4.2 memorylength: 131072 epsilon: 0.049757214589151416
Training...
episode: 3335 no of steps: 130 score: 467.0 avg score: 3.5923 memorylength: 131072 epsilon: 0.04971245325064489
Training...
episode: 3336 no of steps: 125 score: 111.0 avg score: 0.888 memorylength: 131072 epsilon: 0.049667732179220145
Training...
episode: 3337 no of steps: 151 score: 517.0 avg score: 3.4238 memorylength: 131072 epsilon: 0.04962305133865305
Training...
episode: 3338 no of steps: 150 score: 710.0 avg score: 4.7333 memorylength: 131072 epsilon: 0.04957841069275216
Training...
episode: 3339 no of steps: 161 score: 439.0 avg score: 2.7267 memorylength: 131072 epsilon: 0.04953381020535853
Training...
episode: 3340 no of steps: 175 score: 619.0 avg score: 3.5371 memorylength: 131072 epsilon: 0.049489249840345806
Training...
episode: 3341 no of steps: 166 score: 714.0 avg score: 4.3012 memorylength: 131072 epsilon: 0.04944472956162003
Training...
episode: 3342 no of steps: 163 score: 1081.0 avg score: 6.6319 memorylength: 131072 epsilon: 0.04940024933311981
Training...
episode: 3343 no of steps: 136 score: 570.0 avg score: 4.1912 memorylength: 131072 epsilon: 0.049355809118816166
Training...
episode: 3344 no of steps: 150 score: 745.0 avg score: 4.9667 memorylength: 131072 epsilon: 0.049311408882712494
Training...
episode: 3345 no of steps: 145 score: 601.0 avg score: 4.1448 memorylength: 131072 epsilon: 0.049267048588844606
Training...
episode: 3346 no of steps: 156 score: 778.0 avg score: 4.9872 memorylength: 131072 epsilon: 0.049222728201280666
Training...
episode: 3347 no of steps: 154 score: 810.0 avg score: 5.2597 memorylength: 131072 epsilon: 0.04917844768412119
Training...
episode: 3348 no of steps: 162 score: 928.0 avg score: 5.7284 memorylength: 131072 epsilon: 0.049134207001498904
Training...
episode: 3349 no of steps: 156 score: 1178.0 avg score: 7.5513 memorylength: 131072 epsilon: 0.04909000611757887
Training...
episode: 3350 no of steps: 143 score: 838.0 avg score: 5.8601 memorylength: 131072 epsilon: 0.049045844996558376
saving states...
Training...
episode: 3351 no of steps: 154 score: 694.0 avg score: 4.5065 memorylength: 131072 epsilon: 0.049001723602666934
Training...
episode: 3352 no of steps: 134 score: 777.0 avg score: 5.7985 memorylength: 131072 epsilon: 0.04895764190016617
Training...
episode: 3353 no of steps: 143 score: 697.0 avg score: 4.8741 memorylength: 131072 epsilon: 0.04891359985334992
Training...
episode: 3354 no of steps: 127 score: 318.0 avg score: 2.5039 memorylength: 131072 epsilon: 0.04886959742654414
Training...
episode: 3355 no of steps: 152 score: 634.0 avg score: 4.1711 memorylength: 131072 epsilon: 0.04882563458410683
Training...
episode: 3356 no of steps: 138 score: 603.0 avg score: 4.3696 memorylength: 131072 epsilon: 0.04878171129042811
Training...
episode: 3357 no of steps: 153 score: 751.0 avg score: 4.9085 memorylength: 131072 epsilon: 0.0487378275099301
Training...
episode: 3358 no of steps: 148 score: 1118.0 avg score: 7.5541 memorylength: 131072 epsilon: 0.04869398320706696
Training...
episode: 3359 no of steps: 167 score: 976.0 avg score: 5.8443 memorylength: 131072 epsilon: 0.04865017834632475
Training...
episode: 3360 no of steps: 176 score: 1294.0 avg score: 7.3523 memorylength: 131072 epsilon: 0.04860641289222157
Training...
episode: 3361 no of steps: 206 score: 695.0 avg score: 3.3738 memorylength: 131072 epsilon: 0.04856268680930741
Training...
episode: 3362 no of steps: 169 score: 1102.0 avg score: 6.5207 memorylength: 131072 epsilon: 0.04851900006216409
Training...
episode: 3363 no of steps: 186 score: 1116.0 avg score: 6.0 memorylength: 131072 epsilon: 0.048475352615405386
Training...
episode: 3364 no of steps: 143 score: 857.0 avg score: 5.993 memorylength: 131072 epsilon: 0.04843174443367684
Training...
episode: 3365 no of steps: 170 score: 513.0 avg score: 3.0176 memorylength: 131072 epsilon: 0.04838817548165586
Training...
episode: 3366 no of steps: 174 score: 867.0 avg score: 4.9828 memorylength: 131072 epsilon: 0.048344645724051546
Training...
episode: 3367 no of steps: 166 score: 973.0 avg score: 5.8614 memorylength: 131072 epsilon: 0.04830115512560482
Training...
episode: 3368 no of steps: 140 score: 687.0 avg score: 4.9071 memorylength: 131072 epsilon: 0.04825770365108827
Training...
episode: 3369 no of steps: 171 score: 1059.0 avg score: 6.193 memorylength: 131072 epsilon: 0.04821429126530624
Training...
episode: 3370 no of steps: 148 score: 925.0 avg score: 6.25 memorylength: 131072 epsilon: 0.04817091793309466
Training...
episode: 3371 no of steps: 164 score: 1369.0 avg score: 8.3476 memorylength: 131072 epsilon: 0.04812758361932113
Training...
episode: 3372 no of steps: 156 score: 1419.0 avg score: 9.0962 memorylength: 131072 epsilon: 0.04808428828888489
Training...
episode: 3373 no of steps: 138 score: 1016.0 avg score: 7.3623 memorylength: 131072 epsilon: 0.048041031906716665
Training...
episode: 3374 no of steps: 148 score: 849.0 avg score: 5.7365 memorylength: 131072 epsilon: 0.04799781443777882
Training...
episode: 3375 no of steps: 154 score: 537.0 avg score: 3.487 memorylength: 131072 epsilon: 0.04795463584706519
Training...
episode: 3376 no of steps: 146 score: 926.0 avg score: 6.3425 memorylength: 131072 epsilon: 0.04791149609960114
Training...
episode: 3377 no of steps: 147 score: 837.0 avg score: 5.6939 memorylength: 131072 epsilon: 0.047868395160443424
Training...
episode: 3378 no of steps: 137 score: 483.0 avg score: 3.5255 memorylength: 131072 epsilon: 0.04782533299468031
Training...
episode: 3379 no of steps: 168 score: 884.0 avg score: 5.2619 memorylength: 131072 epsilon: 0.04778230956743143
Training...
episode: 3380 no of steps: 183 score: 1103.0 avg score: 6.0273 memorylength: 131072 epsilon: 0.047739324843847845
Training...
episode: 3381 no of steps: 179 score: 897.0 avg score: 5.0112 memorylength: 131072 epsilon: 0.04769637878911186
Training...
episode: 3382 no of steps: 176 score: 1034.0 avg score: 5.875 memorylength: 131072 epsilon: 0.04765347136843721
Training...
episode: 3383 no of steps: 171 score: 1108.0 avg score: 6.4795 memorylength: 131072 epsilon: 0.04761060254706889
Training...
episode: 3384 no of steps: 196 score: 1107.0 avg score: 5.648 memorylength: 131072 epsilon: 0.04756777229028312
Training...
episode: 3385 no of steps: 159 score: 674.0 avg score: 4.239 memorylength: 131072 epsilon: 0.0475249805633874
Training...
episode: 3386 no of steps: 171 score: 1018.0 avg score: 5.9532 memorylength: 131072 epsilon: 0.047482227331720445
Training...
episode: 3387 no of steps: 157 score: 904.0 avg score: 5.758 memorylength: 131072 epsilon: 0.04743951256065214
Training...
episode: 3388 no of steps: 158 score: 1266.0 avg score: 8.0127 memorylength: 131072 epsilon: 0.04739683621558348
Training...
episode: 3389 no of steps: 137 score: 1038.0 avg score: 7.5766 memorylength: 131072 epsilon: 0.047354198261946645
Training...
episode: 3390 no of steps: 137 score: 585.0 avg score: 4.2701 memorylength: 131072 epsilon: 0.047311598665204915
Training...
episode: 3391 no of steps: 152 score: 1093.0 avg score: 7.1908 memorylength: 131072 epsilon: 0.047269037390852565
Training...
episode: 3392 no of steps: 132 score: 720.0 avg score: 5.4545 memorylength: 131072 epsilon: 0.04722651440441499
Training...
episode: 3393 no of steps: 145 score: 740.0 avg score: 5.1034 memorylength: 131072 epsilon: 0.047184029671448566
Training...
episode: 3394 no of steps: 140 score: 697.0 avg score: 4.9786 memorylength: 131072 epsilon: 0.04714158315754068
Training...
episode: 3395 no of steps: 133 score: 576.0 avg score: 4.3308 memorylength: 131072 epsilon: 0.0470991748283096
Training...
episode: 3396 no of steps: 141 score: 409.0 avg score: 2.9007 memorylength: 131072 epsilon: 0.047056804649404614
Training...
episode: 3397 no of steps: 173 score: 847.0 avg score: 4.896 memorylength: 131072 epsilon: 0.047014472586505866
Training...
episode: 3398 no of steps: 151 score: 647.0 avg score: 4.2848 memorylength: 131072 epsilon: 0.0469721786053244
Training...
episode: 3399 no of steps: 191 score: 1034.0 avg score: 5.4136 memorylength: 131072 epsilon: 0.04692992267160205
Training...
episode: 3400 no of steps: 170 score: 634.0 avg score: 3.7294 memorylength: 131072 epsilon: 0.046887704751111536
saving states...
Training...
episode: 3401 no of steps: 170 score: 1195.0 avg score: 7.0294 memorylength: 131072 epsilon: 0.04684552480965635
Training...
episode: 3402 no of steps: 184 score: 890.0 avg score: 4.837 memorylength: 131072 epsilon: 0.0468033828130707
Training...
episode: 3403 no of steps: 174 score: 902.0 avg score: 5.1839 memorylength: 131072 epsilon: 0.04676127872721959
Training...
episode: 3404 no of steps: 157 score: 873.0 avg score: 5.5605 memorylength: 131072 epsilon: 0.0467192125179987
Training...
episode: 3405 no of steps: 169 score: 1008.0 avg score: 5.9645 memorylength: 131072 epsilon: 0.046677184151334435
Training...
episode: 3406 no of steps: 178 score: 659.0 avg score: 3.7022 memorylength: 131072 epsilon: 0.04663519359318376
Training...
episode: 3407 no of steps: 170 score: 441.0 avg score: 2.5941 memorylength: 131072 epsilon: 0.04659324080953434
Training...
episode: 3408 no of steps: 165 score: 625.0 avg score: 3.7879 memorylength: 131072 epsilon: 0.04655132576640445
Training...
episode: 3409 no of steps: 170 score: 782.0 avg score: 4.6 memorylength: 131072 epsilon: 0.04650944842984285
Training...
episode: 3410 no of steps: 142 score: 444.0 avg score: 3.1268 memorylength: 131072 epsilon: 0.04646760876592893
Training...
episode: 3411 no of steps: 130 score: 282.0 avg score: 2.1692 memorylength: 131072 epsilon: 0.04642580674077255
Training...
episode: 3412 no of steps: 123 score: 450.0 avg score: 3.6585 memorylength: 131072 epsilon: 0.04638404232051408
Training...
episode: 3413 no of steps: 147 score: 810.0 avg score: 5.5102 memorylength: 131072 epsilon: 0.04634231547132431
Training...
episode: 3414 no of steps: 165 score: 628.0 avg score: 3.8061 memorylength: 131072 epsilon: 0.0463006261594045
Training...
episode: 3415 no of steps: 141 score: 425.0 avg score: 3.0142 memorylength: 131072 epsilon: 0.04625897435098632
Training...
episode: 3416 no of steps: 136 score: 486.0 avg score: 3.5735 memorylength: 131072 epsilon: 0.04621736001233181
Training...
episode: 3417 no of steps: 150 score: 990.0 avg score: 6.6 memorylength: 131072 epsilon: 0.04617578310973332
Training...
episode: 3418 no of steps: 137 score: 863.0 avg score: 6.2993 memorylength: 131072 epsilon: 0.046134243609513556
Training...
episode: 3419 no of steps: 140 score: 720.0 avg score: 5.1429 memorylength: 131072 epsilon: 0.04609274147802558
Training...
episode: 3420 no of steps: 151 score: 1152.0 avg score: 7.6291 memorylength: 131072 epsilon: 0.04605127668165259
Training...
episode: 3421 no of steps: 170 score: 1053.0 avg score: 6.1941 memorylength: 131072 epsilon: 0.04600984918680814
Training...
episode: 3422 no of steps: 160 score: 990.0 avg score: 6.1875 memorylength: 131072 epsilon: 0.04596845895993593
Training...
episode: 3423 no of steps: 170 score: 1255.0 avg score: 7.3824 memorylength: 131072 epsilon: 0.04592710596750992
Training...
episode: 3424 no of steps: 187 score: 1299.0 avg score: 6.9465 memorylength: 131072 epsilon: 0.04588579017603414
Training...
episode: 3425 no of steps: 186 score: 812.0 avg score: 4.3656 memorylength: 131072 epsilon: 0.045844511552042805
Training...
episode: 3426 no of steps: 151 score: 916.0 avg score: 6.0662 memorylength: 131072 epsilon: 0.04580327006210026
Training...
episode: 3427 no of steps: 170 score: 963.0 avg score: 5.6647 memorylength: 131072 epsilon: 0.04576206567280084
Training...
episode: 3428 no of steps: 170 score: 673.0 avg score: 3.9588 memorylength: 131072 epsilon: 0.04572089835076903
Training...
episode: 3429 no of steps: 195 score: 885.0 avg score: 4.5385 memorylength: 131072 epsilon: 0.045679768062659276
Training...
episode: 3430 no of steps: 180 score: 872.0 avg score: 4.8444 memorylength: 131072 epsilon: 0.04563867477515606
Training...
episode: 3431 no of steps: 134 score: 850.0 avg score: 6.3433 memorylength: 131072 epsilon: 0.04559761845497381
Training...
episode: 3432 no of steps: 151 score: 435.0 avg score: 2.8808 memorylength: 131072 epsilon: 0.04555659906885688
Training...
episode: 3433 no of steps: 152 score: 650.0 avg score: 4.2763 memorylength: 131072 epsilon: 0.045515616583579596
Training...
episode: 3434 no of steps: 153 score: 618.0 avg score: 4.0392 memorylength: 131072 epsilon: 0.04547467096594616
Training...
episode: 3435 no of steps: 154 score: 945.0 avg score: 6.1364 memorylength: 131072 epsilon: 0.04543376218279056
Training...
episode: 3436 no of steps: 166 score: 472.0 avg score: 2.8434 memorylength: 131072 epsilon: 0.04539289020097672
Training...
episode: 3437 no of steps: 135 score: 738.0 avg score: 5.4667 memorylength: 131072 epsilon: 0.04535205498739834
Training...
episode: 3438 no of steps: 169 score: 692.0 avg score: 4.0947 memorylength: 131072 epsilon: 0.04531125650897887
Training...
episode: 3439 no of steps: 173 score: 1053.0 avg score: 6.0867 memorylength: 131072 epsilon: 0.045270494732671536
Training...
episode: 3440 no of steps: 130 score: 998.0 avg score: 7.6769 memorylength: 131072 epsilon: 0.04522976962545932
Training...
episode: 3441 no of steps: 158 score: 839.0 avg score: 5.3101 memorylength: 131072 epsilon: 0.04518908115435488
Training...
episode: 3442 no of steps: 163 score: 1008.0 avg score: 6.184 memorylength: 131072 epsilon: 0.045148429286400546
Training...
episode: 3443 no of steps: 153 score: 809.0 avg score: 5.2876 memorylength: 131072 epsilon: 0.04510781398866828
Training...
episode: 3444 no of steps: 156 score: 445.0 avg score: 2.8526 memorylength: 131072 epsilon: 0.045067235228259735
Training...
episode: 3445 no of steps: 144 score: 801.0 avg score: 5.5625 memorylength: 131072 epsilon: 0.04502669297230609
Training...
episode: 3446 no of steps: 129 score: 574.0 avg score: 4.4496 memorylength: 131072 epsilon: 0.0449861871879681
Training...
episode: 3447 no of steps: 142 score: 603.0 avg score: 4.2465 memorylength: 131072 epsilon: 0.044945717842436096
Training...
episode: 3448 no of steps: 130 score: 531.0 avg score: 4.0846 memorylength: 131072 epsilon: 0.04490528490292992
Training...
episode: 3449 no of steps: 128 score: 700.0 avg score: 5.4688 memorylength: 131072 epsilon: 0.04486488833669885
Training...
episode: 3450 no of steps: 133 score: 355.0 avg score: 2.6692 memorylength: 131072 epsilon: 0.04482452811102168
saving states...
Training...
episode: 3451 no of steps: 149 score: 724.0 avg score: 4.8591 memorylength: 131072 epsilon: 0.04478420419320664
Training...
episode: 3452 no of steps: 140 score: 841.0 avg score: 6.0071 memorylength: 131072 epsilon: 0.044743916550591366
Training...
episode: 3453 no of steps: 151 score: 1185.0 avg score: 7.8477 memorylength: 131072 epsilon: 0.04470366515054281
Training...
episode: 3454 no of steps: 156 score: 727.0 avg score: 4.6603 memorylength: 131072 epsilon: 0.04466344996045739
Training...
episode: 3455 no of steps: 167 score: 1210.0 avg score: 7.2455 memorylength: 131072 epsilon: 0.044623270947760786
Training...
episode: 3456 no of steps: 149 score: 967.0 avg score: 6.4899 memorylength: 131072 epsilon: 0.044583128079907976
Training...
episode: 3457 no of steps: 184 score: 774.0 avg score: 4.2065 memorylength: 131072 epsilon: 0.04454302132438324
Training...
episode: 3458 no of steps: 165 score: 823.0 avg score: 4.9879 memorylength: 131072 epsilon: 0.044502950648700114
Training...
episode: 3459 no of steps: 185 score: 740.0 avg score: 4.0 memorylength: 131072 epsilon: 0.04446291602040137
Training...
episode: 3460 no of steps: 168 score: 558.0 avg score: 3.3214 memorylength: 131072 epsilon: 0.044422917407058914
Training...
episode: 3461 no of steps: 174 score: 534.0 avg score: 3.069 memorylength: 131072 epsilon: 0.044382954776273895
Training...
episode: 3462 no of steps: 173 score: 669.0 avg score: 3.8671 memorylength: 131072 epsilon: 0.04434302809567656
Training...
episode: 3463 no of steps: 156 score: 601.0 avg score: 3.8526 memorylength: 131072 epsilon: 0.04430313733292633
Training...
episode: 3464 no of steps: 154 score: 846.0 avg score: 5.4935 memorylength: 131072 epsilon: 0.04426328245571164
Training...
episode: 3465 no of steps: 164 score: 1043.0 avg score: 6.3598 memorylength: 131072 epsilon: 0.044223463431750064
Training...
episode: 3466 no of steps: 144 score: 692.0 avg score: 4.8056 memorylength: 131072 epsilon: 0.0441836802287882
Training...
episode: 3467 no of steps: 137 score: 729.0 avg score: 5.3212 memorylength: 131072 epsilon: 0.04414393281460162
Training...
episode: 3468 no of steps: 132 score: 508.0 avg score: 3.8485 memorylength: 131072 epsilon: 0.04410422115699493
Training...
episode: 3469 no of steps: 137 score: 566.0 avg score: 4.1314 memorylength: 131072 epsilon: 0.04406454522380169
Training...
episode: 3470 no of steps: 143 score: 619.0 avg score: 4.3287 memorylength: 131072 epsilon: 0.044024904982884416
Training...
episode: 3471 no of steps: 139 score: 395.0 avg score: 2.8417 memorylength: 131072 epsilon: 0.04398530040213446
Training...
episode: 3472 no of steps: 135 score: 620.0 avg score: 4.5926 memorylength: 131072 epsilon: 0.043945731449472135
Training...
episode: 3473 no of steps: 163 score: 857.0 avg score: 5.2577 memorylength: 131072 epsilon: 0.04390619809284661
Training...
episode: 3474 no of steps: 140 score: 564.0 avg score: 4.0286 memorylength: 131072 epsilon: 0.04386670030023582
Training...
episode: 3475 no of steps: 154 score: 840.0 avg score: 5.4545 memorylength: 131072 epsilon: 0.04382723803964657
Training...
episode: 3476 no of steps: 153 score: 693.0 avg score: 4.5294 memorylength: 131072 epsilon: 0.04378781127911443
Training...
episode: 3477 no of steps: 174 score: 899.0 avg score: 5.1667 memorylength: 131072 epsilon: 0.043748419986703736
Training...
episode: 3478 no of steps: 170 score: 630.0 avg score: 3.7059 memorylength: 131072 epsilon: 0.0437090641305075
Training...
episode: 3479 no of steps: 164 score: 675.0 avg score: 4.1159 memorylength: 131072 epsilon: 0.04366974367864751
Training...
episode: 3480 no of steps: 192 score: 1179.0 avg score: 6.1406 memorylength: 131072 epsilon: 0.04363045859927418
Training...
episode: 3481 no of steps: 194 score: 1089.0 avg score: 5.6134 memorylength: 131072 epsilon: 0.043591208860566624
Training...
episode: 3482 no of steps: 217 score: 963.0 avg score: 4.4378 memorylength: 131072 epsilon: 0.04355199443073251
Training...
episode: 3483 no of steps: 175 score: 1300.0 avg score: 7.4286 memorylength: 131072 epsilon: 0.04351281527800816
Training...
episode: 3484 no of steps: 162 score: 826.0 avg score: 5.0988 memorylength: 131072 epsilon: 0.04347367137065849
Training...
episode: 3485 no of steps: 140 score: 1070.0 avg score: 7.6429 memorylength: 131072 epsilon: 0.04343456267697689
Training...
episode: 3486 no of steps: 150 score: 561.0 avg score: 3.74 memorylength: 131072 epsilon: 0.04339548916528533
Training...
episode: 3487 no of steps: 141 score: 971.0 avg score: 6.8865 memorylength: 131072 epsilon: 0.043356450803934264
Training...
episode: 3488 no of steps: 155 score: 945.0 avg score: 6.0968 memorylength: 131072 epsilon: 0.04331744756130263
Training...
episode: 3489 no of steps: 148 score: 686.0 avg score: 4.6351 memorylength: 131072 epsilon: 0.043278479405797786
Training...
episode: 3490 no of steps: 140 score: 738.0 avg score: 5.2714 memorylength: 131072 epsilon: 0.04323954630585552
Training...
episode: 3491 no of steps: 133 score: 497.0 avg score: 3.7368 memorylength: 131072 epsilon: 0.04320064822994005
Training...
episode: 3492 no of steps: 131 score: 549.0 avg score: 4.1908 memorylength: 131072 epsilon: 0.04316178514654388
Training...
episode: 3493 no of steps: 143 score: 738.0 avg score: 5.1608 memorylength: 131072 epsilon: 0.04312295702418795
Training...
episode: 3494 no of steps: 152 score: 376.0 avg score: 2.4737 memorylength: 131072 epsilon: 0.04308416383142146
Training...
episode: 3495 no of steps: 143 score: 561.0 avg score: 3.9231 memorylength: 131072 epsilon: 0.04304540553682194
Training...
episode: 3496 no of steps: 158 score: 549.0 avg score: 3.4747 memorylength: 131072 epsilon: 0.04300668210899516
Training...
episode: 3497 no of steps: 151 score: 725.0 avg score: 4.8013 memorylength: 131072 epsilon: 0.042967993516575126
Training...
episode: 3498 no of steps: 153 score: 823.0 avg score: 5.3791 memorylength: 131072 epsilon: 0.04292933972822409
Training...
episode: 3499 no of steps: 156 score: 812.0 avg score: 5.2051 memorylength: 131072 epsilon: 0.0428907207126325
Training...
episode: 3500 no of steps: 180 score: 917.0 avg score: 5.0944 memorylength: 131072 epsilon: 0.042852136438518915
saving states...
Training...
episode: 3501 no of steps: 199 score: 776.0 avg score: 3.8995