Skip to content

Commit 13db41a

Browse files
committed
Feat: Update rl examples
There are bugs on env.state() since the current version of gym are having bugs with these examples. This commit is to solve it
1 parent 30b310a commit 13db41a

File tree

2 files changed

+4
-4
lines changed

2 files changed

+4
-4
lines changed

reinforcement_learning/actor_critic.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -141,7 +141,7 @@ def main():
141141
for i_episode in count(1):
142142

143143
# reset environment and episode reward
144-
state, _ = env.reset()
144+
state = env.reset()
145145
ep_reward = 0
146146

147147
# for each episode, only run 9999 steps so that we don't
@@ -152,7 +152,7 @@ def main():
152152
action = select_action(state)
153153

154154
# take the action
155-
state, reward, done, _, _ = env.step(action)
155+
state, reward, done, _ = env.step(action)
156156

157157
if args.render:
158158
env.render()

reinforcement_learning/reinforce.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -81,11 +81,11 @@ def finish_episode():
8181
def main():
8282
running_reward = 10
8383
for i_episode in count(1):
84-
state, _ = env.reset()
84+
state = env.reset()
8585
ep_reward = 0
8686
for t in range(1, 10000): # Don't infinite loop while learning
8787
action = select_action(state)
88-
state, reward, done, _, _ = env.step(action)
88+
state, reward, done, _ = env.step(action)
8989
if args.render:
9090
env.render()
9191
policy.rewards.append(reward)

0 commit comments

Comments
 (0)