Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Patch rewards part in the document and fix GoToObjectEnv #333

Merged
3 commits merged on Mar 14, 2023
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
22 changes: 11 additions & 11 deletions minigrid/envs/babyai/goto.py
Original file line number Diff line number Diff line change
Expand Up @@ -44,7 +44,7 @@ class GoToRedBallGrey(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -110,7 +110,7 @@ class GoToRedBall(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -173,7 +173,7 @@ class GoToRedBallNoDists(GoToRedBall):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -230,7 +230,7 @@ class GoToObj(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -297,7 +297,7 @@ class GoToLocal(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -373,7 +373,7 @@ class GoTo(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -463,7 +463,7 @@ class GoToImpUnlock(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -568,7 +568,7 @@ class GoToSeq(LevelGen):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -636,7 +636,7 @@ class GoToRedBlueBall(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -712,7 +712,7 @@ class GoToDoor(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -780,7 +780,7 @@ class GoToObjDoor(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down
10 changes: 5 additions & 5 deletions minigrid/envs/babyai/open.py
Original file line number Diff line number Diff line change
Expand Up @@ -51,7 +51,7 @@ class Open(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -121,7 +121,7 @@ class OpenRedDoor(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -183,7 +183,7 @@ class OpenDoor(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -267,7 +267,7 @@ class OpenTwoDoors(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -367,7 +367,7 @@ class OpenDoorsOrder(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down
10 changes: 5 additions & 5 deletions minigrid/envs/babyai/other.py
Original file line number Diff line number Diff line change
Expand Up @@ -64,7 +64,7 @@ class ActionObjDoor(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -142,7 +142,7 @@ class FindObjS5(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -211,7 +211,7 @@ class KeyCorridor(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -305,7 +305,7 @@ class OneRoomS8(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -372,7 +372,7 @@ class MoveTwoAcross(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down
10 changes: 5 additions & 5 deletions minigrid/envs/babyai/pickup.py
Original file line number Diff line number Diff line change
Expand Up @@ -47,7 +47,7 @@ class Pickup(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -110,7 +110,7 @@ class UnblockPickup(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -180,7 +180,7 @@ class PickupLoc(LevelGen):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -252,7 +252,7 @@ class PickupDist(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -328,7 +328,7 @@ class PickupAbove(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down
4 changes: 2 additions & 2 deletions minigrid/envs/babyai/putnext.py
Original file line number Diff line number Diff line change
Expand Up @@ -47,7 +47,7 @@ class PutNextLocal(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -119,7 +119,7 @@ class PutNext(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down
12 changes: 6 additions & 6 deletions minigrid/envs/babyai/synth.py
Original file line number Diff line number Diff line change
Expand Up @@ -64,7 +64,7 @@ class Synth(LevelGen):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -152,7 +152,7 @@ class SynthLoc(LevelGen):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -257,7 +257,7 @@ class SynthSeq(LevelGen):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -359,7 +359,7 @@ class MiniBossLevel(LevelGen):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -462,7 +462,7 @@ class BossLevel(LevelGen):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -558,7 +558,7 @@ class BossLevelNoUnlock(LevelGen):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down
12 changes: 6 additions & 6 deletions minigrid/envs/babyai/unlock.py
Original file line number Diff line number Diff line change
Expand Up @@ -48,7 +48,7 @@ class Unlock(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -144,7 +144,7 @@ class UnlockLocal(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -207,7 +207,7 @@ class KeyInBox(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -274,7 +274,7 @@ class UnlockPickup(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -349,7 +349,7 @@ class BlockedUnlockPickup(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down Expand Up @@ -422,7 +422,7 @@ class UnlockToUnlock(RoomGridLevel):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down
2 changes: 1 addition & 1 deletion minigrid/envs/blockedunlockpickup.py
Original file line number Diff line number Diff line change
Expand Up @@ -49,7 +49,7 @@ class BlockedUnlockPickupEnv(RoomGrid):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down
2 changes: 1 addition & 1 deletion minigrid/envs/crossing.py
Original file line number Diff line number Diff line change
Expand Up @@ -54,7 +54,7 @@ class CrossingEnv(MiniGridEnv):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down
2 changes: 1 addition & 1 deletion minigrid/envs/distshift.py
Original file line number Diff line number Diff line change
Expand Up @@ -45,7 +45,7 @@ class DistShiftEnv(MiniGridEnv):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down
2 changes: 1 addition & 1 deletion minigrid/envs/doorkey.py
Original file line number Diff line number Diff line change
Expand Up @@ -42,7 +42,7 @@ class DoorKeyEnv(MiniGridEnv):

## Rewards

- A reward of '1' is given for success, and '0' for failure.
+ A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.

## Termination

Expand Down
Loading