|
|
"""
Copied and adapted from https://github.com/mila-iqia/babyai. Levels described in the Baby AI ICLR 2019 submission, with the `Pick up` instruction. """
from __future__ import annotations
from minigrid.envs.babyai.core.levelgen import LevelGen from minigrid.envs.babyai.core.roomgrid_level import RejectSampling, RoomGridLevel from minigrid.envs.babyai.core.verifier import ObjDesc, PickupInstr
class Pickup(RoomGridLevel): """
## Description
Pick up an object, the object may be in another room.
## Mission Space
"pick up a {color} {type}"
{color} is the color of the box. Can be "red", "green", "blue", "purple", "yellow" or "grey".
{type} is the type of the object. Can be "ball", "box" or "key".
## Action Space
| Num | Name | Action | |-----|--------------|-------------------| | 0 | left | Turn left | | 1 | right | Turn right | | 2 | forward | Move forward | | 3 | pickup | Pick up an object | | 4 | drop | Unused | | 5 | toggle | Unused | | 6 | done | Unused |
## Observation Encoding
- Each tile is encoded as a 3 dimensional tuple: `(OBJECT_IDX, COLOR_IDX, STATE)` - `OBJECT_TO_IDX` and `COLOR_TO_IDX` mapping can be found in [minigrid/minigrid.py](minigrid/minigrid.py) - `STATE` refers to the door state with 0=open, 1=closed and 2=locked
## Rewards
A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.
## Termination
The episode ends if any one of the following conditions is met:
1. The agent picks up the object. 2. Timeout (see `max_steps`).
## Registered Configurations
- `BabyAI-Pickup-v0`
"""
def gen_mission(self): self.place_agent() self.connect_all() objs = self.add_distractors(num_distractors=18, all_unique=False) self.check_objs_reachable() obj = self._rand_elem(objs) self.instrs = PickupInstr(ObjDesc(obj.type, obj.color))
class UnblockPickup(RoomGridLevel): """
## Description
Pick up an object, the object may be in another room. The path may be blocked by one or more obstructors.
## Mission Space
"pick up a/the {color} {type}"
{color} is the color of the box. Can be "red", "green", "blue", "purple", "yellow" or "grey".
{type} is the type of the object. Can be "ball", "box" or "key".
## Action Space
| Num | Name | Action | |-----|--------------|-------------------| | 0 | left | Turn left | | 1 | right | Turn right | | 2 | forward | Move forward | | 3 | pickup | Pick up an object | | 4 | drop | Unused | | 5 | toggle | Unused | | 6 | done | Unused |
## Observation Encoding
- Each tile is encoded as a 3 dimensional tuple: `(OBJECT_IDX, COLOR_IDX, STATE)` - `OBJECT_TO_IDX` and `COLOR_TO_IDX` mapping can be found in [minigrid/minigrid.py](minigrid/minigrid.py) - `STATE` refers to the door state with 0=open, 1=closed and 2=locked
## Rewards
A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.
## Termination
The episode ends if any one of the following conditions is met:
1. The agent picks up the object. 2. Timeout (see `max_steps`).
## Registered Configurations
- `BabyAI-UnblockPickup-v0`
"""
def gen_mission(self): self.place_agent() self.connect_all() objs = self.add_distractors(num_distractors=20, all_unique=False)
# Ensure that at least one object is not reachable without unblocking # Note: the selected object will still be reachable most of the time if self.check_objs_reachable(raise_exc=False): raise RejectSampling("all objects reachable")
obj = self._rand_elem(objs) self.instrs = PickupInstr(ObjDesc(obj.type, obj.color))
class PickupLoc(LevelGen): """
## Description
Pick up an object which may be described using its location. This is a single room environment.
Competencies: PickUp, Loc. No unblocking.
## Mission Space
"pick up the {color} {type}"
{color} is the color of the box. Can be "red", "green", "blue", "purple", "yellow" or "grey".
{type} is the type of the object. Can be "ball", "box" or "key".
## Action Space
| Num | Name | Action | |-----|--------------|-------------------| | 0 | left | Turn left | | 1 | right | Turn right | | 2 | forward | Move forward | | 3 | pickup | Pick up an object | | 4 | drop | Unused | | 5 | toggle | Unused | | 6 | done | Unused |
## Observation Encoding
- Each tile is encoded as a 3 dimensional tuple: `(OBJECT_IDX, COLOR_IDX, STATE)` - `OBJECT_TO_IDX` and `COLOR_TO_IDX` mapping can be found in [minigrid/minigrid.py](minigrid/minigrid.py) - `STATE` refers to the door state with 0=open, 1=closed and 2=locked
## Rewards
A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.
## Termination
The episode ends if any one of the following conditions is met:
1. The agent picks up the object. 2. Timeout (see `max_steps`).
## Registered Configurations
- `BabyAI-PickupLoc-v0`
"""
def __init__(self, **kwargs): # We add many distractors to increase the probability # of ambiguous locations within the same room super().__init__( action_kinds=["pickup"], instr_kinds=["action"], num_rows=1, num_cols=1, num_dists=8, locked_room_prob=0, locations=True, unblocking=False, **kwargs, )
class PickupDist(RoomGridLevel): """
## Description
Pick up an object The object to pick up is given by its type only, or by its color, or by its type and color. (in the current room, with distractors)
## Mission Space
"pick up a/the {color}/{type}/{color}{type}"
{color} is the color of the box. Can be "red", "green", "blue", "purple", "yellow" or "grey".
{type} is the type of the object. Can be "ball", "box" or "key".
## Action Space
| Num | Name | Action | |-----|--------------|-------------------| | 0 | left | Turn left | | 1 | right | Turn right | | 2 | forward | Move forward | | 3 | pickup | Pick up an object | | 4 | drop | Unused | | 5 | toggle | Unused | | 6 | done | Unused |
## Observation Encoding
- Each tile is encoded as a 3 dimensional tuple: `(OBJECT_IDX, COLOR_IDX, STATE)` - `OBJECT_TO_IDX` and `COLOR_TO_IDX` mapping can be found in [minigrid/minigrid.py](minigrid/minigrid.py) - `STATE` refers to the door state with 0=open, 1=closed and 2=locked
## Rewards
A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.
## Termination
The episode ends if any one of the following conditions is met:
1. The agent picks up the object. 2. Timeout (see `max_steps`).
## Registered Configurations
- `BabyAI-PickupDist-v0` - `BabyAI-PickupDistDebug-v0`
"""
def __init__(self, debug=False, **kwargs): self.debug = debug super().__init__(num_rows=1, num_cols=1, room_size=7, **kwargs)
def gen_mission(self): # Add 5 random objects in the room objs = self.add_distractors(num_distractors=5) self.place_agent(0, 0) obj = self._rand_elem(objs) type = obj.type color = obj.color
select_by = self._rand_elem(["type", "color", "both"]) if select_by == "color": type = None elif select_by == "type": color = None
self.instrs = PickupInstr(ObjDesc(type, color), strict=self.debug)
class PickupAbove(RoomGridLevel): """
## Description
Pick up an object (in the room above) This task requires to use the compass to be solved effectively.
## Mission Space
"go to the {color} {type}"
{color} is the color of the box. Can be "red", "green", "blue", "purple", "yellow" or "grey".
{type} is the type of the object. Can be "ball", "box" or "key".
## Action Space
| Num | Name | Action | |-----|--------------|-------------------| | 0 | left | Turn left | | 1 | right | Turn right | | 2 | forward | Move forward | | 3 | pickup | Pick up an object | | 4 | drop | Unused | | 5 | toggle | Unused | | 6 | done | Unused |
## Observation Encoding
- Each tile is encoded as a 3 dimensional tuple: `(OBJECT_IDX, COLOR_IDX, STATE)` - `OBJECT_TO_IDX` and `COLOR_TO_IDX` mapping can be found in [minigrid/minigrid.py](minigrid/minigrid.py) - `STATE` refers to the door state with 0=open, 1=closed and 2=locked
## Rewards
A reward of '1 - 0.9 * (step_count / max_steps)' is given for success, and '0' for failure.
## Termination
The episode ends if any one of the following conditions is met:
1. The agent picks up the object. 2. Timeout (see `max_steps`).
## Registered Configurations
- `BabyAI-PickupAbove-v0`
"""
def __init__(self, max_steps: int | None = None, **kwargs): room_size = 6 if max_steps is None: max_steps = 8 * room_size**2
super().__init__(room_size=room_size, max_steps=max_steps, **kwargs)
def gen_mission(self): # Add a random object to the top-middle room obj, pos = self.add_object(1, 0) # Make sure the two rooms are directly connected self.add_door(1, 1, 3, locked=False) self.place_agent(1, 1) self.connect_all()
self.instrs = PickupInstr(ObjDesc(obj.type, obj.color))
|