PyPI - plancraft - Versions diffs - 0.3.0__py3-none-any.whl → 0.3.1__py3-none-any.whl - Mend

plancraft 0.3.0__py3-none-any.whl → 0.3.1__py3-none-any.whl

Files changed (13) hide show

plancraft/config.py +1 -10
plancraft/environment/__init__.py +21 -0
plancraft/environment/actions.py +152 -0
plancraft/environment/env.py +3 -1
plancraft/environment/prompts.py +29 -49
plancraft/environment/search.py +28 -1
plancraft/evaluator.py +30 -93
plancraft/models/oracle.py +0 -11
plancraft/utils.py +6 -5
{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/METADATA +11 -7
{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/RECORD +13 -13
{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/WHEEL +0 -0
{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/licenses/LICENSE +0 -0

plancraft/config.py CHANGED Viewed

@@ -1,6 +1,6 @@
 from typing import Literal, Optional, Union
-from pydantic import BaseModel, model_validator
+from pydantic import BaseModel
 from pydantic_settings import BaseSettings, SettingsConfigDict
 from plancraft.environment.recipes import RECIPES
@@ -40,15 +40,6 @@ class PlancraftConfig(BaseModel):
         False  # whether to use multimodal content format
     )
-    @model_validator(mode="after")
-    def validate(self):
-        assert set(
-            self.valid_actions
-        ).issubset(
-            {"move", "smelt", "think", "search", "impossible"}
-        ), "valid_actions should be subset of {'move', 'smelt', 'think', 'search', 'impossible'}"
-        return self
 class WandbConfig(BaseModel):
     project: str

plancraft/environment/__init__.py CHANGED Viewed

@@ -0,0 +1,21 @@
+from .actions import (
+    ImpossibleActionHandler,
+    MoveActionHandler,
+    SmeltActionHandler,
+    ThinkActionHandler,
+    convert_from_slot_index,
+    convert_to_slot_index,
+)
+from .env import PlancraftEnvironment
+from .search import GoldSearchActionHandler
+__all__ = [
+    "ImpossibleActionHandler",
+    "MoveActionHandler",
+    "SmeltActionHandler",
+    "ThinkActionHandler",
+    "PlancraftEnvironment",
+    "GoldSearchActionHandler",
+    "convert_from_slot_index",
+    "convert_to_slot_index",
+]

plancraft/environment/actions.py CHANGED Viewed

@@ -1,3 +1,7 @@
+import abc
+import re
+from typing import Optional
 from pydantic import BaseModel, field_validator, model_validator
@@ -40,6 +44,39 @@ def convert_from_slot_index(slot_index: int) -> str:
         return f"[I{slot_index-9}]"
+class ActionHandlerBase(abc.ABC):
+    @property
+    @abc.abstractmethod
+    def prompt_description(self) -> str:
+        """
+        Return the prompt description for the model
+        """
+        raise NotImplementedError()
+    @property
+    @abc.abstractmethod
+    def prompt_format_example(self) -> str:
+        """
+        Return the prompt format example for the model
+        """
+        raise NotImplementedError()
+    @property
+    @abc.abstractmethod
+    def action_name(self) -> str:
+        """
+        Return the action name for the model
+        """
+        raise NotImplementedError()
+    @abc.abstractmethod
+    def match(self, generated_text: str):
+        """
+        Match the generated text to the action/tool
+        """
+        raise NotImplementedError()
 class MoveAction(BaseModel):
     """ "Moves an item from one slot to another"""
@@ -152,3 +189,118 @@ class StopAction(BaseModel):
 # when symbolic action is true, can either move objects around or smelt
 SymbolicAction = MoveAction | SmeltAction
+class MoveActionHandler(ActionHandlerBase):
+    @property
+    def prompt_description(self) -> str:
+        return "Transfer a specific quantity of an item from one slot to another"
+    @property
+    def prompt_format_example(self) -> str:
+        return "`move: from [Source] to [Target] with quantity N`"
+    @property
+    def action_name(self) -> str:
+        return "move"
+    def match(self, generated_text: str) -> Optional[MoveAction | str]:
+        """
+        Parse the raw model response to a MoveAction
+        """
+        action_match = re.search(f"({self.action_name}):", generated_text)
+        if not action_match:
+            return
+        try:
+            slot_from = re.search(r" from (\[[ABCI]?\d+\])", generated_text).group(1)
+            slot_to = re.search(r" to (\[[ABCI]?\d+\])", generated_text).group(1)
+            quantity = re.search(r"with quantity (\d+)", generated_text).group(1)
+            action = MoveAction(
+                slot_from=slot_from,
+                slot_to=slot_to,
+                quantity=quantity,
+            )
+            return action
+        except AttributeError as e:
+            return f"Format Error: {e}"
+class SmeltActionHandler(ActionHandlerBase):
+    @property
+    def prompt_description(self) -> str:
+        return "Smelt an item in a furnace and moves the output to a specific slot"
+    @property
+    def prompt_format_example(self) -> str:
+        return "`smelt: from [Source] to [Target] with quantity N`"
+    @property
+    def action_name(self) -> str:
+        return "smelt"
+    def match(self, generated_text: str) -> Optional[SmeltAction | str]:
+        """
+        Parse the raw model response to a SmeltAction
+        """
+        action_match = re.search(f"({self.action_name}):", generated_text)
+        if not action_match:
+            return
+        try:
+            slot_from = re.search(r" from (\[[ABCI]?\d+\])", generated_text).group(1)
+            slot_to = re.search(r" to (\[[ABCI]?\d+\])", generated_text).group(1)
+            quantity = re.search(r"with quantity (\d+)", generated_text).group(1)
+            action = SmeltAction(
+                slot_from=slot_from,
+                slot_to=slot_to,
+                quantity=quantity,
+            )
+            return action
+        except AttributeError as e:
+            return f"Format Error: {e}"
+class ImpossibleActionHandler(ActionHandlerBase):
+    @property
+    def prompt_description(self) -> str:
+        return "Stop task if it is certain that it is impossible with given inventory"
+    @property
+    def prompt_format_example(self) -> str:
+        return "`impossible: <reason>`"
+    @property
+    def action_name(self) -> str:
+        return "impossible"
+    def match(self, generated_text) -> Optional[StopAction]:
+        """
+        Parse the raw model response to a StopAction
+        """
+        action_match = re.search(f"({self.action_name}):", generated_text)
+        if not action_match:
+            return
+        reason = re.search(r"impossible: (.*)", generated_text).group(1)
+        return StopAction(reason=reason)
+class ThinkActionHandler(ActionHandlerBase):
+    @property
+    def prompt_description(self) -> str:
+        return "Generate thoughts to help you decide on the next action"
+    @property
+    def prompt_format_example(self) -> str:
+        return "`think: <thought message>`"
+    @property
+    def action_name(self) -> str:
+        return "think"
+    def match(self, generated_text) -> Optional[str]:
+        """
+        Parse the raw model response to a ThinkAction
+        """
+        action_match = re.search(f"({self.action_name}):", generated_text)
+        if not action_match:
+            return
+        return "Ok"

plancraft/environment/env.py CHANGED Viewed

@@ -1,6 +1,5 @@
 import glob
 import os
-from collections import defaultdict
 from typing import Literal, Optional
 import numpy as np
@@ -323,6 +322,9 @@ class PlancraftEnvironment:
         # not enough
         if self.slot_empty(slot_from) or self.state[slot_from]["quantity"] < quantity:
             return
+        # if craft slot - must take all
+        if slot_from == 0 and self.state[slot_from]["quantity"] != quantity:
+            return
         item = self.state[slot_from]

plancraft/environment/prompts.py CHANGED Viewed

@@ -2,31 +2,11 @@ import numpy as np
 from plancraft.environment.env import PlancraftEnvironment
 from plancraft.environment.search import gold_search_recipe
-VALID_ACTIONS = ["move", "smelt", "think", "search", "impossible"]
-ACTIONS_DESCRIPTIONS = {
-    "move": {
-        "description": "Transfer a specific quantity of an item from one slot to another",
-        "format": "`move: from [Source] to [Target] with quantity N`",
-    },
-    "smelt": {
-        "description": "Smelt an item in a furnace and moves the output to a specific slot",
-        "format": "`smelt: from [Source] to [Target] with quantity N`",
-    },
-    "think": {
-        "description": "Generate thoughts to help you decide on the next action",
-        "format": "`think: <thought message>`",
-    },
-    "search": {
-        "description": "Search for a recipe to craft a specific item",
-        "format": "`search: <recipe name>`",
-    },
-    "impossible": {
-        "description": "Stop task if it is certain that it is impossible with given inventory",
-        "format": "`impossible: <reason>`",
-    },
-}
+from plancraft.environment.actions import (
+    ActionHandlerBase,
+    MoveActionHandler,
+    SmeltActionHandler,
+)
 BASE_SYSTEM_PROMPT = """You are crafting in Minecraft. You need to decide on the next action.
@@ -48,23 +28,6 @@ Constraints:
    - If an item is not in slot [0] then the recipe is incorrect
    - You need to move items from [0] to a free inventory slot to complete the crafting process"""
-def get_system_prompt(actions: list[str]):
-    assert set(actions).issubset(VALID_ACTIONS), f"Invalid actions: {actions}"
-    assert "move" in actions, "move should be one of the actions"
-    assert "smelt" in actions, "smelt should be one of the actions"
-    descriptions = ""
-    for action in actions:
-        descriptions += f"\n\t- {action}: {ACTIONS_DESCRIPTIONS[action]['description']}"
-    output_format = ""
-    for action in actions:
-        output_format += f"\n\t- {ACTIONS_DESCRIPTIONS[action]['format']}"
-    return f"{BASE_SYSTEM_PROMPT}\n\nActions:{descriptions}\n\nFormat{output_format}\n\n{BASE_SYSTEM_PROMPT_EXAMPLE}"
 CRAFTING_STEPS = [
     "Craft an item of type: andesite\ninventory:\n - diorite [I18] quantity 1\n - cobblestone [I30] quantity 1",
     "Craft an item of type: andesite\ninventory:\n - diorite [B1] quantity 1\n - cobblestone [I30] quantity 1",
@@ -94,8 +57,26 @@ SEARCH_STEPS = [
 ]
+def get_system_prompt(
+    handlers: list[ActionHandlerBase] = [MoveActionHandler(), SmeltActionHandler()],
+):
+    action_names = [handler.action_name for handler in handlers]
+    assert "move" in action_names, "MoveActionHandler should be one of the handlers"
+    assert "smelt" in action_names, "SmeltActionHandler should be one of the handlers"
+    descriptions = ""
+    for handler in handlers:
+        descriptions += f"\n\t- {handler.action_name}: {handler.prompt_description}"
+    output_format = ""
+    for handler in handlers:
+        output_format += f"\n\t- {handler.prompt_format_example}"
+    return f"{BASE_SYSTEM_PROMPT}\n\nActions:{descriptions}\n\nFormat{output_format}\n\n{BASE_SYSTEM_PROMPT_EXAMPLE}"
 def get_prompt_example(
-    actions: list[str],
+    handlers: list[ActionHandlerBase] = [MoveActionHandler(), SmeltActionHandler()],
     use_text_inventory=True,
     use_multimodal_content_format=False,
     use_images=False,
@@ -103,10 +84,9 @@ def get_prompt_example(
     """
     Generates a few-shot prompt for the crafting task
     """
-    assert set(actions).issubset(VALID_ACTIONS), f"Invalid actions: {actions}"
-    assert "move" in actions, "move should be one of the actions"
-    assert "smelt" in actions, "smelt should be one of the actions"
+    handler_names = [handler.action_name for handler in handlers]
+    assert "move" in handler_names, "move should be one of the actions"
+    assert "smelt" in handler_names, "smelt should be one of the actions"
     if use_images:
         assert (
@@ -120,12 +100,12 @@ def get_prompt_example(
             text = text.split("\ninventory:\n")[0]
         example_dialogue.append({"role": "user", "content": text})
-        if "search" in actions and SEARCH_STEPS[i]:
+        if "search" in handler_names and SEARCH_STEPS[i]:
             example_dialogue.append({"role": "assistant", "content": SEARCH_STEPS[i]})
             search_target = text.split("seach: ")[-1].strip()
             search_response = gold_search_recipe(search_target)
             example_dialogue.append({"role": "user", "content": search_response})
-        if "think" in actions:
+        if "think" in handler_names:
             example_dialogue.append({"role": "assistant", "content": THINK_STEPS[i]})
             example_dialogue.append({"role": "user", "content": "Ok"})
         example_dialogue.append({"role": "assistant", "content": BASE_ACTION_STEPS[i]})

plancraft/environment/search.py CHANGED Viewed

@@ -1,4 +1,7 @@
-from plancraft.environment.actions import convert_from_slot_index
+import re
+from typing import Optional
+from plancraft.environment.actions import convert_from_slot_index, ActionHandlerBase
 from plancraft.environment.recipes import RECIPES
@@ -24,3 +27,27 @@ def gold_search_recipe(recipe_name: str) -> str:
             recipe_instructions = f"smelt {r.ingredient}\n"
         out_string += f"recipe {i+1}:\n{recipe_instructions}"
     return out_string
+class GoldSearchActionHandler(ActionHandlerBase):
+    @property
+    def prompt_description(self) -> str:
+        return "Search for recipes to craft a specific item"
+    @property
+    def prompt_format_example(self) -> str:
+        return "`search: <recipe name>`"
+    @property
+    def action_name(self) -> str:
+        return "search"
+    def match(self, generated_text) -> Optional[str]:
+        """
+        Parse the raw model response to a SearchAction
+        """
+        action_match = re.search(f"({self.action_name}):", generated_text)
+        if not action_match:
+            return
+        search_target = re.search(r"search: (\w+)", generated_text).group(1)
+        return gold_search_recipe(search_target)

plancraft/evaluator.py CHANGED Viewed

@@ -1,7 +1,6 @@
 import json
 import os
 import random
-import re
 import string
 import time
@@ -12,15 +11,19 @@ from tqdm import tqdm
 import wandb
 from plancraft.config import EvalConfig, PlancraftExample
-from plancraft.environment.actions import MoveAction, SmeltAction, StopAction
+from plancraft.environment.actions import (
+    StopAction,
+    ActionHandlerBase,
+    MoveActionHandler,
+    SmeltActionHandler,
+)
 from plancraft.environment.env import (
     PlancraftEnvironment,
     get_objective_str,
     target_and_inventory_to_text_obs,
 )
-from plancraft.environment.search import gold_search_recipe
-from plancraft.models import get_model
 from plancraft.utils import History
+from plancraft.models.base import PlancraftBaseModel
 class Evaluator:
@@ -35,12 +38,18 @@ class Evaluator:
     Finally, it also saves the results of the evaluation and the images generated during the evaluation.
     """
-    def __init__(self, cfg: EvalConfig):
+    def __init__(
+        self,
+        cfg: EvalConfig,
+        run_name: str,
+        model: PlancraftBaseModel,
+        actions: list[ActionHandlerBase] = [MoveActionHandler(), SmeltActionHandler()],
+    ):
         self.cfg = cfg
-        self.output_dir = (
-            f"{cfg.plancraft.output_dir}/{self.evaluator_name()}/{cfg.plancraft.split}"
-        )
+        self.run_name = run_name
+        self.output_dir = f"{cfg.plancraft.output_dir}/{run_name}/{cfg.plancraft.split}"
         self.generation_number = 0
+        self.actions = actions
         # load all examples
         self.examples: list[PlancraftExample] = self.load_dataset(cfg.plancraft.split)
@@ -53,7 +62,7 @@ class Evaluator:
         # initialise history/dialogue tracking
         self.history = History(
-            valid_actions=cfg.plancraft.valid_actions,
+            actions=actions,
             use_multimodal_content_format=cfg.plancraft.use_multimodal_content_format,
             use_images=cfg.plancraft.use_images,
             use_text_inventory=cfg.plancraft.use_text_inventory,
@@ -61,45 +70,7 @@ class Evaluator:
         )
         # load model
-        self.model = get_model(cfg)
-    def evaluator_name(self) -> str:
-        if self.cfg.plancraft.use_text_inventory and self.cfg.plancraft.use_images:
-            name_str = "both"
-        elif self.cfg.plancraft.use_images:
-            name_str = "images"
-        elif self.cfg.plancraft.use_text_inventory:
-            name_str = "text"
-        else:
-            raise ValueError(
-                "At least one of use_text_inventory or use_images should be True"
-            )
-        if self.cfg.plancraft.use_fasterrcnn:
-            name_str += "_fasterrcnn"
-        model_name = self.cfg.plancraft.model.split("/")[-1]
-        if self.cfg.plancraft.adapter != "":
-            model_name = self.cfg.plancraft.adapter.split("/")[-1]
-        mode = self.cfg.plancraft.mode
-        if mode in ["dummy", "oracle"]:
-            return f"{mode}_{name_str}"
-        valid_actions_to_str = {
-            "move": "m",
-            "smelt": "s",
-            "think": "t",
-            "search": "se",
-            "impossible": "i",
-        }
-        actions = "|".join(
-            [
-                valid_actions_to_str[action]
-                for action in self.cfg.plancraft.valid_actions
-            ]
-        )
-        return f"{self.cfg.plancraft.mode}_{name_str}_{model_name}_{actions}"
+        self.model = model
     def save_results_dict(self, example: PlancraftExample, results_dict: dict):
         output_dir = f"{self.output_dir}/{self.generation_number}"
@@ -152,48 +123,17 @@ class Evaluator:
                 return True
         return False
-    def parse_raw_model_response(
-        self, content: str
-    ) -> str | MoveAction | SmeltAction | StopAction:
+    def parse_raw_model_response(self, generated_text: str):
         """
-        Given a message and set of valid actions, parse the content to return the action
+        Given a message and set of action handlers, parse the content to return the action
         or a message if the action is not valid/requires message response
         """
-        action_match = re.search(
-            f"({'|'.join(self.cfg.plancraft.valid_actions)}):", content
-        )
-        if action_match:
-            action = action_match.group(1)
-            if action == "think":
-                return "Ok"
-            elif action == "impossible":
-                reason = re.search(r"impossible: (.*)", content).group(1)
-                return StopAction(reason=reason)
-            elif action == "search":
-                search_target = re.search(r"search: (\w+)", content).group(1)
-                return gold_search_recipe(search_target)
-            else:
-                try:
-                    slot_from = re.search(r" from (\[[ABCI]?\d+\])", content).group(1)
-                    slot_to = re.search(r" to (\[[ABCI]?\d+\])", content).group(1)
-                    quantity = re.search(r"with quantity (\d+)", content).group(1)
-                    if action == "move":
-                        action = MoveAction(
-                            slot_from=slot_from,
-                            slot_to=slot_to,
-                            quantity=quantity,
-                        )
-                    else:
-                        action = SmeltAction(
-                            slot_from=slot_from,
-                            slot_to=slot_to,
-                            quantity=quantity,
-                        )
-                    return action
-                except AttributeError as e:
-                    return f"Format Error: {e}"
-        return f"Only select actions from the following: {', '.join(self.cfg.plancraft.valid_actions)}"
+        for handler in self.actions:
+            match_output = handler.match(generated_text)
+            if match_output:
+                return match_output
+        action_names = [handler.action_name for handler in self.actions]
+        return f"Only select actions from the following: {', '.join(action_names)}"
     def convert_observation_to_message(
         self,
@@ -230,11 +170,8 @@ class Evaluator:
         return {"content": content_list}
     def eval_example(self, example: PlancraftExample) -> dict:
-        """
-        Given the loaded model and an example from Plancraft
-        run the episode until success or termination.
-        Termination can happen from: early stopping (stuck) / max_steps / stop_action
-        """
+        """Given the loaded model and an example from Plancraft
+        run the episode until success or termination."""
         success = False
         num_non_env_actions = 0
         self.reset(example)
@@ -346,7 +283,7 @@ class Evaluator:
             f"Running evaluation over {len(self.examples)} examples {self.cfg.plancraft.num_generations} times."
         )
         run_name = (
-            f"{self.evaluator_name()} {self.cfg.plancraft.split}".replace(" ", "_")
+            f"{self.run_name} {self.cfg.plancraft.split}".replace(" ", "_")
             .replace(".", "_")
             .strip()
         )

plancraft/models/oracle.py CHANGED Viewed

@@ -38,8 +38,6 @@ def find_free_inventory_slot(inventory: dict, from_slot: int) -> int:
         if slot == from_slot:
             continue
         item_type = item["type"]
-        # if item["quantity"] == 0:
-        #     item_type = "air"
         if item_type not in type_to_slot:
             type_to_slot[item_type] = [slot]
         else:
@@ -57,12 +55,6 @@ def find_free_inventory_slot(inventory: dict, from_slot: int) -> int:
                 <= MAX_STACK_SIZE[from_item_type]
             ):
                 return slot
-    # if there is a free slot with air
-    # if "air" in type_to_slot:
-    #     for slot in type_to_slot["air"]:
-    #         if slot > 10:
-    #             return slot
     if len(empty_slots) > 0:
         return empty_slots.pop()
@@ -80,8 +72,6 @@ def get_inventory_counter(inventory: dict) -> Counter:
     for slot, item in inventory.items():
         if slot == 0:
             continue
-        # if item["type"] == "air":
-        #     continue
         counter[item["type"]] += item["quantity"]
     return counter
@@ -170,7 +160,6 @@ class OracleModel(PlancraftBaseModel):
         if isinstance(plan_recipe, ShapelessRecipe):
             crafting_slot = 1
             # add each item to crafting slots
             for item, quantity in items_to_use_counter.items():
                 n = 0

plancraft/utils.py CHANGED Viewed

@@ -7,6 +7,7 @@ import torch
 from loguru import logger
 from plancraft.environment.actions import (
+    ActionHandlerBase,
     MoveAction,
     SmeltAction,
 )
@@ -21,21 +22,21 @@ class History:
     """
     History class to keep track of dialogue, actions, inventory and images
     Args:
-        valid_actions: list of valid actions
+        actions: list of action handlers (ActionHandlerBase instances)
         initial_dialogue: list of dialogue messages
         use_multimodal_content_format: whether to use multimodal content format (list of content with types)
     """
     def __init__(
         self,
-        valid_actions: list[str] = ["move", "smelt"],
+        actions: list[ActionHandlerBase] = [],
         use_multimodal_content_format=False,
         few_shot=False,
         use_images=False,
         use_text_inventory=False,
         resolution="high",
     ):
-        self.valid_actions = valid_actions
+        self.action_handlers = actions
         self.use_multimodal_content_format = use_multimodal_content_format
         self.few_shot = few_shot
         self.use_images = use_images
@@ -58,7 +59,7 @@ class History:
     def system_prompt(self):
         # kept separate from dialogue history because certain models deal with system prompt differently
-        system_prompt_text = get_system_prompt(self.valid_actions)
+        system_prompt_text = get_system_prompt(handlers=self.action_handlers)
         if self.use_multimodal_content_format:
             return {
                 "role": "system",
@@ -75,7 +76,7 @@ class History:
         if self.few_shot:
             self.prompt_examples = get_prompt_example(
-                self.valid_actions,
+                self.action_handlers,
                 use_text_inventory=self.use_text_inventory,
                 use_multimodal_content_format=self.use_multimodal_content_format,
                 use_images=self.use_images,

{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: plancraft
-Version: 0.3.0
+Version: 0.3.1
 Summary: Plancraft: an evaluation dataset for planning with LLM agents
 License: MIT License
@@ -25,7 +25,6 @@ License: MIT License
         SOFTWARE.
 License-File: LICENSE
 Requires-Python: >=3.9
-Requires-Dist: accelerate>=1.1.1
 Requires-Dist: hydra-core>=1.3.2
 Requires-Dist: imageio>=2.36.0
 Requires-Dist: loguru
@@ -65,7 +64,7 @@ Description-Content-Type: text/markdown
 [Paper](https://arxiv.org/abs/2412.21033) | [Website](https://gautierdag.github.io/plancraft/)
-Plancraft is a minecraft environment and agent that innovates on planning LLM agents with a retriever
+Plancraft is a minecraft environment and agent that innovates on planning LLM agents with an oracle RAG retriever.
 You can install the package by running the following command:
@@ -123,8 +122,10 @@ from plancraft.config import EvalConfig
 def main():
     # Create the config
     config = EvalConfig(...)
+    # create model -- Note you can create your own model by subclassing PlancraftBaseModel
+    model = get_model(config)
     # Create the evaluator
-    evaluator = Evaluator(config)
+    evaluator = Evaluator(config, run_name="my_run", model=model)
     # Evaluate the agent
     evaluator.eval_all_seeds()
 ```
@@ -207,7 +208,7 @@ The observation returned by the `Evaluator` class is a dictionary with the follo
 To implement a model, you need to subclass the `PlancraftBaseModel` class and implement the `step` and `reset` method. See the `plancraft.models.dummy` module for an example of how to implement a basic model.
-You will also need to modify the `get_model` function in the `plancraft.models` module to return an instance of your model when the correct config is passed.
+You should then be able to use the `Evaluator` class to evaluate it.
 ## Reproducing the Results tables in the paper
@@ -225,10 +226,13 @@ The image is available on [Docker Hub](https://hub.docker.com/r/gautierdag/planc
 ## To Do
+Non-exhaustive list of things to do from highest to lowest priority:
+- [ ] Add minecraft wiki scrape and non-oracle search for pages
+- [ ] Improve planner to bring it closer to optimal (the oracle planner does not consider future crafting steps when moving items -- see paper for more details)
 - [ ] Rerun image models with better bounding box model
   - [ ] Track bounding box accuracy
-- [ ] Improve planner to bring closer to optimal (the oracle planner does not consider  future crafting steps when moving items -- see paper for more details)
-- [ ] Add minecraft wiki scrape and non-oracle search for pages
+- [ ] Implement a version of the image environment entirely on cuda/pytorch rather than cpu
 ## PRs Welcomed

{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/RECORD RENAMED Viewed

@@ -1,8 +1,8 @@
 plancraft/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-plancraft/config.py,sha256=hsEv_YFk4St0xb6uiT2zuWqgUw4-fZAC1jB_U6DM7HU,4544
-plancraft/evaluator.py,sha256=iPONcYvozqGpJ-Wr2EvtbwMamyiZDhNf3HJCvXBtsBk,16391
+plancraft/config.py,sha256=HNHFDewz_0IF1EiPoS8B_ND5JfQvWjE4-0MbX-xvsRQ,4215
+plancraft/evaluator.py,sha256=0J1Mk-n5Y_7L-WhuH6UpoMWhMnGtdFAGW-aqZDhuhLk,13844
 plancraft/generate_dataset.py,sha256=DlrU-PmvWqSNJD1g1-8Lpb8n3N-Ogw3rje1nrRzjGKs,2382
-plancraft/utils.py,sha256=Fs9ZVaSjKxhSqn9UNNZx-dioB5Oyb7hO5c8QMkmW020,7011
+plancraft/utils.py,sha256=7VWKVlDhoMacRypRRSKM1K3hwwJ0nHR3zyx9jZH1C1g,7042
 plancraft/data/test.json,sha256=7ozxAb-PzoaOMQbMMh52RvN0pQBor6aAUwMrtc2C-y0,1670677
 plancraft/data/test.small.easy.json,sha256=IsrnRUACUWUdq2_BKGw_H2GptstqmFw66y0Grwmrwj8,238854
 plancraft/data/test.small.json,sha256=RnPJJf_wLhdUQydrQo0H4KJvcD5PkSEVy5Bbi--Il2U,342843
@@ -10,15 +10,15 @@ plancraft/data/train.json,sha256=pdArGse10i6Dg5Oa56EJPH_fOmotVzv2q5LPJpmS_bQ,342
 plancraft/data/val.json,sha256=bfVFVQ_dmDSTCLojRkv1XIlct5zkwSg4AzsMp0gUUGI,1654481
 plancraft/data/val.small.easy.json,sha256=vgBotEu-mH8441jUyCN_6DZIRX1O5SpZatdmK-I7yNA,240202
 plancraft/data/val.small.json,sha256=WO7xerSWVOPcnLH1_MBiWwdHmqWP0DDGMhuF2RycBRo,300799
-plancraft/environment/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-plancraft/environment/actions.py,sha256=r2BYSSoGt4GnNLzbWSVR99lfZ5oSkc0ENNBRqSwEzJ0,4829
-plancraft/environment/env.py,sha256=SY4ur1uLUApLmcGtgqDDcuiotFh5Cu8zLofWB6WLAh4,16190
+plancraft/environment/__init__.py,sha256=XFsFny4lH195AwAmL-WeCaF9ZCMgc7IgXIwhQ8FTdgE,505
+plancraft/environment/actions.py,sha256=D9QqBW7yWsbWCjxNyWp61Xtb0c6EtyXk3PZ1I8SRoBQ,9381
+plancraft/environment/env.py,sha256=_VQewLUv8YpKLaNp9uye25lq4HFHd9ddTQr1Lqv4eOs,16290
 plancraft/environment/items.py,sha256=Z9rhSyVDEoHF1pxRvhyiT94tyQJaWHi3wUHVcamz82o,221
 plancraft/environment/planner.py,sha256=eJExz3OxSzurIEdH9LOtMwFH9ApqMQ3CokVhmbV6Px0,3953
-plancraft/environment/prompts.py,sha256=qD7ezj-ASpl5XHGEsZ4UZkt5ubRRFgtXeCAFlRTjCok,7288
+plancraft/environment/prompts.py,sha256=OKxiv02NIhRk5FZJUEDRLkVWVMc-aXKJi7i7X61uUmk,6633
 plancraft/environment/recipes.py,sha256=0vwzOU86eZmGN2EpZVSIvzxpx0AOBWNPxTtAOFBN2A0,19570
 plancraft/environment/sampler.py,sha256=IZT-XjmWSZrs0zDyRTMjYytXxewdwYf5YGGdKsR5ll4,7643
-plancraft/environment/search.py,sha256=PUBrkgy9dgiZY8v1HyxVIxXW7n01xIQbdXXCfNHrYU4,1055
+plancraft/environment/search.py,sha256=uFHpLvW40rMKOxDabcyWrpOrhKLDZqAJOF_jew4_WXk,1837
 plancraft/environment/assets/constants.json,sha256=kyOIOh82CTTMMGEIS60k5k6M-6fkEmYDoGAnvi3Zx5k,1379016
 plancraft/environment/assets/minecraft_font.ttf,sha256=AzoK9cgggXwjFPHtIO7uz-YaDrminl3nvB-VsaTvTAk,60992
 plancraft/environment/assets/table.png,sha256=IKIViZKAPyR4FWnS0JP9AZ19vIEO3qoS5-YRGAO1ow8,5430
@@ -1917,10 +1917,10 @@ plancraft/models/base.py,sha256=uhG1tRmsBerJzW8qHoLyLEYpveDv0co7AAhi4mSfyO4,661
 plancraft/models/bbox_model.py,sha256=3b1IEspoHiVUR6GOWjEbp4YoxRhGkzKt-eOiwaN8NXo,17091
 plancraft/models/dummy.py,sha256=HVuX5Y9CPNDP8Ne4BNTe2qyWdxyhIgvPIIV3OhXxzD8,1062
 plancraft/models/generators.py,sha256=F76_iPiqxUjDIrQwF58tzM0bLM91OkZJ0sBqBuki5wY,13939
-plancraft/models/oracle.py,sha256=WkzupIoetppGzPst5kD0IRe_9VsQSRJzPB6N-_ULa-k,8750
+plancraft/models/oracle.py,sha256=jDCE6zVFvbwFpDzQZTkHIlRwMud1yMJ4LVIdfpt5ddU,8449
 plancraft/models/utils.py,sha256=E-sZohvolWgGbpHQKgAgkgIfUJoVnT5pMt6JP8xLHKg,4034
 plancraft/train/dataset.py,sha256=oFqEd4LG9oEQ-71teh0Wf7-jJbtybT2ZibfM2bBdBkM,5474
-plancraft-0.3.0.dist-info/METADATA,sha256=yPPTvrICB1iLuI3NquneaK6cPUuGH1w4Z8hxv5SGQnM,11119
-plancraft-0.3.0.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-plancraft-0.3.0.dist-info/licenses/LICENSE,sha256=YGR8ehDB4t-T-lOQKMfKNR-2zsOU7E3E5NA8t25HKE0,1070
-plancraft-0.3.0.dist-info/RECORD,,
+plancraft-0.3.1.dist-info/METADATA,sha256=KKsWXHGTbWBXplk1E5F0b_AJvAAu7K91k5sR3eLtKM4,11306
+plancraft-0.3.1.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+plancraft-0.3.1.dist-info/licenses/LICENSE,sha256=YGR8ehDB4t-T-lOQKMfKNR-2zsOU7E3E5NA8t25HKE0,1070
+plancraft-0.3.1.dist-info/RECORD,,

{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/WHEEL RENAMED Viewed

File without changes

{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

plancraft 0.3.0__py3-none-any.whl → 0.3.1__py3-none-any.whl

plancraft 0.3.0__py3-none-any.whl → 0.3.1__py3-none-any.whl