PyPI - plancraft - Versions diffs - 0.3.0__py3-none-any.whl → 0.3.1__py3-none-any.whl - Mend

plancraft 0.3.0__py3-none-any.whl → 0.3.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

plancraft/config.py +1 -10
plancraft/environment/__init__.py +21 -0
plancraft/environment/actions.py +152 -0
plancraft/environment/env.py +3 -1
plancraft/environment/prompts.py +29 -49
plancraft/environment/search.py +28 -1
plancraft/evaluator.py +30 -93
plancraft/models/oracle.py +0 -11
plancraft/utils.py +6 -5
{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/METADATA +11 -7
{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/RECORD +13 -13
{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/WHEEL +0 -0
{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/licenses/LICENSE +0 -0

plancraft/config.py CHANGED Viewed

@@ -1,6 +1,6 @@
 from typing import Literal, Optional, Union
-from pydantic import BaseModel, model_validator
+from pydantic import BaseModel
 from pydantic_settings import BaseSettings, SettingsConfigDict
 from plancraft.environment.recipes import RECIPES
@@ -40,15 +40,6 @@ class PlancraftConfig(BaseModel):
         False  # whether to use multimodal content format
     )
-    @model_validator(mode="after")
-    def validate(self):
-        assert set(
-            self.valid_actions
-        ).issubset(
-            {"move", "smelt", "think", "search", "impossible"}
-        ), "valid_actions should be subset of {'move', 'smelt', 'think', 'search', 'impossible'}"
-        return self
 class WandbConfig(BaseModel):
     project: str

plancraft/environment/__init__.py CHANGED Viewed

@@ -0,0 +1,21 @@
+from .actions import (
+    ImpossibleActionHandler,
+    MoveActionHandler,
+    SmeltActionHandler,
+    ThinkActionHandler,
+    convert_from_slot_index,
+    convert_to_slot_index,
+)
+from .env import PlancraftEnvironment
+from .search import GoldSearchActionHandler
+__all__ = [
+    "ImpossibleActionHandler",
+    "MoveActionHandler",
+    "SmeltActionHandler",
+    "ThinkActionHandler",
+    "PlancraftEnvironment",
+    "GoldSearchActionHandler",
+    "convert_from_slot_index",
+    "convert_to_slot_index",
+]

plancraft/environment/actions.py CHANGED Viewed

@@ -1,3 +1,7 @@
+import abc
+import re
+from typing import Optional
 from pydantic import BaseModel, field_validator, model_validator
@@ -40,6 +44,39 @@ def convert_from_slot_index(slot_index: int) -> str:
         return f"[I{slot_index-9}]"
+class ActionHandlerBase(abc.ABC):
+    @property
+    @abc.abstractmethod
+    def prompt_description(self) -> str:
+        """
+        Return the prompt description for the model
+        """
+        raise NotImplementedError()
+    @property
+    @abc.abstractmethod
+    def prompt_format_example(self) -> str:
+        """
+        Return the prompt format example for the model
+        """
+        raise NotImplementedError()
+    @property
+    @abc.abstractmethod
+    def action_name(self) -> str:
+        """
+        Return the action name for the model
+        """
+        raise NotImplementedError()
+    @abc.abstractmethod
+    def match(self, generated_text: str):
+        """
+        Match the generated text to the action/tool
+        """
+        raise NotImplementedError()
 class MoveAction(BaseModel):
     """ "Moves an item from one slot to another"""
@@ -152,3 +189,118 @@ class StopAction(BaseModel):
 # when symbolic action is true, can either move objects around or smelt
 SymbolicAction = MoveAction | SmeltAction
+class MoveActionHandler(ActionHandlerBase):
+    @property
+    def prompt_description(self) -> str:
+        return "Transfer a specific quantity of an item from one slot to another"
+    @property
+    def prompt_format_example(self) -> str:
+        return "`move: from [Source] to [Target] with quantity N`"
+    @property
+    def action_name(self) -> str:
+        return "move"
+    def match(self, generated_text: str) -> Optional[MoveAction | str]:
+        """
+        Parse the raw model response to a MoveAction
+        """
+        action_match = re.search(f"({self.action_name}):", generated_text)
+        if not action_match:
+            return
+        try:
+            slot_from = re.search(r" from (\[[ABCI]?\d+\])", generated_text).group(1)
+            slot_to = re.search(r" to (\[[ABCI]?\d+\])", generated_text).group(1)
+            quantity = re.search(r"with quantity (\d+)", generated_text).group(1)
+            action = MoveAction(
+                slot_from=slot_from,
+                slot_to=slot_to,
+                quantity=quantity,
+            )
+            return action
+        except AttributeError as e:
+            return f"Format Error: {e}"
+class SmeltActionHandler(ActionHandlerBase):
+    @property
+    def prompt_description(self) -> str:
+        return "Smelt an item in a furnace and moves the output to a specific slot"
+    @property
+    def prompt_format_example(self) -> str:
+        return "`smelt: from [Source] to [Target] with quantity N`"
+    @property
+    def action_name(self) -> str:
+        return "smelt"
+    def match(self, generated_text: str) -> Optional[SmeltAction | str]:
+        """
+        Parse the raw model response to a SmeltAction
+        """
+        action_match = re.search(f"({self.action_name}):", generated_text)
+        if not action_match:
+            return
+        try:
+            slot_from = re.search(r" from (\[[ABCI]?\d+\])", generated_text).group(1)
+            slot_to = re.search(r" to (\[[ABCI]?\d+\])", generated_text).group(1)
+            quantity = re.search(r"with quantity (\d+)", generated_text).group(1)
+            action = SmeltAction(
+                slot_from=slot_from,
+                slot_to=slot_to,
+                quantity=quantity,
+            )
+            return action
+        except AttributeError as e:
+            return f"Format Error: {e}"
+class ImpossibleActionHandler(ActionHandlerBase):
+    @property
+    def prompt_description(self) -> str:
+        return "Stop task if it is certain that it is impossible with given inventory"
+    @property
+    def prompt_format_example(self) -> str:
+        return "`impossible: <reason>`"
+    @property
+    def action_name(self) -> str:
+        return "impossible"
+    def match(self, generated_text) -> Optional[StopAction]:
+        """
+        Parse the raw model response to a StopAction
+        """
+        action_match = re.search(f"({self.action_name}):", generated_text)
+        if not action_match:
+            return
+        reason = re.search(r"impossible: (.*)", generated_text).group(1)
+        return StopAction(reason=reason)
+class ThinkActionHandler(ActionHandlerBase):
+    @property
+    def prompt_description(self) -> str:
+        return "Generate thoughts to help you decide on the next action"
+    @property
+    def prompt_format_example(self) -> str:
+        return "`think: <thought message>`"
+    @property
+    def action_name(self) -> str:
+        return "think"
+    def match(self, generated_text) -> Optional[str]:
+        """
+        Parse the raw model response to a ThinkAction
+        """
+        action_match = re.search(f"({self.action_name}):", generated_text)
+        if not action_match:
+            return
+        return "Ok"

plancraft/environment/env.py CHANGED Viewed

@@ -1,6 +1,5 @@
 import glob
 import os
-from collections import defaultdict
 from typing import Literal, Optional
 import numpy as np
@@ -323,6 +322,9 @@ class PlancraftEnvironment:
         # not enough
         if self.slot_empty(slot_from) or self.state[slot_from]["quantity"] < quantity:
             return
+        # if craft slot - must take all
+        if slot_from == 0 and self.state[slot_from]["quantity"] != quantity:
+            return
         item = self.state[slot_from]

plancraft/environment/prompts.py CHANGED Viewed

@@ -2,31 +2,11 @@ import numpy as np
 from plancraft.environment.env import PlancraftEnvironment
 from plancraft.environment.search import gold_search_recipe
-VALID_ACTIONS = ["move", "smelt", "think", "search", "impossible"]
-ACTIONS_DESCRIPTIONS = {
-    "move": {
-        "description": "Transfer a specific quantity of an item from one slot to another",
-        "format": "`move: from [Source] to [Target] with quantity N`",
-    },
-    "smelt": {
-        "description": "Smelt an item in a furnace and moves the output to a specific slot",
-        "format": "`smelt: from [Source] to [Target] with quantity N`",
-    },
-    "think": {
-        "description": "Generate thoughts to help you decide on the next action",
-        "format": "`think: <thought message>`",
-    },
-    "search": {
-        "description": "Search for a recipe to craft a specific item",
-        "format": "`search: <recipe name>`",
-    },
-    "impossible": {
-        "description": "Stop task if it is certain that it is impossible with given inventory",
-        "format": "`impossible: <reason>`",
-    },
-}
+from plancraft.environment.actions import (
+    ActionHandlerBase,
+    MoveActionHandler,
+    SmeltActionHandler,
+)
 BASE_SYSTEM_PROMPT = """You are crafting in Minecraft. You need to decide on the next action.
@@ -48,23 +28,6 @@ Constraints:
    - If an item is not in slot [0] then the recipe is incorrect
    - You need to move items from [0] to a free inventory slot to complete the crafting process"""
-def get_system_prompt(actions: list[str]):
-    assert set(actions).issubset(VALID_ACTIONS), f"Invalid actions: {actions}"
-    assert "move" in actions, "move should be one of the actions"
-    assert "smelt" in actions, "smelt should be one of the actions"
-    descriptions = ""
-    for action in actions:
-        descriptions += f"\n\t- {action}: {ACTIONS_DESCRIPTIONS[action]['description']}"
-    output_format = ""
-    for action in actions:
-        output_format += f"\n\t- {ACTIONS_DESCRIPTIONS[action]['format']}"
-    return f"{BASE_SYSTEM_PROMPT}\n\nActions:{descriptions}\n\nFormat{output_format}\n\n{BASE_SYSTEM_PROMPT_EXAMPLE}"
 CRAFTING_STEPS = [
     "Craft an item of type: andesite\ninventory:\n - diorite [I18] quantity 1\n - cobblestone [I30] quantity 1",
     "Craft an item of type: andesite\ninventory:\n - diorite [B1] quantity 1\n - cobblestone [I30] quantity 1",
@@ -94,8 +57,26 @@ SEARCH_STEPS = [
 ]
+def get_system_prompt(
+    handlers: list[ActionHandlerBase] = [MoveActionHandler(), SmeltActionHandler()],
+):
+    action_names = [handler.action_name for handler in handlers]
+    assert "move" in action_names, "MoveActionHandler should be one of the handlers"
+    assert "smelt" in action_names, "SmeltActionHandler should be one of the handlers"
+    descriptions = ""
+    for handler in handlers:
+        descriptions += f"\n\t- {handler.action_name}: {handler.prompt_description}"
+    output_format = ""
+    for handler in handlers:
+        output_format += f"\n\t- {handler.prompt_format_example}"
+    return f"{BASE_SYSTEM_PROMPT}\n\nActions:{descriptions}\n\nFormat{output_format}\n\n{BASE_SYSTEM_PROMPT_EXAMPLE}"
 def get_prompt_example(
-    actions: list[str],
+    handlers: list[ActionHandlerBase] = [MoveActionHandler(), SmeltActionHandler()],
     use_text_inventory=True,
     use_multimodal_content_format=False,
     use_images=False,
@@ -103,10 +84,9 @@ def get_prompt_example(
     """
     Generates a few-shot prompt for the crafting task
     """
-    assert set(actions).issubset(VALID_ACTIONS), f"Invalid actions: {actions}"
-    assert "move" in actions, "move should be one of the actions"
-    assert "smelt" in actions, "smelt should be one of the actions"
+    handler_names = [handler.action_name for handler in handlers]
+    assert "move" in handler_names, "move should be one of the actions"
+    assert "smelt" in handler_names, "smelt should be one of the actions"
     if use_images:
         assert (
@@ -120,12 +100,12 @@ def get_prompt_example(
             text = text.split("\ninventory:\n")[0]
         example_dialogue.append({"role": "user", "content": text})
-        if "search" in actions and SEARCH_STEPS[i]:
+        if "search" in handler_names and SEARCH_STEPS[i]:
             example_dialogue.append({"role": "assistant", "content": SEARCH_STEPS[i]})
             search_target = text.split("seach: ")[-1].strip()
             search_response = gold_search_recipe(search_target)
             example_dialogue.append({"role": "user", "content": search_response})
-        if "think" in actions:
+        if "think" in handler_names:
             example_dialogue.append({"role": "assistant", "content": THINK_STEPS[i]})
             example_dialogue.append({"role": "user", "content": "Ok"})
         example_dialogue.append({"role": "assistant", "content": BASE_ACTION_STEPS[i]})

plancraft/environment/search.py CHANGED Viewed

@@ -1,4 +1,7 @@
-from plancraft.environment.actions import convert_from_slot_index
+import re
+from typing import Optional
+from plancraft.environment.actions import convert_from_slot_index, ActionHandlerBase
 from plancraft.environment.recipes import RECIPES
@@ -24,3 +27,27 @@ def gold_search_recipe(recipe_name: str) -> str:
             recipe_instructions = f"smelt {r.ingredient}\n"
         out_string += f"recipe {i+1}:\n{recipe_instructions}"
     return out_string
+class GoldSearchActionHandler(ActionHandlerBase):
+    @property
+    def prompt_description(self) -> str:
+        return "Search for recipes to craft a specific item"
+    @property
+    def prompt_format_example(self) -> str:
+        return "`search: <recipe name>`"
+    @property
+    def action_name(self) -> str:
+        return "search"
+    def match(self, generated_text) -> Optional[str]:
+        """
+        Parse the raw model response to a SearchAction
+        """
+        action_match = re.search(f"({self.action_name}):", generated_text)
+        if not action_match:
+            return
+        search_target = re.search(r"search: (\w+)", generated_text).group(1)
+        return gold_search_recipe(search_target)

plancraft/evaluator.py CHANGED Viewed

@@ -1,7 +1,6 @@
 import json
 import os
 import random
-import re
 import string
 import time
@@ -12,15 +11,19 @@ from tqdm import tqdm
 import wandb
 from plancraft.config import EvalConfig, PlancraftExample
-from plancraft.environment.actions import MoveAction, SmeltAction, StopAction
+from plancraft.environment.actions import (
+    StopAction,
+    ActionHandlerBase,
+    MoveActionHandler,
+    SmeltActionHandler,
+)
 from plancraft.environment.env import (
     PlancraftEnvironment,
     get_objective_str,
     target_and_inventory_to_text_obs,
 )
-from plancraft.environment.search import gold_search_recipe
-from plancraft.models import get_model
 from plancraft.utils import History
+from plancraft.models.base import PlancraftBaseModel
 class Evaluator:
@@ -35,12 +38,18 @@ class Evaluator:
     Finally, it also saves the results of the evaluation and the images generated during the evaluation.
     """
-    def __init__(self, cfg: EvalConfig):
+    def __init__(
+        self,
+        cfg: EvalConfig,
+        run_name: str,
+        model: PlancraftBaseModel,
+        actions: list[ActionHandlerBase] = [MoveActionHandler(), SmeltActionHandler()],
+    ):
         self.cfg = cfg
-        self.output_dir = (
-            f"{cfg.plancraft.output_dir}/{self.evaluator_name()}/{cfg.plancraft.split}"
-        )
+        self.run_name = run_name
+        self.output_dir = f"{cfg.plancraft.output_dir}/{run_name}/{cfg.plancraft.split}"
         self.generation_number = 0
+        self.actions = actions
         # load all examples
         self.examples: list[PlancraftExample] = self.load_dataset(cfg.plancraft.split)
@@ -53,7 +62,7 @@ class Evaluator:
         # initialise history/dialogue tracking
         self.history = History(
-            valid_actions=cfg.plancraft.valid_actions,
+            actions=actions,
             use_multimodal_content_format=cfg.plancraft.use_multimodal_content_format,
             use_images=cfg.plancraft.use_images,
             use_text_inventory=cfg.plancraft.use_text_inventory,
@@ -61,45 +70,7 @@ class Evaluator:
         )
         # load model
-        self.model = get_model(cfg)
-    def evaluator_name(self) -> str:
-        if self.cfg.plancraft.use_text_inventory and self.cfg.plancraft.use_images:
-            name_str = "both"
-        elif self.cfg.plancraft.use_images:
-            name_str = "images"
-        elif self.cfg.plancraft.use_text_inventory:
-            name_str = "text"
-        else:
-            raise ValueError(
-                "At least one of use_text_inventory or use_images should be True"
-            )
-        if self.cfg.plancraft.use_fasterrcnn:
-            name_str += "_fasterrcnn"
-        model_name = self.cfg.plancraft.model.split("/")[-1]
-        if self.cfg.plancraft.adapter != "":
-            model_name = self.cfg.plancraft.adapter.split("/")[-1]
-        mode = self.cfg.plancraft.mode
-        if mode in ["dummy", "oracle"]:
-            return f"{mode}_{name_str}"
-        valid_actions_to_str = {
-            "move": "m",
-            "smelt": "s",
-            "think": "t",
-            "search": "se",
-            "impossible": "i",
-        }
-        actions = "|".join(
-            [
-                valid_actions_to_str[action]
-                for action in self.cfg.plancraft.valid_actions
-            ]
-        )
-        return f"{self.cfg.plancraft.mode}_{name_str}_{model_name}_{actions}"
+        self.model = model
     def save_results_dict(self, example: PlancraftExample, results_dict: dict):
         output_dir = f"{self.output_dir}/{self.generation_number}"
@@ -152,48 +123,17 @@ class Evaluator:
                 return True
         return False
-    def parse_raw_model_response(
-        self, content: str
-    ) -> str | MoveAction | SmeltAction | StopAction:
+    def parse_raw_model_response(self, generated_text: str):
         """
-        Given a message and set of valid actions, parse the content to return the action
+        Given a message and set of action handlers, parse the content to return the action
         or a message if the action is not valid/requires message response
         """
-        action_match = re.search(
-            f"({'|'.join(self.cfg.plancraft.valid_actions)}):", content
-        )
-        if action_match:
-            action = action_match.group(1)
-            if action == "think":
-                return "Ok"
-            elif action == "impossible":
-                reason = re.search(r"impossible: (.*)", content).group(1)
-                return StopAction(reason=reason)
-            elif action == "search":
-                search_target = re.search(r"search: (\w+)", content).group(1)
-                return gold_search_recipe(search_target)
-            else:
-                try:
-                    slot_from = re.search(r" from (\[[ABCI]?\d+\])", content).group(1)
-                    slot_to = re.search(r" to (\[[ABCI]?\d+\])", content).group(1)
-                    quantity = re.search(r"with quantity (\d+)", content).group(1)
-                    if action == "move":
-                        action = MoveAction(
-                            slot_from=slot_from,
-                            slot_to=slot_to,
-                            quantity=quantity,
-                        )
-                    else:
-                        action = SmeltAction(
-                            slot_from=slot_from,
-                            slot_to=slot_to,
-                            quantity=quantity,
-                        )
-                    return action
-                except AttributeError as e:
-                    return f"Format Error: {e}"
-        return f"Only select actions from the following: {', '.join(self.cfg.plancraft.valid_actions)}"
+        for handler in self.actions:
+            match_output = handler.match(generated_text)
+            if match_output:
+                return match_output
+        action_names = [handler.action_name for handler in self.actions]
+        return f"Only select actions from the following: {', '.join(action_names)}"
     def convert_observation_to_message(
         self,
@@ -230,11 +170,8 @@ class Evaluator:
         return {"content": content_list}
     def eval_example(self, example: PlancraftExample) -> dict:
-        """
-        Given the loaded model and an example from Plancraft
-        run the episode until success or termination.
-        Termination can happen from: early stopping (stuck) / max_steps / stop_action
-        """
+        """Given the loaded model and an example from Plancraft
+        run the episode until success or termination."""
         success = False
         num_non_env_actions = 0
         self.reset(example)
@@ -346,7 +283,7 @@ class Evaluator:
             f"Running evaluation over {len(self.examples)} examples {self.cfg.plancraft.num_generations} times."
         )
         run_name = (
-            f"{self.evaluator_name()} {self.cfg.plancraft.split}".replace(" ", "_")
+            f"{self.run_name} {self.cfg.plancraft.split}".replace(" ", "_")
             .replace(".", "_")
             .strip()
         )

plancraft/models/oracle.py CHANGED Viewed

@@ -38,8 +38,6 @@ def find_free_inventory_slot(inventory: dict, from_slot: int) -> int:
         if slot == from_slot:
             continue
         item_type = item["type"]
-        # if item["quantity"] == 0:
-        #     item_type = "air"
         if item_type not in type_to_slot:
             type_to_slot[item_type] = [slot]
         else:
@@ -57,12 +55,6 @@ def find_free_inventory_slot(inventory: dict, from_slot: int) -> int:
                 <= MAX_STACK_SIZE[from_item_type]
             ):
                 return slot
-    # if there is a free slot with air
-    # if "air" in type_to_slot:
-    #     for slot in type_to_slot["air"]:
-    #         if slot > 10:
-    #             return slot
     if len(empty_slots) > 0:
         return empty_slots.pop()
@@ -80,8 +72,6 @@ def get_inventory_counter(inventory: dict) -> Counter:
     for slot, item in inventory.items():
         if slot == 0:
             continue
-        # if item["type"] == "air":
-        #     continue
         counter[item["type"]] += item["quantity"]
     return counter
@@ -170,7 +160,6 @@ class OracleModel(PlancraftBaseModel):
         if isinstance(plan_recipe, ShapelessRecipe):
             crafting_slot = 1
             # add each item to crafting slots
             for item, quantity in items_to_use_counter.items():
                 n = 0

plancraft/utils.py CHANGED Viewed

@@ -7,6 +7,7 @@ import torch
 from loguru import logger
 from plancraft.environment.actions import (
+    ActionHandlerBase,
     MoveAction,
     SmeltAction,
 )
@@ -21,21 +22,21 @@ class History:
     """
     History class to keep track of dialogue, actions, inventory and images
     Args:
-        valid_actions: list of valid actions
+        valid_actions: list of valid actions names
         initial_dialogue: list of dialogue messages
         use_multimodal_content_format: whether to use multimodal content format (list of content with types)
     """
     def __init__(
         self,
-        valid_actions: list[str] = ["move", "smelt"],
+        actions: list[ActionHandlerBase] = [],
         use_multimodal_content_format=False,
         few_shot=False,
         use_images=False,
         use_text_inventory=False,
         resolution="high",
     ):
-        self.valid_actions = valid_actions
+        self.action_handlers = actions
         self.use_multimodal_content_format = use_multimodal_content_format
         self.few_shot = few_shot
         self.use_images = use_images
@@ -58,7 +59,7 @@ class History:
     def system_prompt(self):
         # kept separate from dialogue history because certain models deal with system prompt differently
-        system_prompt_text = get_system_prompt(self.valid_actions)
+        system_prompt_text = get_system_prompt(handlers=self.action_handlers)
         if self.use_multimodal_content_format:
             return {
                 "role": "system",
@@ -75,7 +76,7 @@ class History:
         if self.few_shot:
             self.prompt_examples = get_prompt_example(
-                self.valid_actions,
+                self.action_handlers,
                 use_text_inventory=self.use_text_inventory,
                 use_multimodal_content_format=self.use_multimodal_content_format,
                 use_images=self.use_images,

{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: plancraft
-Version: 0.3.0
+Version: 0.3.1
 Summary: Plancraft: an evaluation dataset for planning with LLM agents
 License: MIT License
@@ -25,7 +25,6 @@ License: MIT License
         SOFTWARE.
 License-File: LICENSE
 Requires-Python: >=3.9
-Requires-Dist: accelerate>=1.1.1
 Requires-Dist: hydra-core>=1.3.2
 Requires-Dist: imageio>=2.36.0
 Requires-Dist: loguru
@@ -65,7 +64,7 @@ Description-Content-Type: text/markdown
 [Paper](https://arxiv.org/abs/2412.21033) | [Website](https://gautierdag.github.io/plancraft/)
-Plancraft is a minecraft environment and agent that innovates on planning LLM agents with a retriever
+Plancraft is a minecraft environment and agent that innovates on planning LLM agents with an oracle RAG retriever.
 You can install the package by running the following command:
@@ -123,8 +122,10 @@ from plancraft.config import EvalConfig
 def main():
     # Create the config
     config = EvalConfig(...)
+    # create model -- Note you can create your own model by subclassing PlancraftBaseModel
+    model = get_model(config)
     # Create the evaluator
-    evaluator = Evaluator(config)
+    evaluator = Evaluator(config, model=model)
     # Evaluate the agent
     evaluator.eval_all_seeds()
 ```
@@ -207,7 +208,7 @@ The observation returned by the `Evaluator` class is a dictionary with the follo
 To implement a model, you need to subclass the `PlancraftBaseModel` class and implement the `step` and `reset` method. See the `plancraft.models.dummy` module for an example of how to implement a basic model.
-You will also need to modify the `get_model` function in the `plancraft.models` module to return an instance of your model when the correct config is passed.
+You should then be able to use the `Evaluator` class to evaluate it.
 ## Reproducing the Results tables in the paper
@@ -225,10 +226,13 @@ The image is available on [Docker Hub](https://hub.docker.com/r/gautierdag/planc
 ## To Do
+Non-exhaustive list of things to do from highest to lowest priority:
+- [ ] Add minecraft wiki scrape and non-oracle search for pages
+- [ ] Improve planner to bring closer to optimal (the oracle planner does not consider  future crafting steps when moving items -- see paper for more details)
 - [ ] Rerun image models with better bounding box model
   - [ ] Track bounding box accuracy
-- [ ] Improve planner to bring closer to optimal (the oracle planner does not consider  future crafting steps when moving items -- see paper for more details)
-- [ ] Add minecraft wiki scrape and non-oracle search for pages
+- [ ] Implement a version of the image environment entirely on cuda/pytorch rather than cpu
 ## PRs Welcomed

{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/RECORD RENAMED Viewed

@@ -1,8 +1,8 @@
 plancraft/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-plancraft/config.py,sha256=hsEv_YFk4St0xb6uiT2zuWqgUw4-fZAC1jB_U6DM7HU,4544
-plancraft/evaluator.py,sha256=iPONcYvozqGpJ-Wr2EvtbwMamyiZDhNf3HJCvXBtsBk,16391
+plancraft/config.py,sha256=HNHFDewz_0IF1EiPoS8B_ND5JfQvWjE4-0MbX-xvsRQ,4215
+plancraft/evaluator.py,sha256=0J1Mk-n5Y_7L-WhuH6UpoMWhMnGtdFAGW-aqZDhuhLk,13844
 plancraft/generate_dataset.py,sha256=DlrU-PmvWqSNJD1g1-8Lpb8n3N-Ogw3rje1nrRzjGKs,2382
-plancraft/utils.py,sha256=Fs9ZVaSjKxhSqn9UNNZx-dioB5Oyb7hO5c8QMkmW020,7011
+plancraft/utils.py,sha256=7VWKVlDhoMacRypRRSKM1K3hwwJ0nHR3zyx9jZH1C1g,7042
 plancraft/data/test.json,sha256=7ozxAb-PzoaOMQbMMh52RvN0pQBor6aAUwMrtc2C-y0,1670677
 plancraft/data/test.small.easy.json,sha256=IsrnRUACUWUdq2_BKGw_H2GptstqmFw66y0Grwmrwj8,238854
 plancraft/data/test.small.json,sha256=RnPJJf_wLhdUQydrQo0H4KJvcD5PkSEVy5Bbi--Il2U,342843
@@ -10,15 +10,15 @@ plancraft/data/train.json,sha256=pdArGse10i6Dg5Oa56EJPH_fOmotVzv2q5LPJpmS_bQ,342
 plancraft/data/val.json,sha256=bfVFVQ_dmDSTCLojRkv1XIlct5zkwSg4AzsMp0gUUGI,1654481
 plancraft/data/val.small.easy.json,sha256=vgBotEu-mH8441jUyCN_6DZIRX1O5SpZatdmK-I7yNA,240202
 plancraft/data/val.small.json,sha256=WO7xerSWVOPcnLH1_MBiWwdHmqWP0DDGMhuF2RycBRo,300799
-plancraft/environment/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-plancraft/environment/actions.py,sha256=r2BYSSoGt4GnNLzbWSVR99lfZ5oSkc0ENNBRqSwEzJ0,4829
-plancraft/environment/env.py,sha256=SY4ur1uLUApLmcGtgqDDcuiotFh5Cu8zLofWB6WLAh4,16190
+plancraft/environment/__init__.py,sha256=XFsFny4lH195AwAmL-WeCaF9ZCMgc7IgXIwhQ8FTdgE,505
+plancraft/environment/actions.py,sha256=D9QqBW7yWsbWCjxNyWp61Xtb0c6EtyXk3PZ1I8SRoBQ,9381
+plancraft/environment/env.py,sha256=_VQewLUv8YpKLaNp9uye25lq4HFHd9ddTQr1Lqv4eOs,16290
 plancraft/environment/items.py,sha256=Z9rhSyVDEoHF1pxRvhyiT94tyQJaWHi3wUHVcamz82o,221
 plancraft/environment/planner.py,sha256=eJExz3OxSzurIEdH9LOtMwFH9ApqMQ3CokVhmbV6Px0,3953
-plancraft/environment/prompts.py,sha256=qD7ezj-ASpl5XHGEsZ4UZkt5ubRRFgtXeCAFlRTjCok,7288
+plancraft/environment/prompts.py,sha256=OKxiv02NIhRk5FZJUEDRLkVWVMc-aXKJi7i7X61uUmk,6633
 plancraft/environment/recipes.py,sha256=0vwzOU86eZmGN2EpZVSIvzxpx0AOBWNPxTtAOFBN2A0,19570
 plancraft/environment/sampler.py,sha256=IZT-XjmWSZrs0zDyRTMjYytXxewdwYf5YGGdKsR5ll4,7643
-plancraft/environment/search.py,sha256=PUBrkgy9dgiZY8v1HyxVIxXW7n01xIQbdXXCfNHrYU4,1055
+plancraft/environment/search.py,sha256=uFHpLvW40rMKOxDabcyWrpOrhKLDZqAJOF_jew4_WXk,1837
 plancraft/environment/assets/constants.json,sha256=kyOIOh82CTTMMGEIS60k5k6M-6fkEmYDoGAnvi3Zx5k,1379016
 plancraft/environment/assets/minecraft_font.ttf,sha256=AzoK9cgggXwjFPHtIO7uz-YaDrminl3nvB-VsaTvTAk,60992
 plancraft/environment/assets/table.png,sha256=IKIViZKAPyR4FWnS0JP9AZ19vIEO3qoS5-YRGAO1ow8,5430
@@ -1917,10 +1917,10 @@ plancraft/models/base.py,sha256=uhG1tRmsBerJzW8qHoLyLEYpveDv0co7AAhi4mSfyO4,661
 plancraft/models/bbox_model.py,sha256=3b1IEspoHiVUR6GOWjEbp4YoxRhGkzKt-eOiwaN8NXo,17091
 plancraft/models/dummy.py,sha256=HVuX5Y9CPNDP8Ne4BNTe2qyWdxyhIgvPIIV3OhXxzD8,1062
 plancraft/models/generators.py,sha256=F76_iPiqxUjDIrQwF58tzM0bLM91OkZJ0sBqBuki5wY,13939
-plancraft/models/oracle.py,sha256=WkzupIoetppGzPst5kD0IRe_9VsQSRJzPB6N-_ULa-k,8750
+plancraft/models/oracle.py,sha256=jDCE6zVFvbwFpDzQZTkHIlRwMud1yMJ4LVIdfpt5ddU,8449
 plancraft/models/utils.py,sha256=E-sZohvolWgGbpHQKgAgkgIfUJoVnT5pMt6JP8xLHKg,4034
 plancraft/train/dataset.py,sha256=oFqEd4LG9oEQ-71teh0Wf7-jJbtybT2ZibfM2bBdBkM,5474
-plancraft-0.3.0.dist-info/METADATA,sha256=yPPTvrICB1iLuI3NquneaK6cPUuGH1w4Z8hxv5SGQnM,11119
-plancraft-0.3.0.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
-plancraft-0.3.0.dist-info/licenses/LICENSE,sha256=YGR8ehDB4t-T-lOQKMfKNR-2zsOU7E3E5NA8t25HKE0,1070
-plancraft-0.3.0.dist-info/RECORD,,
+plancraft-0.3.1.dist-info/METADATA,sha256=KKsWXHGTbWBXplk1E5F0b_AJvAAu7K91k5sR3eLtKM4,11306
+plancraft-0.3.1.dist-info/WHEEL,sha256=qtCwoSJWgHk21S1Kb4ihdzI2rlJ1ZKaIurTj_ngOhyQ,87
+plancraft-0.3.1.dist-info/licenses/LICENSE,sha256=YGR8ehDB4t-T-lOQKMfKNR-2zsOU7E3E5NA8t25HKE0,1070
+plancraft-0.3.1.dist-info/RECORD,,

{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/WHEEL RENAMED Viewed

File without changes

{plancraft-0.3.0.dist-info → plancraft-0.3.1.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

plancraft 0.3.0__py3-none-any.whl → 0.3.1__py3-none-any.whl

plancraft 0.3.0__py3-none-any.whl → 0.3.1__py3-none-any.whl