devseeker 0.0.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (62) hide show
  1. devseeker/__init__.py +4 -0
  2. devseeker/applications/__init__.py +0 -0
  3. devseeker/applications/cli/__init__.py +0 -0
  4. devseeker/applications/cli/cli_agent.py +232 -0
  5. devseeker/applications/cli/collect.py +177 -0
  6. devseeker/applications/cli/file_selector.py +540 -0
  7. devseeker/applications/cli/learning.py +299 -0
  8. devseeker/applications/cli/main.py +561 -0
  9. devseeker/benchmark/__init__.py +0 -0
  10. devseeker/benchmark/__main__.py +154 -0
  11. devseeker/benchmark/bench_config.py +69 -0
  12. devseeker/benchmark/benchmarks/apps/load.py +118 -0
  13. devseeker/benchmark/benchmarks/apps/problem.py +25 -0
  14. devseeker/benchmark/benchmarks/apps/problems.py +3 -0
  15. devseeker/benchmark/benchmarks/gptme/load.py +104 -0
  16. devseeker/benchmark/benchmarks/load.py +48 -0
  17. devseeker/benchmark/benchmarks/mbpp/load.py +114 -0
  18. devseeker/benchmark/benchmarks/mbpp/problem.py +25 -0
  19. devseeker/benchmark/benchmarks/mbpp/problems.py +3 -0
  20. devseeker/benchmark/default_bench_config.toml +16 -0
  21. devseeker/benchmark/run.py +150 -0
  22. devseeker/benchmark/types.py +94 -0
  23. devseeker/core/__init__.py +0 -0
  24. devseeker/core/ai.py +437 -0
  25. devseeker/core/base_agent.py +31 -0
  26. devseeker/core/base_execution_env.py +42 -0
  27. devseeker/core/base_memory.py +15 -0
  28. devseeker/core/chat_to_files.py +245 -0
  29. devseeker/core/default/__init__.py +0 -0
  30. devseeker/core/default/constants.py +12 -0
  31. devseeker/core/default/disk_execution_env.py +111 -0
  32. devseeker/core/default/disk_memory.py +326 -0
  33. devseeker/core/default/file_store.py +62 -0
  34. devseeker/core/default/paths.py +86 -0
  35. devseeker/core/default/simple_agent.py +100 -0
  36. devseeker/core/default/steps.py +397 -0
  37. devseeker/core/diff.py +419 -0
  38. devseeker/core/files_dict.py +115 -0
  39. devseeker/core/git.py +85 -0
  40. devseeker/core/linting.py +64 -0
  41. devseeker/core/preprompts_holder.py +29 -0
  42. devseeker/core/project_config.py +167 -0
  43. devseeker/core/prompt.py +44 -0
  44. devseeker/core/token_usage.py +297 -0
  45. devseeker/core/version_manager.py +30 -0
  46. devseeker/preprompts/clarify +3 -0
  47. devseeker/preprompts/entrypoint +6 -0
  48. devseeker/preprompts/file_format +20 -0
  49. devseeker/preprompts/file_format_diff +41 -0
  50. devseeker/preprompts/file_format_fix +22 -0
  51. devseeker/preprompts/generate +15 -0
  52. devseeker/preprompts/improve +15 -0
  53. devseeker/preprompts/philosophy +12 -0
  54. devseeker/preprompts/roadmap +2 -0
  55. devseeker/tools/__init__.py +0 -0
  56. devseeker/tools/custom_steps.py +233 -0
  57. devseeker/tools/supported_languages.py +58 -0
  58. devseeker-0.0.1.dist-info/LICENSE +22 -0
  59. devseeker-0.0.1.dist-info/METADATA +120 -0
  60. devseeker-0.0.1.dist-info/RECORD +62 -0
  61. devseeker-0.0.1.dist-info/WHEEL +4 -0
  62. devseeker-0.0.1.dist-info/entry_points.txt +7 -0
devseeker/__init__.py ADDED
@@ -0,0 +1,4 @@
1
+ # Adding convenience imports to the package
2
+
3
+ # from devseeker.tools import code_vector_repository
4
+ # from devseeker.core.default import on_disk_repository
File without changes
File without changes
@@ -0,0 +1,232 @@
1
+ """
2
+ This module provides the CliAgent class which manages the lifecycle of code generation and improvement
3
+ using an AI model. It includes functionalities to initialize code generation, improve existing code,
4
+ and process the code through various steps defined in the step bundle.
5
+ """
6
+
7
+ from typing import Callable, Optional, TypeVar
8
+
9
+ # from devseeker.core.default.git_version_manager import GitVersionManager
10
+ from devseeker.core.ai import AI
11
+ from devseeker.core.base_agent import BaseAgent
12
+ from devseeker.core.base_execution_env import BaseExecutionEnv
13
+ from devseeker.core.base_memory import BaseMemory
14
+ from devseeker.core.default.disk_execution_env import DiskExecutionEnv
15
+ from devseeker.core.default.disk_memory import DiskMemory
16
+ from devseeker.core.default.paths import PREPROMPTS_PATH
17
+ from devseeker.core.default.steps import (
18
+ execute_entrypoint,
19
+ gen_code,
20
+ gen_entrypoint,
21
+ improve_fn,
22
+ )
23
+ from devseeker.core.files_dict import FilesDict
24
+ from devseeker.core.preprompts_holder import PrepromptsHolder
25
+ from devseeker.core.prompt import Prompt
26
+
27
+ CodeGenType = TypeVar("CodeGenType", bound=Callable[[AI, str, BaseMemory], FilesDict])
28
+ CodeProcessor = TypeVar(
29
+ "CodeProcessor", bound=Callable[[AI, BaseExecutionEnv, FilesDict], FilesDict]
30
+ )
31
+ ImproveType = TypeVar(
32
+ "ImproveType", bound=Callable[[AI, str, FilesDict, BaseMemory], FilesDict]
33
+ )
34
+
35
+
36
class CliAgent(BaseAgent):
    """
    The `CliAgent` class is responsible for managing the lifecycle of code generation and improvement
    using an AI model. It orchestrates the generation of new code and the improvement of existing code
    based on given prompts and utilizes a memory system and execution environment for processing.

    Parameters
    ----------
    memory : BaseMemory
        An instance of a class that adheres to the BaseMemory interface, used for storing and retrieving
        information during the code generation process.
    execution_env : BaseExecutionEnv
        An instance of a class that adheres to the BaseExecutionEnv interface, used for executing code
        and managing the execution environment.
    ai : AI, optional
        An instance of the AI class that manages calls to the language model. If not provided, a default
        instance is created.
    code_gen_fn : CodeGenType, optional
        A callable that takes an AI instance, a prompt, and a memory instance to generate code. Defaults
        to the `gen_code` function.
    improve_fn : ImproveType, optional
        A callable that takes an AI instance, a prompt, a FilesDict instance, and a memory instance to
        improve code. Defaults to the `improve_fn` function.
    process_code_fn : CodeProcessor, optional
        A callable that takes an AI instance, an execution environment, and a FilesDict instance to
        process code. Defaults to the `execute_entrypoint` function.
    preprompts_holder : PrepromptsHolder, optional
        An instance of PrepromptsHolder that manages preprompt templates. If not provided, a default
        instance is created using the PREPROMPTS_PATH.

    Attributes
    ----------
    memory : BaseMemory
        The memory instance where the agent stores and retrieves information.
    execution_env : BaseExecutionEnv
        The execution environment instance where the agent executes and manages code.
    ai : AI
        The AI instance used for interacting with the language model.
    code_gen_fn : CodeGenType
        The function used for generating code.
    improve_fn : ImproveType
        The function used for improving code.
    process_code_fn : CodeProcessor
        The function used for processing code.
    preprompts_holder : PrepromptsHolder
        The holder for preprompt templates.
    """

    def __init__(
        self,
        memory: BaseMemory,
        execution_env: BaseExecutionEnv,
        ai: Optional[AI] = None,
        code_gen_fn: CodeGenType = gen_code,
        improve_fn: ImproveType = improve_fn,
        process_code_fn: CodeProcessor = execute_entrypoint,
        preprompts_holder: Optional[PrepromptsHolder] = None,
    ):
        self.memory = memory
        self.execution_env = execution_env
        # Fall back to a freshly constructed AI when the caller supplies none.
        self.ai = ai or AI()
        self.code_gen_fn = code_gen_fn
        self.process_code_fn = process_code_fn
        self.improve_fn = improve_fn
        # Default preprompts come from the bundled PREPROMPTS_PATH directory.
        self.preprompts_holder = preprompts_holder or PrepromptsHolder(PREPROMPTS_PATH)

    @classmethod
    def with_default_config(
        cls,
        memory: DiskMemory,
        execution_env: DiskExecutionEnv,
        ai: Optional[AI] = None,
        code_gen_fn: CodeGenType = gen_code,
        improve_fn: ImproveType = improve_fn,
        process_code_fn: CodeProcessor = execute_entrypoint,
        preprompts_holder: Optional[PrepromptsHolder] = None,
        diff_timeout: int = 3,  # NOTE(review): accepted but never forwarded to cls() — confirm intent
    ):
        """
        Creates a new instance of CliAgent with default configurations for memory, execution environment,
        AI, and other functional parameters.

        Parameters
        ----------
        memory : DiskMemory
            An instance of DiskMemory for storing and retrieving information.
        execution_env : DiskExecutionEnv
            An instance of DiskExecutionEnv for executing code.
        ai : AI, optional
            An instance of AI for interacting with the language model. Defaults to None, which will create
            a new AI instance.
        code_gen_fn : CodeGenType, optional
            A function for generating code. Defaults to `gen_code`.
        improve_fn : ImproveType, optional
            A function for improving code. Defaults to `improve_fn`.
        process_code_fn : CodeProcessor, optional
            A function for processing code. Defaults to `execute_entrypoint`.
        preprompts_holder : PrepromptsHolder, optional
            An instance of PrepromptsHolder for managing preprompt templates. Defaults to None, which will
            create a new PrepromptsHolder instance using PREPROMPTS_PATH.
        diff_timeout : int, optional
            Timeout (seconds, presumably) for diff processing; currently unused by this
            constructor.

        Returns
        -------
        CliAgent
            An instance of CliAgent configured with the provided or default parameters.
        """
        return cls(
            memory=memory,
            execution_env=execution_env,
            ai=ai,
            code_gen_fn=code_gen_fn,
            process_code_fn=process_code_fn,
            improve_fn=improve_fn,
            preprompts_holder=preprompts_holder or PrepromptsHolder(PREPROMPTS_PATH),
        )

    def init(self, prompt: Prompt) -> FilesDict:
        """
        Generates a new piece of code using the AI and step bundle based on the provided prompt.

        Parameters
        ----------
        prompt : Prompt
            A prompt that guides the code generation process.

        Returns
        -------
        FilesDict
            An instance of the `FilesDict` class containing the generated code.
        """

        # NOTE(review): code_gen_fn is called with four arguments although
        # CodeGenType declares three — confirm the TypeVar bound is stale.
        files_dict = self.code_gen_fn(
            self.ai, prompt, self.memory, self.preprompts_holder
        )
        entrypoint = gen_entrypoint(
            self.ai, prompt, files_dict, self.memory, self.preprompts_holder
        )
        # Merge generated files with the entrypoint; entrypoint entries win on
        # key collisions because they are unpacked last.
        combined_dict = {**files_dict, **entrypoint}
        files_dict = FilesDict(combined_dict)
        files_dict = self.process_code_fn(
            self.ai,
            self.execution_env,
            files_dict,
            preprompts_holder=self.preprompts_holder,
            prompt=prompt,
            memory=self.memory,
        )
        return files_dict

    def improve(
        self,
        files_dict: FilesDict,
        prompt: Prompt,
        execution_command: Optional[str] = None,
        diff_timeout: int = 3,
    ) -> FilesDict:
        """
        Improves an existing piece of code using the AI and step bundle based on the provided prompt.

        Parameters
        ----------
        files_dict : FilesDict
            An instance of `FilesDict` containing the code to be improved.
        prompt : Prompt
            A prompt that guides the code improvement process.
        execution_command : str, optional
            An optional command to execute the code. Currently unused in this method.
        diff_timeout : int, optional
            Timeout forwarded to `improve_fn` for diff processing.

        Returns
        -------
        FilesDict
            An instance of the `FilesDict` class containing the improved code.
        """

        files_dict = self.improve_fn(
            self.ai,
            prompt,
            files_dict,
            self.memory,
            self.preprompts_holder,
            diff_timeout=diff_timeout,
        )
        # Entrypoint regeneration and post-processing are intentionally
        # disabled for the improve flow; kept for reference.
        # entrypoint = gen_entrypoint(
        #     self.ai, prompt, files_dict, self.memory, self.preprompts_holder
        # )
        # combined_dict = {**files_dict, **entrypoint}
        # files_dict = FilesDict(combined_dict)
        # files_dict = self.process_code_fn(
        #     self.ai,
        #     self.execution_env,
        #     files_dict,
        #     preprompts_holder=self.preprompts_holder,
        #     prompt=prompt,
        #     memory=self.memory,
        # )

        return files_dict
@@ -0,0 +1,177 @@
1
+ """
2
+ Module `collect` - Data Handling and RudderStack Integration
3
+
4
+ This module provides functionalities to handle and send learning data to RudderStack
5
+ for the purpose of analysis and to improve the gpt-engineer system. The data is sent
6
+ only when the user gives consent to share.
7
+
8
+ Functions:
9
+ send_learning(learning): Sends learning data to RudderStack.
10
+ collect_learnings(prompt, model, temperature, config, memory, review): Processes and sends learning data.
11
+ collect_and_send_human_review(prompt, model, temperature, config, memory): Collects human feedback and sends it.
12
+
13
+ Dependencies:
14
+ hashlib: For generating SHA-256 hash.
15
+ typing: For type annotations.
16
+ devseeker.core: Core functionalities of gpt-engineer.
17
+ devseeker.cli.learning: Handles the extraction of learning data.
18
+
19
+ Notes:
20
+ Data sent to RudderStack is not shared with third parties and is used solely to
21
+ improve gpt-engineer and allow it to handle a broader range of use cases.
22
+ Consent logic is in devseeker/learning.py.
23
+ """
24
+
25
from typing import Any, Tuple

from devseeker.applications.cli.learning import (
    Learning,
    Review,
    extract_learning,
    human_review_input,
)
from devseeker.core.default.disk_memory import DiskMemory
from devseeker.core.prompt import Prompt
35
+
36
+
37
def send_learning(learning: Learning):
    """
    Push one learning event to RudderStack for analysis.

    Parameters
    ----------
    learning : Learning
        An instance of the Learning class containing the data to be sent.

    Notes
    -----
    This function is only called if consent is given to share data.
    Data is not shared to a third party. It is used with the sole purpose of
    improving gpt-engineer, and letting it handle more use cases.
    Consent logic is in devseeker/learning.py.
    """
    # Imported lazily so the rudderstack dependency is only touched when
    # the user has actually consented to telemetry.
    import rudderstack.analytics as rudder_analytics

    rudder_analytics.write_key = "2Re4kqwL61GDp7S8ewe6K5dbogG"
    rudder_analytics.dataPlaneUrl = "https://gptengineerezm.dataplane.rudderstack.com"
    rudder_analytics.track(
        user_id=learning.session,
        event="learning",
        properties=learning.to_dict(),  # type: ignore
    )
63
+
64
+
65
def collect_learnings(
    prompt: Prompt,
    model: str,
    temperature: float,
    config: Any,
    memory: DiskMemory,
    review: Review,
):
    """
    Collect the learning data and send it to RudderStack for analysis.

    Parameters
    ----------
    prompt : Prompt
        The initial prompt or question that was provided to the model.
    model : str
        The name of the model used for generating the response.
    temperature : float
        The temperature setting used in the model's response generation.
    config : Any
        Configuration parameters used for the learning session.
    memory : DiskMemory
        An instance of DiskMemory for storing and retrieving data.
    review : Review
        An instance of Review containing human feedback on the model's response.

    Notes
    -----
    This function attempts to send the learning data to RudderStack. If the data size exceeds
    the maximum allowed size, it trims the data and retries sending it.
    """
    learnings = extract_learning(prompt, model, temperature, config, memory, review)
    try:
        send_learning(learnings)
    except RuntimeError:
        # try to remove some parts of learning that might be too big
        # rudderstack max event size is 32kb
        max_size = 32 << 10  # 32KB in bytes
        current_size = len(learnings.to_json().encode("utf-8"))  # get size in bytes

        overflow = current_size - max_size

        # Add some extra characters for the "[REMOVED...]" string and for safety margin.
        # Clamp to at least 1: if the RuntimeError was not caused by payload size,
        # overflow is negative and an unclamped value would make logs[:-remove_length]
        # slice from the wrong end (or be a no-op with a misleading marker).
        remove_length = max(overflow + len(f"[REMOVED {overflow} CHARACTERS]") + 100, 1)

        learnings.logs = (
            learnings.logs[:-remove_length]
            + f"\n\n[REMOVED {remove_length} CHARACTERS]"
        )

        print(
            "WARNING: learning too big, removing some parts. "
            "Please report if this results in a crash."
        )
        try:
            send_learning(learnings)
        except RuntimeError:
            print(
                "Sending learnings crashed despite truncation. Progressing without saving learnings."
            )
125
+
126
+
127
+ # def steps_file_hash():
128
+ # """
129
+ # Compute the SHA-256 hash of the steps file.
130
+ #
131
+ # Returns
132
+ # -------
133
+ # str
134
+ # The SHA-256 hash of the steps file.
135
+ # """
136
+ # with open(steps.__file__, "r") as f:
137
+ # content = f.read()
138
+ # return hashlib.sha256(content.encode("utf-8")).hexdigest()
139
+
140
+
141
def collect_and_send_human_review(
    prompt: Prompt,
    model: str,
    temperature: float,
    config: Tuple[str, ...],
    memory: DiskMemory,
):
    """
    Ask the user to review the generated code and forward the feedback.

    Parameters
    ----------
    prompt : Prompt
        The initial prompt or question that was provided to the model.
    model : str
        The name of the model used for generating the response.
    temperature : float
        The temperature setting used in the model's response generation.
    config : Tuple[str, ...]
        Configuration parameters used for the learning session.
    memory : DiskMemory
        An instance of DiskMemory for storing and retrieving data.

    Returns
    -------
    None

    Notes
    -----
    The review is gathered via `human_review_input`; when the user supplies
    one, it is handed to `collect_learnings` for transmission.
    """
    # Only forward feedback when the user actually provided a review.
    if review := human_review_input():
        collect_learnings(prompt, model, temperature, config, memory, review)