polycoding 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,346 @@
1
+ """PostgreSQL-based flow state persistence using SQLAlchemy with JSONB."""
2
+
3
+ import logging
4
+ from datetime import datetime, timezone
5
+ from typing import Any, Optional
6
+
7
+ from crewai.flow.async_feedback.types import PendingFeedbackContext
8
+ from crewai.flow.persistence import FlowPersistence, SQLiteFlowPersistence
9
+ from pydantic import BaseModel
10
+ from sqlalchemy import Index, create_engine
11
+ from sqlalchemy.dialects.postgresql import JSONB
12
+ from sqlalchemy.orm import (
13
+ DeclarativeBase,
14
+ Mapped,
15
+ mapped_column,
16
+ sessionmaker,
17
+ )
18
+ from sqlalchemy.sql.expression import text
19
+ from sqlalchemy.types import JSON, DateTime, Integer, String, TypeDecorator
20
+
21
+ from persistence.config import settings
22
+
23
# Connection string sourced from application settings; may be unset, in which
# case the SQLite fallback at the bottom of this module is used.
DATABASE_URL = settings.DATABASE_URL

# Module-level engine/session factory used by the request/payment helpers below.
# NOTE(review): created at import time — presumably DATABASE_URL is always a
# valid SQLAlchemy URL here; create_engine would raise otherwise. TODO confirm.
engine = create_engine(DATABASE_URL)
SessionLocal = sessionmaker(autocommit=False, autoflush=False, bind=engine)

logger = logging.getLogger(__name__)
29
+
30
+
31
class Base(DeclarativeBase):
    """SQLAlchemy declarative base shared by all models in this module."""
33
+
34
+
35
class JSONType(TypeDecorator):
    """JSON column type that prefers PostgreSQL's binary JSONB.

    Falls back to the generic JSON type on every other dialect so the
    models stay portable (e.g. SQLite in tests).
    """

    impl = JSON
    cache_ok = True

    def load_dialect_impl(self, dialect):
        # Choose the dialect-specific type descriptor at bind time.
        chosen = JSONB() if dialect.name == "postgresql" else JSON()
        return dialect.type_descriptor(chosen)
45
+
46
+
47
class Payments(Base):
    """Payment record tied to a GitHub issue.

    NOTE(review): column types are inferred from the Mapped[...] annotations;
    ``amount`` is an integer — presumably minor currency units (e.g. cents),
    TODO confirm.
    """

    __tablename__ = "payments"

    # Surrogate primary key.
    id: Mapped[int] = mapped_column(primary_key=True, autoincrement=True)
    # GitHub issue this payment is associated with.
    issue_number: Mapped[int] = mapped_column()
    # External payment provider identifier ("none" for manual placeholder rows,
    # see ensure_request_exists).
    payment_id: Mapped[str] = mapped_column()
    amount: Mapped[int] = mapped_column()
    currency: Mapped[str] = mapped_column()
    payment_method: Mapped[str] = mapped_column()
    status: Mapped[str] = mapped_column()
    # Set by the database at insert time.
    created_at: Mapped[datetime | None] = mapped_column(server_default=text("CURRENT_TIMESTAMP"))
    # Remains NULL until the payment is verified.
    verified_at: Mapped[datetime | None] = mapped_column(default=None)
59
+
60
+
61
class Requests(Base):
    """Work request row keyed by GitHub issue number."""

    __tablename__ = "requests"

    id: Mapped[int] = mapped_column(Integer, primary_key=True, autoincrement=True)
    issue_number: Mapped[int] = mapped_column(Integer, nullable=False)
    # Issue body text captured when the request was created.
    request_text: Mapped[str] = mapped_column(String, nullable=False)
    status: Mapped[str] = mapped_column(String, nullable=False)
    # Commit SHA recorded by update_request_status; NULL until work lands.
    commit: Mapped[str] = mapped_column(String, nullable=True)
    # NOTE(review): the column is timezone-naive DateTime but the default is an
    # aware UTC datetime — most drivers accept this, but consider
    # DateTime(timezone=True) for consistency with FlowState. TODO confirm.
    created_at: Mapped[datetime] = mapped_column(DateTime, default=lambda: datetime.now(timezone.utc))
72
+
73
+
74
def update_request_status(
    session: sessionmaker,
    issue_number: int,
    status: str,
    commit: Optional[str] = None,
) -> bool:
    """Update the status (and stored commit SHA) of a request by issue_number.

    Args:
        session: SQLAlchemy session factory
        issue_number: The issue_number to update
        status: The new status value
        commit: Commit SHA to store alongside the status. Note that the
            default of None overwrites any previously stored commit with
            NULL — pass the existing SHA if it must be preserved.

    Returns:
        True if at least one row was updated, False otherwise
    """
    with session() as sess:
        # Bulk UPDATE: affects every row with this issue_number.
        updated_rows = (
            sess.query(Requests)
            .filter_by(issue_number=issue_number)
            .update({"status": status, "commit": commit})
        )
        sess.commit()
        return updated_rows > 0
94
+
95
+
96
def ensure_request_exists(
    session: sessionmaker,
    issue_number: int,
    body: str,
    status: str = "pending",
) -> bool:
    """Ensure a request exists for the given issue_number, inserting if needed.

    A placeholder "manual" payment row is inserted alongside the request.
    Both rows are committed in a single transaction so a failure between
    inserts cannot leave an orphaned payment without its request (the
    original implementation committed them separately).

    NOTE(review): check-then-insert is racy under concurrent callers; a
    unique constraint on Requests.issue_number would make this safe —
    TODO confirm.

    Args:
        session: SQLAlchemy session factory
        issue_number: The issue_number to check/insert
        body: The issue body text
        status: The status for new requests (default: "pending")

    Returns:
        True if a new request was inserted, False if it already existed
    """
    with session() as sess:
        if sess.query(Requests).filter_by(issue_number=issue_number).first():
            return False

        placeholder_payment = Payments(
            issue_number=issue_number,
            status="manual",
            payment_id="none",
            amount=0,
            currency="USD",
            payment_method="none",
        )
        new_request = Requests(issue_number=issue_number, request_text=body, status=status)
        # One atomic commit for both rows.
        sess.add_all([placeholder_payment, new_request])
        sess.commit()
        return True
132
+
133
+
134
class FlowState(Base):
    """Append-only log of flow states; the newest row per flow_uuid is current."""

    __tablename__ = "flow_states"

    id: Mapped[int] = mapped_column(Integer, primary_key=True, autoincrement=True)
    flow_uuid: Mapped[str] = mapped_column(String(255), nullable=False)
    # Name of the flow method that produced this state snapshot.
    method_name: Mapped[str] = mapped_column(String(255), nullable=False)
    timestamp: Mapped[datetime] = mapped_column(DateTime(timezone=True), nullable=False)
    # Full serialized flow state (JSONB on PostgreSQL, JSON elsewhere).
    state_json: Mapped[dict[str, Any]] = mapped_column(JSONType, nullable=False)

    # Speeds up the "latest state for a flow" lookup in load_state.
    __table_args__ = (Index("idx_flow_states_uuid", "flow_uuid"),)
146
+
147
+
148
class PendingFeedback(Base):
    """Pending feedback marker for async human-in-the-loop flows.

    At most one row per flow (flow_uuid is unique); upserted by
    PostgresFlowPersistence.save_pending_feedback.
    """

    __tablename__ = "pending_feedback"

    id: Mapped[int] = mapped_column(Integer, primary_key=True, autoincrement=True)
    flow_uuid: Mapped[str] = mapped_column(String(255), nullable=False, unique=True)
    # Serialized PendingFeedbackContext needed to resume the flow.
    context_json: Mapped[dict[str, Any]] = mapped_column(JSONType, nullable=False)
    # Snapshot of the flow state at the moment feedback was requested.
    state_json: Mapped[dict[str, Any]] = mapped_column(JSONType, nullable=False)
    created_at: Mapped[datetime] = mapped_column(DateTime(timezone=True), nullable=False)

    __table_args__ = (Index("idx_pending_feedback_uuid", "flow_uuid"),)
160
+
161
+
162
class PostgresFlowPersistence(FlowPersistence):
    """PostgreSQL-based implementation of flow state persistence.

    Production-grade persistence using SQLAlchemy with JSONB for efficient
    querying of flow states. States are append-only; the newest row per
    flow UUID is treated as current.

    Example:
        ```python
        persistence = PostgresFlowPersistence(
            connection_string="postgresql://user:pass@localhost/db"
        )

        # Start a flow with async feedback
        try:
            flow = MyFlow(persistence=persistence)
            result = flow.kickoff()
        except HumanFeedbackPending as e:
            # Flow is paused, state is already persisted
            print(f"Waiting for feedback: {e.context.flow_id}")

        # Later, resume with feedback
        flow = MyFlow.from_pending("abc-123", persistence)
        result = flow.resume("looks good!")
        ```
    """

    def __init__(self, connection_string: str) -> None:
        """Initialize PostgreSQL persistence.

        Args:
            connection_string: PostgreSQL connection string.
                Format: postgresql://user:password@host:port/database

        Raises:
            ValueError: If connection_string is empty.
        """
        if not connection_string:
            raise ValueError("Connection string must be provided")

        self.connection_string = connection_string
        self.engine = create_engine(connection_string)
        self.Session = sessionmaker(bind=self.engine)
        self.init_db()

    def init_db(self) -> None:
        """Create the necessary tables if they don't exist."""
        Base.metadata.create_all(self.engine)

    def save_state(
        self,
        flow_uuid: str,
        method_name: str,
        state_data: dict[str, Any] | BaseModel,
    ) -> None:
        """Append the current flow state to PostgreSQL.

        Args:
            flow_uuid: Unique identifier for the flow instance
            method_name: Name of the method that just completed
            state_data: Current state data (either dict or Pydantic model)
        """
        state_dict = self._to_dict(state_data)

        with self.Session() as session:
            session.add(
                FlowState(
                    flow_uuid=flow_uuid,
                    method_name=method_name,
                    timestamp=datetime.now(timezone.utc),
                    state_json=state_dict,
                )
            )
            session.commit()

    def load_state(self, flow_uuid: str) -> dict[str, Any] | None:
        """Load the most recent state for a given flow UUID.

        Args:
            flow_uuid: Unique identifier for the flow instance

        Returns:
            The most recent state as a dictionary, or None if no state exists
        """
        with self.Session() as session:
            # Highest id == most recently appended state for this flow.
            state = (
                session.query(FlowState)
                .filter(FlowState.flow_uuid == flow_uuid)
                .order_by(FlowState.id.desc())
                .first()
            )
            return state.state_json if state else None

    def save_pending_feedback(
        self,
        flow_uuid: str,
        context: PendingFeedbackContext,
        state_data: dict[str, Any] | BaseModel,
    ) -> None:
        """Save state with a pending feedback marker.

        Stores both the flow state and the pending feedback context so the
        flow can be resumed later when feedback arrives. The marker is
        upserted: at most one pending row per flow_uuid.

        NOTE(review): the state append and the marker upsert run in two
        separate transactions; a crash in between leaves state saved with no
        marker — TODO confirm this is acceptable.

        Args:
            flow_uuid: Unique identifier for the flow instance
            context: The pending feedback context with all resume information
            state_data: Current state data
        """
        state_dict = self._to_dict(state_data)

        # Pass the already-converted dict; the original passed state_data and
        # forced save_state to run _to_dict a second time.
        self.save_state(flow_uuid, context.method_name, state_dict)

        with self.Session() as session:
            existing = (
                session.query(PendingFeedback)
                .filter(PendingFeedback.flow_uuid == flow_uuid)
                .first()
            )

            if existing:
                existing.context_json = context.to_dict()
                existing.state_json = state_dict
                existing.created_at = datetime.now(timezone.utc)
            else:
                session.add(
                    PendingFeedback(
                        flow_uuid=flow_uuid,
                        context_json=context.to_dict(),
                        state_json=state_dict,
                        created_at=datetime.now(timezone.utc),
                    )
                )

            session.commit()

    def load_pending_feedback(
        self,
        flow_uuid: str,
    ) -> tuple[dict[str, Any], PendingFeedbackContext] | None:
        """Load state and pending feedback context.

        Args:
            flow_uuid: Unique identifier for the flow instance

        Returns:
            Tuple of (state_data, pending_context) if pending feedback exists,
            None otherwise.
        """
        with self.Session() as session:
            pending = (
                session.query(PendingFeedback)
                .filter(PendingFeedback.flow_uuid == flow_uuid)
                .first()
            )

            if pending is None:
                return None
            context = PendingFeedbackContext.from_dict(pending.context_json)
            return (pending.state_json, context)

    def clear_pending_feedback(self, flow_uuid: str) -> None:
        """Clear the pending feedback marker after successful resume.

        Args:
            flow_uuid: Unique identifier for the flow instance
        """
        with self.Session() as session:
            session.query(PendingFeedback).filter(PendingFeedback.flow_uuid == flow_uuid).delete()
            session.commit()

    def _to_dict(self, state_data: dict[str, Any] | BaseModel) -> dict[str, Any]:
        """Convert state_data to a plain dict.

        Args:
            state_data: Current state data (either dict or Pydantic model)

        Returns:
            Dictionary representation of state_data

        Raises:
            ValueError: If state_data is not a dict or Pydantic model
        """
        if isinstance(state_data, BaseModel):
            return state_data.model_dump()
        if isinstance(state_data, dict):
            return state_data
        raise ValueError(f"state_data must be either a Pydantic BaseModel or dict, got {type(state_data)}")
340
+
341
+
342
# Pick the persistence backend from the configured URL: PostgreSQL when the
# URL scheme indicates it, otherwise the SQLite fallback.
if not (DATABASE_URL and DATABASE_URL.startswith("postgres")):
    persistence = SQLiteFlowPersistence()
else:
    logger.info("📊 Connecting persistence with postgres")
    persistence = PostgresFlowPersistence(connection_string=DATABASE_URL)
@@ -0,0 +1,111 @@
1
+ """SQLAlchemy model registry with auto-registration via __init_subclass__."""
2
+
3
+ import logging
4
+ from typing import Type
5
+
6
+ from sqlalchemy import MetaData
7
+ from sqlalchemy.orm import DeclarativeBase
8
+
9
log = logging.getLogger(__name__)


# Shared MetaData with a deterministic constraint-naming convention so that
# index/constraint names are stable across runs (presumably for migration
# tooling such as Alembic — TODO confirm).
METADATA = MetaData(
    naming_convention={
        "ix": "ix_%(column_0_label)s",
        "uq": "uq_%(table_name)s_%(column_0_name)s",
        "ck": "ck_%(table_name)s_%(constraint_name)s",
        "fk": "fk_%(table_name)s_%(column_0_name)s_%(referred_table_name)s",
        "pk": "pk_%(table_name)s",
    }
)
21
+
22
+
23
class ModelRegistry:
    """Central registry for ORM models from all modules.

    State lives at class level and is shared process-wide; models register
    themselves at import time via RegisteredBase.__init_subclass__.
    """

    # Maps "module.table" -> model class.
    _models: dict[str, type[DeclarativeBase]] = {}
    # Names of modules that have been processed.
    _modules: set[str] = set()

    @classmethod
    def register_model(cls, model: type[DeclarativeBase], module_name: str) -> None:
        """Register a single model under its module name."""
        key = f"{module_name}.{model.__tablename__}"
        cls._models[key] = model

    @classmethod
    def register_module(cls, module_name: str) -> None:
        """Mark a module as having been processed."""
        cls._modules.add(module_name)

    @classmethod
    def is_registered(cls, module_name: str) -> bool:
        """Return True if the module has been marked as processed."""
        return module_name in cls._modules

    @classmethod
    def create_all(cls, engine) -> None:
        """Create all registered tables in one pass."""
        METADATA.create_all(bind=engine)
        # Lazy %-args: message is only rendered when INFO is enabled.
        log.info("📊 Created %d tables from %d modules", len(cls._models), len(cls._modules))

    @classmethod
    def get_models_for_module(cls, module_name: str) -> list[type[DeclarativeBase]]:
        """Return all models belonging to a module."""
        prefix = f"{module_name}."
        return [model for key, model in cls._models.items() if key.startswith(prefix)]

    @classmethod
    def all_models(cls) -> dict[str, type[DeclarativeBase]]:
        """Return all registered models as {module.table: model}."""
        return dict(cls._models)

    @classmethod
    def reset(cls) -> None:
        """Clear registry (for testing)."""
        cls._models.clear()
        cls._modules.clear()
66
+
67
+
68
class RegisteredBase(DeclarativeBase):
    """Base class for ORM models with auto-registration.

    All models across all modules inherit from this. Each model must
    declare __module_name__ to identify its owning module.

    Usage:

        class MyModel(RegisteredBase):
            __module_name__ = "my_module"
            __tablename__ = "my_table"

            id: Mapped[int] = mapped_column(primary_key=True)

    The __init_subclass__ hook automatically registers the model with
    ModelRegistry when the class is defined (at import time).

    If __module_name__ is omitted, the registry attempts to infer it from
    the class's __module__ attribute (e.g., 'src.retro.persistence' -> 'retro').
    """

    # All subclasses share the metadata with the project naming convention.
    metadata = METADATA
    # Declared for type-checkers; subclasses set the actual value.
    __module_name__: str

    def __init_subclass__(cls, **kwargs) -> None:
        # Let SQLAlchemy's declarative machinery process the subclass first.
        super().__init_subclass__(**kwargs)

        # Abstract bases are not mapped to tables; skip registration.
        if getattr(cls, "__abstract__", False):
            return

        module_name = getattr(cls, "__module_name__", None)
        if not module_name:
            # Infer from the dotted import path: 'src.<module>...' -> '<module>'.
            parts = cls.__module__.split(".")
            if len(parts) >= 2 and parts[0] == "src":
                module_name = parts[1]

        if module_name:
            ModelRegistry.register_model(cls, module_name)
            ModelRegistry.register_module(module_name)
            log.debug(f"📊 Auto-registered: {module_name}.{cls.__tablename__}")
        else:
            # No declared name and the heuristic failed; model stays unregistered.
            log.warning(
                f"⚠️ {cls.__name__} has no __module_name__ and cannot be inferred from __module__={cls.__module__!r}"
            )
persistence/tasks.py ADDED
@@ -0,0 +1,178 @@
1
+ """Celery task tracking in PostgreSQL."""
2
+
3
+ from datetime import datetime, timedelta, timezone
4
+
5
+ from sqlalchemy import Index
6
+ from sqlalchemy.orm import Mapped, mapped_column
7
+ from sqlalchemy.types import DateTime, Integer, String, Text
8
+
9
+ from .postgres import Base
10
+
11
+
12
class CeleryTask(Base):
    """Celery task tracking model.

    Tracks all Celery tasks for monitoring and debugging purposes.
    """

    __tablename__ = "tasks"

    id: Mapped[int] = mapped_column(Integer, primary_key=True, autoincrement=True)
    # Celery task UUID; unique, so one row per tracked task.
    task_id: Mapped[str] = mapped_column(String(255), nullable=False, unique=True)
    # Flow this task belongs to (indexed below).
    flow_id: Mapped[str] = mapped_column(String(255), nullable=False)
    # e.g. 'implement_story', 'test_story' (see CeleryTaskTracker.create_task).
    task_type: Mapped[str] = mapped_column(String(100), nullable=False)
    # Lifecycle set by CeleryTaskTracker: 'pending' -> 'running' -> 'completed' | 'failed'.
    status: Mapped[str] = mapped_column(String(50), nullable=False)
    created_at: Mapped[datetime] = mapped_column(DateTime(timezone=True), nullable=False)
    started_at: Mapped[datetime | None] = mapped_column(DateTime(timezone=True), nullable=True)
    completed_at: Mapped[datetime | None] = mapped_column(DateTime(timezone=True), nullable=True)
    # Serialized result payload, if any.
    result: Mapped[str | None] = mapped_column(Text, nullable=True)
    error_message: Mapped[str | None] = mapped_column(Text, nullable=True)
    retry_count: Mapped[int] = mapped_column(Integer, default=0)
    # Optional GitHub issue number associated with the task.
    issue_number: Mapped[int | None] = mapped_column(Integer, nullable=True)

    # Indexes matching the tracker's common lookups (by flow, status, type).
    __table_args__ = (
        Index("idx_tasks_flow_id", "flow_id"),
        Index("idx_tasks_status", "status"),
        Index("idx_tasks_task_type", "task_type"),
    )
38
+
39
+
40
class CeleryTaskTracker:
    """Track Celery tasks in PostgreSQL.

    All lifecycle transitions (started/completed/failed) share a single
    fetch-update-commit helper; the original duplicated that pattern in
    three methods.
    """

    def __init__(self, session_factory):
        """Initialize task tracker.

        Args:
            session_factory: SQLAlchemy session factory
        """
        self.Session = session_factory

    def create_task(
        self,
        task_id: str,
        flow_id: str,
        task_type: str,
        issue_number: int | None = None,
    ) -> None:
        """Create a new task record.

        Args:
            task_id: Celery task ID
            flow_id: Flow ID this task belongs to
            task_type: Type of task (e.g., 'implement_story', 'test_story')
            issue_number: Optional GitHub issue number
        """
        with self.Session() as session:
            task = CeleryTask(
                task_id=task_id,
                flow_id=flow_id,
                task_type=task_type,
                status="pending",
                created_at=datetime.now(timezone.utc),
                issue_number=issue_number,
            )
            session.add(task)
            session.commit()

    def _update_fields(self, task_id: str, **fields) -> None:
        """Apply attribute updates to the task row and commit, if it exists.

        Silently does nothing when no row matches task_id (matching the
        original per-method behavior).
        """
        with self.Session() as session:
            task = session.query(CeleryTask).filter(CeleryTask.task_id == task_id).first()
            if task:
                for name, value in fields.items():
                    setattr(task, name, value)
                session.commit()

    def update_task_started(self, task_id: str) -> None:
        """Mark task as started.

        Args:
            task_id: Celery task ID
        """
        self._update_fields(task_id, status="running", started_at=datetime.now(timezone.utc))

    def update_task_completed(self, task_id: str, result: str | None = None) -> None:
        """Mark task as completed.

        Args:
            task_id: Celery task ID
            result: Optional result data
        """
        self._update_fields(
            task_id,
            status="completed",
            completed_at=datetime.now(timezone.utc),
            result=result,
        )

    def update_task_failed(self, task_id: str, error_message: str) -> None:
        """Mark task as failed.

        Args:
            task_id: Celery task ID
            error_message: Error message
        """
        self._update_fields(
            task_id,
            status="failed",
            completed_at=datetime.now(timezone.utc),
            error_message=error_message,
        )

    def increment_retry(self, task_id: str) -> None:
        """Increment retry count.

        Kept inline (not via _update_fields) because it is a read-modify-write
        of the current value.

        Args:
            task_id: Celery task ID
        """
        with self.Session() as session:
            task = session.query(CeleryTask).filter(CeleryTask.task_id == task_id).first()
            if task:
                task.retry_count += 1
                session.commit()

    def get_task(self, task_id: str) -> CeleryTask | None:
        """Get task by ID.

        Args:
            task_id: Celery task ID

        Returns:
            CeleryTask if found, None otherwise. NOTE(review): the returned
            instance is detached from its (closed) session — loaded attributes
            are readable, but lazy loads would fail. TODO confirm callers only
            read plain columns.
        """
        with self.Session() as session:
            return session.query(CeleryTask).filter(CeleryTask.task_id == task_id).first()

    def get_flow_tasks(self, flow_id: str) -> list[CeleryTask]:
        """Get all tasks for a flow, ordered by creation time.

        Args:
            flow_id: Flow ID

        Returns:
            List of (detached) CeleryTask objects
        """
        with self.Session() as session:
            return session.query(CeleryTask).filter(CeleryTask.flow_id == flow_id).order_by(CeleryTask.created_at).all()

    def cleanup_completed_tasks(self, days_old: int = 7) -> int:
        """Delete completed/failed tasks older than specified days.

        Args:
            days_old: Number of days to keep completed tasks

        Returns:
            Number of tasks deleted
        """
        cutoff_date = datetime.now(timezone.utc) - timedelta(days=days_old)

        with self.Session() as session:
            deleted = (
                session.query(CeleryTask)
                .filter(
                    CeleryTask.status.in_(["completed", "failed"]),
                    CeleryTask.completed_at < cutoff_date,
                )
                .delete()
            )
            session.commit()
            return deleted