PyPI - pearmut - Versions diffs - 1.0.1__py3-none-any.whl → 1.0.3__py3-none-any.whl - Mend

pearmut 1.0.1__py3-none-any.whl → 1.0.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (20) hide show

pearmut/app.py +56 -25
pearmut/assignment.py +340 -105
pearmut/cli.py +185 -104
pearmut/results_export.py +1 -1
pearmut/static/annotate.bundle.js +1 -0
pearmut/static/annotate.html +164 -0
pearmut/static/dashboard.bundle.js +1 -1
pearmut/static/dashboard.html +6 -1
pearmut/static/index.html +1 -1
pearmut/static/style.css +46 -0
pearmut/utils.py +40 -21
{pearmut-1.0.1.dist-info → pearmut-1.0.3.dist-info}/METADATA +119 -65
pearmut-1.0.3.dist-info/RECORD +20 -0
{pearmut-1.0.1.dist-info → pearmut-1.0.3.dist-info}/WHEEL +1 -1
pearmut/static/basic.bundle.js +0 -1
pearmut/static/basic.html +0 -133
pearmut-1.0.1.dist-info/RECORD +0 -20
{pearmut-1.0.1.dist-info → pearmut-1.0.3.dist-info}/entry_points.txt +0 -0
{pearmut-1.0.1.dist-info → pearmut-1.0.3.dist-info}/licenses/LICENSE +0 -0
{pearmut-1.0.1.dist-info → pearmut-1.0.3.dist-info}/top_level.txt +0 -0

pearmut/cli.py CHANGED Viewed

@@ -3,20 +3,49 @@ Command-line interface for managing and running the Pearmut server.
 """
 import argparse
+import atexit
+import fcntl
 import hashlib
 import json
 import os
 import urllib.parse
-import psutil
-from .utils import ROOT, load_progress_data, save_progress_data
+from .utils import (
+    ROOT,
+    TOKEN_MAIN,
+    is_form_document,
+    load_progress_data,
+    save_progress_data,
+)
 os.makedirs(f"{ROOT}/data/tasks", exist_ok=True)
 load_progress_data(warn=None)
 def _run(args_unknown):
+    # Acquire lock before starting server
+    lock_file = f"{ROOT}/data/.lock"
+    try:
+        lock_fd = open(lock_file, "a+")
+        fcntl.flock(lock_fd.fileno(), fcntl.LOCK_EX | fcntl.LOCK_NB)
+        lock_fd.seek(0)
+        lock_fd.truncate()
+        lock_fd.write(str(os.getpid()))
+        lock_fd.flush()
+    except BlockingIOError:
+        try:
+            with open(lock_file, "r") as f:
+                pid = f.read().strip()
+            print("You can't run multiple instances of Pearmut in the same directory.")
+            if pid:
+                print(f"Another instance (PID {pid}) is holding the lock.")
+        except (FileNotFoundError, PermissionError, OSError):
+            print("You can't run multiple instances of Pearmut in the same directory.")
+        exit(1)
+    # Register cleanup to remove lock file on exit
+    atexit.register(lambda: os.path.exists(lock_file) and os.remove(lock_file))
     import uvicorn
     from .app import app, tasks_data
@@ -33,29 +62,29 @@ def _run(args_unknown):
     args = args.parse_args(args_unknown)
     # print access dashboard URL for all campaigns
-    if tasks_data:
-        dashboard_url = (
-            args.server
-            + "/dashboard.html?"
-            + "&".join(
-                [
-                    f"campaign_id={urllib.parse.quote_plus(campaign_id)}&token={campaign_data["token"]}"
-                    for campaign_id, campaign_data in tasks_data.items()
-                ]
-            )
-        )
-        print(
-            "\033[92mNow serving Pearmut, use the following URL to access the everything-dashboard:\033[0m"
+    dashboard_url = (
+        args.server
+        + "/dashboard?"
+        + f"token_main={TOKEN_MAIN}"
+        + "".join(
+            [
+                f"&campaign_id={urllib.parse.quote_plus(campaign_id)}&token={campaign_data['token']}"
+                for campaign_id, campaign_data in tasks_data.items()
+            ]
         )
-        print("🍐", dashboard_url + "\n", flush=True)
+    )
+    print(
+        "\033[92mNow serving Pearmut, use the following URL to access the everything-dashboard:\033[0m"
+    )
+    print("🍐", dashboard_url + "\n", flush=True)
     # disable startup message
     uvicorn.config.LOGGING_CONFIG["loggers"]["uvicorn.error"]["level"] = "WARNING"
     # set time logging
     uvicorn.config.LOGGING_CONFIG["formatters"]["access"]["datefmt"] = "%Y-%m-%d %H:%M"
-    uvicorn.config.LOGGING_CONFIG["formatters"]["access"][
-        "fmt"
-    ] = "%(asctime)s %(levelprefix)s %(client_addr)s - %(request_line)s %(status_code)s"
+    uvicorn.config.LOGGING_CONFIG["formatters"]["access"]["fmt"] = (
+        "%(asctime)s %(levelprefix)s %(client_addr)s - %(request_line)s %(status_code)s"
+    )
     uvicorn.run(
         app,
         host="0.0.0.0",
@@ -67,8 +96,11 @@ def _run(args_unknown):
 def _validate_item_structure(items):
     """
     Validate that items have the correct structure.
-    Items should be lists of dictionaries with 'tgt' and optionally 'src' and/or 'ref' keys.
-    The 'tgt' field should be a dictionary mapping model names to translations.
+    Items can be either:
+    1. Evaluation items: dictionaries with 'tgt' and optionally 'src' and/or 'ref' keys
+    2. Form items: dictionaries with 'text' and 'form' keys
+    A document must contain either all evaluation items or all form items (not mixed).
     Args:
         items: List of item dictionaries to validate
@@ -76,68 +108,100 @@ def _validate_item_structure(items):
     if not isinstance(items, list):
         raise ValueError("Items must be a list")
-    for item in items:
-        if not isinstance(item, dict):
-            raise ValueError("Each item must be a dictionary with 'tgt' key")
-        if "tgt" not in item:
-            raise ValueError("Each item must contain 'tgt' key")
+    if not items:
+        raise ValueError("Items list cannot be empty")
-        # Validate src is a string if present
-        if "src" in item and not isinstance(item["src"], str):
-            raise ValueError("Item 'src' must be a string")
+    # Check if first item is a form item or evaluation item
+    first_item = items[0]
+    if not isinstance(first_item, dict):
+        raise ValueError("Each item must be a dictionary")
-        # Validate ref is a string if present
-        if "ref" in item and not isinstance(item["ref"], str):
-            raise ValueError("Item 'ref' must be a string")
+    first_item_is_form = "text" in first_item and "form" in first_item
-        # Validate tgt is a dictionary (basic template with model names)
-        if isinstance(item["tgt"], str):
-            # String not allowed - suggest using dictionary (don't include user input to prevent injection)
-            raise ValueError(
-                'Item \'tgt\' must be a dictionary mapping model names to translations. For single translation, use {"default": "your_translation"}'
-            )
-        elif isinstance(item["tgt"], dict):
-            # Dictionary mapping model names to translations
-            # Validate that model names don't contain only numbers (JavaScript ordering issue)
-            for model_name, translation in item["tgt"].items():
-                if not isinstance(model_name, str):
-                    raise ValueError("Model names in 'tgt' dictionary must be strings")
-                if model_name.isdigit():
-                    raise ValueError(
-                        f"Model name '{model_name}' cannot be only numeric digits (would cause issues in JS/TS)"
-                    )
-                if not isinstance(translation, str):
-                    raise ValueError(
-                        f"Translation for model '{model_name}' must be a string"
-                    )
+    for item in items:
+        if not isinstance(item, dict):
+            raise ValueError("Each item must be a dictionary")
+        # Check consistency: all items must be same type (form or evaluation)
+        current_is_form = "text" in item and "form" in item
+        if current_is_form != first_item_is_form:
+            raise ValueError("Document cannot mix form items and evaluation items")
+        if first_item_is_form:
+            # Validate form item structure
+            if "text" not in item:
+                raise ValueError("Form item must contain 'text' key")
+            if "form" not in item:
+                raise ValueError("Form item must contain 'form' key")
+            if not isinstance(item["text"], str):
+                raise ValueError("Form item 'text' must be a string")
+            if item["form"] not in {None, "number", "string", "choices", "script"}:
+                raise ValueError(
+                    "Form item 'form' must be null, 'number', 'string', 'choices', or 'script'"
+                )
         else:
-            raise ValueError(
-                "Item 'tgt' must be a dictionary mapping model names to translations"
-            )
+            # Validate evaluation item structure
+            if "tgt" not in item:
+                raise ValueError("Each item must contain 'tgt' key")
+            # Validate src is a string if present
+            if "src" in item and not isinstance(item["src"], str):
+                raise ValueError("Item 'src' must be a string")
+            # Validate ref is a string if present
+            if "ref" in item and not isinstance(item["ref"], str):
+                raise ValueError("Item 'ref' must be a string")
-        # Validate error_spans structure if present
-        if "error_spans" in item:
-            if not isinstance(item["error_spans"], dict):
+            # Validate tgt is a dictionary (annotate template with model names)
+            if isinstance(item["tgt"], str):
+                # String not allowed - suggest using dictionary (don't include user input to prevent injection)
                 raise ValueError(
-                    "'error_spans' must be a dictionary mapping model names to error span lists"
+                    'Item \'tgt\' must be a dictionary mapping model names to translations. For single translation, use {"default": "your_translation"}'
                 )
-            for model_name, spans in item["error_spans"].items():
-                if not isinstance(spans, list):
-                    raise ValueError(
-                        f"Error spans for model '{model_name}' must be a list"
-                    )
-        # Validate validation structure if present
-        if "validation" in item:
-            if not isinstance(item["validation"], dict):
+            elif isinstance(item["tgt"], dict):
+                # Dictionary mapping model names to translations
+                # Validate that model names don't contain only numbers (JavaScript ordering issue)
+                for model_name, translation in item["tgt"].items():
+                    if not isinstance(model_name, str):
+                        raise ValueError(
+                            "Model names in 'tgt' dictionary must be strings"
+                        )
+                    if model_name.isdigit():
+                        raise ValueError(
+                            f"Model name '{model_name}' cannot be only numeric digits (would cause issues in JS/TS)"
+                        )
+                    if not isinstance(translation, str):
+                        raise ValueError(
+                            f"Translation for model '{model_name}' must be a string"
+                        )
+            else:
                 raise ValueError(
-                    "'validation' must be a dictionary mapping model names to validation rules"
+                    "Item 'tgt' must be a dictionary mapping model names to translations"
                 )
-            for model_name, val_rule in item["validation"].items():
-                if not isinstance(val_rule, dict):
+            # Validate error_spans structure if present
+            if "error_spans" in item:
+                if not isinstance(item["error_spans"], dict):
+                    raise ValueError(
+                        "'error_spans' must be a dictionary mapping model names to error span lists"
+                    )
+                for model_name, spans in item["error_spans"].items():
+                    if not isinstance(spans, list):
+                        raise ValueError(
+                            f"Error spans for model '{model_name}' must be a list"
+                        )
+            # Validate validation structure if present
+            if "validation" in item:
+                if not isinstance(item["validation"], dict):
                     raise ValueError(
-                        f"Validation rule for model '{model_name}' must be a dictionary"
+                        "'validation' must be a dictionary mapping model names to validation rules"
                     )
+                for model_name, val_rule in item["validation"].items():
+                    if not isinstance(val_rule, dict):
+                        raise ValueError(
+                            f"Validation rule for model '{model_name}' must be a dictionary"
+                        )
 def _validate_document_models(doc):
@@ -185,6 +249,10 @@ def _shuffle_campaign_data(campaign_data, rng):
     def shuffle_document(doc):
         """Shuffle a single document (list of items) by reordering models in tgt dict."""
+        # Skip shuffling for form documents (they don't have tgt)
+        if is_form_document(doc):
+            return  # Form documents don't need shuffling
         # Validate that all items have the same models
         _validate_document_models(doc)
@@ -238,7 +306,7 @@ def _add_single_campaign(campaign_data, overwrite, server):
     if "assignment" not in campaign_data["info"]:
         raise ValueError("Campaign 'info' must contain 'assignment' field.")
-    # Template defaults to "basic" if not specified
+    # Template defaults to "annotate" if not specified
     assignment = campaign_data["info"]["assignment"]
     # use random words for identifying users
     rng = random.Random()
@@ -248,6 +316,20 @@ def _add_single_campaign(campaign_data, overwrite, server):
     users_spec = campaign_data["info"].get("users")
     user_tokens = {}  # user_id -> {"pass": ..., "fail": ...}
+    # Validate and process data_welcome if present
+    data_welcome = campaign_data.get("data_welcome", [])
+    if data_welcome:
+        if not isinstance(data_welcome, list):
+            raise ValueError("'data_welcome' must be a list of documents.")
+        # Validate welcome documents structure - each should be a list of items
+        for doc_i, doc in enumerate(data_welcome):
+            if not isinstance(doc, list):
+                raise ValueError(f"Welcome document {doc_i} must be a list of items.")
+            try:
+                _validate_item_structure(doc)
+            except ValueError as e:
+                raise ValueError(f"Welcome document {doc_i}: {e}")
     if assignment == "task-based":
         tasks = campaign_data["data"]
         if not isinstance(tasks, list):
@@ -303,14 +385,14 @@ def _add_single_campaign(campaign_data, overwrite, server):
         # Validate dynamic-specific parameters
         if "dynamic_top" not in campaign_data["info"]:
             campaign_data["info"]["dynamic_top"] = 2
-        if "dynamic_first" not in campaign_data["info"]:
-            campaign_data["info"]["dynamic_first"] = 5
+        if "dynamic_warmup" not in campaign_data["info"]:
+            campaign_data["info"]["dynamic_warmup"] = 5
         if "dynamic_contrastive_models" not in campaign_data["info"]:
             campaign_data["info"]["dynamic_contrastive_models"] = 1
-        # Validate that dynamic_first is at least 1
-        assert (
-            campaign_data["info"]["dynamic_first"] >= 1
-        ), "dynamic_first must be at least 1"
+        # Validate that dynamic_warmup is at least 1
+        assert campaign_data["info"]["dynamic_warmup"] >= 1, (
+            "dynamic_warmup must be at least 1"
+        )
         # Validate that dynamic_contrastive_models is at most dynamic_top
         assert (
             campaign_data["info"]["dynamic_contrastive_models"]
@@ -324,9 +406,9 @@ def _add_single_campaign(campaign_data, overwrite, server):
         for item in campaign_data["data"]:
             if item and len(item) > 0:
                 item_models = set(item[0]["tgt"].keys())
-                assert (
-                    item_models == all_models
-                ), "All items must have the same model outputs"
+                assert item_models == all_models, (
+                    "All items must have the same model outputs"
+                )
     else:
         raise ValueError(f"Unknown campaign assignment type: {assignment}")
@@ -391,13 +473,20 @@ def _add_single_campaign(campaign_data, overwrite, server):
         if os.path.exists(output_file):
             os.remove(output_file)
+    # Prepend data_welcome to tasks if present
+    if data_welcome:
+        if assignment == "task-based":
+            tasks = [task for task in tasks]
+        elif assignment in ["single-stream", "dynamic"]:
+            tasks = data_welcome + tasks
     # For task-based, data is a dict mapping user_id -> tasks
     # For single-stream and dynamic, data is a flat list (shared among all users)
     if assignment == "task-based":
         campaign_data["data"] = {
             user_id: task for user_id, task in zip(user_ids, tasks)
         }
-    elif assignment in ["single-stream", "dynamic"]:
+    elif assignment in {"single-stream", "dynamic"}:
         campaign_data["data"] = tasks
     # generate a token for dashboard access if not present
@@ -413,25 +502,24 @@ def _add_single_campaign(campaign_data, overwrite, server):
     user_progress = {
         user_id: {
-            # TODO: progress tracking could be based on the assignment type
+            # Progress tracking: None | "completed" for task-based,
+            # None | "completed" | "completed_foreign" for single-stream/dynamic
             "progress": (
-                [False] * len(campaign_data["data"][user_id])
+                [None] * len(campaign_data["data"][user_id])
                 if assignment == "task-based"
-                else (
-                    [False] * len(campaign_data["data"])
-                    if assignment == "single-stream"
-                    else (
-                        [list() for _ in range(len(campaign_data["data"]))]
-                        if assignment == "dynamic"
-                        else []
-                    )
-                )
+                else [None] * len(campaign_data["data"])
+                if assignment == "single-stream"
+                else [{model: None for model in all_models}]
+                * len(campaign_data["data"])
+                if assignment == "dynamic"
+                else int(f"Invalid assignment: {assignment}")
             ),
+            "progress_welcome": [None] * len(data_welcome),
             "time_start": None,
             "time_end": None,
             "time": 0,
             "url": (
-                f"{campaign_data['info'].get("template", "basic")}.html"
+                f"{campaign_data['info'].get('template', 'annotate')}"
                 f"?campaign_id={urllib.parse.quote_plus(campaign_data['campaign_id'])}"
                 f"&user_id={user_id}"
             ),
@@ -527,7 +615,7 @@ def _add_single_campaign(campaign_data, overwrite, server):
     )
     for user_id, user_val in user_progress.items():
         # point to the protocol URL
-        print(f'🧑 {server}/{user_val["url"]}')
+        print(f"🧑 {server}/{user_val['url']}")
     print()
@@ -578,13 +666,6 @@ def main():
     )
     args, args_unknown = args.parse_known_args()
-    # enforce that only one pearmut process is running
-    for p in psutil.process_iter():
-        if "pearmut" == p.name() and p.pid != os.getpid():
-            print("Exit all running pearmut processes before running more commands.")
-            print(p)
-            exit(1)
     if args.command == "run":
         _run(args_unknown)
     elif args.command == "add":

pearmut/results_export.py CHANGED Viewed

@@ -39,7 +39,7 @@ def compute_model_scores(campaign_id):
     # Compute model scores from annotations
     model_scores = collections.defaultdict(dict)
-    # Iterate through all tasks to find items with 'models' field (basic template)
+    # Iterate through all tasks to find items with 'models' field (annotate template)
     log = get_db_log(campaign_id)
     for entry in log:
         if "item" not in entry or "annotation" not in entry:

pearmut 1.0.1__py3-none-any.whl → 1.0.3__py3-none-any.whl

pearmut 1.0.1__py3-none-any.whl → 1.0.3__py3-none-any.whl