PyPI - pearmut - Versions diffs - 1.0.1__py3-none-any.whl → 1.0.3__py3-none-any.whl - Mend

pearmut 1.0.1py3-none-any.whl → 1.0.3py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (20) hide show

pearmut/app.py +56 -25
pearmut/assignment.py +340 -105
pearmut/cli.py +185 -104
pearmut/results_export.py +1 -1
pearmut/static/annotate.bundle.js +1 -0
pearmut/static/annotate.html +164 -0
pearmut/static/dashboard.bundle.js +1 -1
pearmut/static/dashboard.html +6 -1
pearmut/static/index.html +1 -1
pearmut/static/style.css +46 -0
pearmut/utils.py +40 -21
{pearmut-1.0.1.dist-info → pearmut-1.0.3.dist-info}/METADATA +119 -65
pearmut-1.0.3.dist-info/RECORD +20 -0
{pearmut-1.0.1.dist-info → pearmut-1.0.3.dist-info}/WHEEL +1 -1
pearmut/static/basic.bundle.js +0 -1
pearmut/static/basic.html +0 -133
pearmut-1.0.1.dist-info/RECORD +0 -20
{pearmut-1.0.1.dist-info → pearmut-1.0.3.dist-info}/entry_points.txt +0 -0
{pearmut-1.0.1.dist-info → pearmut-1.0.3.dist-info}/licenses/LICENSE +0 -0
{pearmut-1.0.1.dist-info → pearmut-1.0.3.dist-info}/top_level.txt +0 -0

pearmut/static/dashboard.html CHANGED Viewed

@@ -20,6 +20,11 @@
             cursor: pointer;
         }
+        .abutton[disabled] {
+            pointer-events: none;
+            opacity: 0.6;
+        }
         .ranking-content input[type="button"]:not(:last-child) {
             margin-right: 5px;
         }
@@ -93,4 +98,4 @@
             .white-box {
                 overflow-x: auto;
             }
-        }</style><script defer="defer" src="dashboard.bundle.js?0d289122fd490c931aec"></script><link href="style.css?0d289122fd490c931aec" rel="stylesheet"></head><body style="padding-top: 50px; padding-bottom: 50px;"><div id="main_div" style="width: calc(100% - 200px); min-width: 1300px; margin-left: auto; margin-right: auto;"><div style="margin-bottom: 15px; font-size: 0.9em; color: #555;">💤not started &nbsp;&nbsp; ✍️in progress &nbsp;&nbsp; ✅completed & passed &nbsp;&nbsp;❌completed & failed &nbsp;&nbsp; 🔗annotator link &nbsp;&nbsp; 👁️anotator link (view-only) &nbsp;&nbsp; 🗑️reset progress/campaign &nbsp;&nbsp; ⚖️show model ranking</div><div id="dashboard_div"></div><br><a class="abutton" id="download_progress" style="margin-right: 20px;">Download progress metadata 💾</a> <a class="abutton" id="download_annotations" style="margin-right: 20px;">Download all annotations 💾</a> <button class="abutton" id="add_campaign" style="width: 180px; margin-right: 20px;">Add new campaign 📤</button> <input type="file" id="campaign_file_input" accept=".json" style="display: none;"></div></body></html>
+        }</style><script defer="defer" src="dashboard.bundle.js?ee803f203a3b5ee1305d"></script><link href="style.css?ee803f203a3b5ee1305d" rel="stylesheet"></head><body style="padding-top: 50px; padding-bottom: 50px;"><div id="main_div" style="width: calc(100% - 200px); min-width: 1300px; margin-left: auto; margin-right: auto;"><div style="margin-bottom: 15px; font-size: 0.9em; color: #555;">💤not started &nbsp;&nbsp; ✍️in progress &nbsp;&nbsp; ✅completed & passed &nbsp;&nbsp;❌completed & failed &nbsp;&nbsp; 🔗annotator link &nbsp;&nbsp; 👁️anotator link (view-only) &nbsp;&nbsp; 🗑️reset progress/campaign &nbsp;&nbsp; ⚖️show model ranking</div><div id="dashboard_div"></div><br><a class="abutton" id="download_progress" style="margin-right: 20px;">Download progress metadata 💾</a> <a class="abutton" id="download_annotations" style="margin-right: 20px;">Download all annotations 💾</a> <button class="abutton" id="add_campaign" style="width: 180px; margin-right: 20px;">Add new campaign 📤</button> <input type="file" id="campaign_file_input" accept=".json" style="display: none;"></div></body></html>

pearmut/static/index.html CHANGED Viewed

	@@ -1 +1 @@
1	- <!doctype html><html lang="en" style="height: 100%;"><head><meta charset="UTF-8"><meta name="viewport" content="width=900px"><title>Pearmut Evaluation</title><link rel="icon" type="image/svg+xml" href="favicon.svg"><script defer="defer" src="index.bundle.js?~~0d289122fd490c931aec~~"></script><link href="style.css?~~0d289122fd490c931aec~~" rel="stylesheet"></head><body><div class="white-box" style="width: max-content; font-size: large; position: absolute; top: 50%; left: 50%; transform: translate(-50%, -50%);">You have reached the Pearmut🍐 evaluation interface.<ul><li>If you are an annotator, you should have received a specialized link that takes you to the annotations.</li><li>If you are annotation manager, then you should distribute these links.</li></ul><br><br>See the <a href="https://github.com/zouharvi/pearmut">Pearmut project on GitHub</a>. Made with 💚 by Vilém Zouhar and others in 2025-2026.</div></body></html>
1	+ <!doctype html><html lang="en" style="height: 100%;"><head><meta charset="UTF-8"><meta name="viewport" content="width=900px"><title>Pearmut Evaluation</title><link rel="icon" type="image/svg+xml" href="favicon.svg"><script defer="defer" src="index.bundle.js?ee803f203a3b5ee1305d"></script><link href="style.css?ee803f203a3b5ee1305d" rel="stylesheet"></head><body><div class="white-box" style="width: max-content; font-size: large; position: absolute; top: 50%; left: 50%; transform: translate(-50%, -50%);">You have reached the Pearmut🍐 evaluation interface.<ul><li>If you are an annotator, you should have received a specialized link that takes you to the annotations.</li><li>If you are annotation manager, then you should distribute these links.</li></ul><br><br>See the <a href="https://github.com/zouharvi/pearmut">Pearmut project on GitHub</a>. Made with 💚 by Vilém Zouhar and others in 2025-2026.</div></body></html>

pearmut/static/style.css CHANGED Viewed

@@ -3,6 +3,12 @@ body {
     padding: 0;
     background: linear-gradient(135deg, #b9e2a1 0%, #e7e2cf 100%);
     background-attachment: fixed;
+    /* never rescale for phone */
+    text-size-adjust: none;
+    -webkit-text-size-adjust: none;
+    -ms-text-size-adjust: none;
+    -moz-text-size-adjust: none;
 }
 * {
@@ -63,6 +69,14 @@ label {
     margin-bottom: 30pt;
 }
+.model_name {
+    font-weight: bold;
+    font-size: 0.9em;
+    color: #555;
+    margin-bottom: 5px;
+    padding: 2px 0;
+}
 /* Character hover and highlighting */
 .tgt_char:hover {
     background-color: #ccc;
@@ -236,3 +250,35 @@ input[type="button"].error_delete:hover {
 .char_missing {
     font-family: monospace;
 }
+/* Form styling */
+.form-container {
+    max-width: 600px;
+    margin: 20px auto;
+    padding: 20px;
+}
+.form-field {
+    margin-bottom: 20px;
+}
+.form-label {
+    font-size: 14pt;
+    margin-bottom: 8px;
+    color: #333;
+}
+.form-input {
+    width: 100%;
+    padding: 10px;
+    font-size: 12pt;
+    border: 1px solid #ccc;
+    border-radius: 4px;
+    box-sizing: border-box;
+}
+.form-input:focus {
+    outline: none;
+    border-color: #4CAF50;
+    box-shadow: 0 0 5px rgba(76, 175, 80, 0.3);
+}

pearmut/utils.py CHANGED Viewed

@@ -1,10 +1,13 @@
+import hashlib
 import json
 import os
+import random
 ROOT = "."
 # Sentinel value to indicate a task reset - masks all prior annotations
 RESET_MARKER = "__RESET__"
+TOKEN_MAIN = hashlib.sha256(random.randbytes(16)).hexdigest()[:10]
 def load_progress_data(warn: str | None = None):
@@ -15,7 +18,7 @@ def load_progress_data(warn: str | None = None):
             f.write(json.dumps({}))
     with open(f"{ROOT}/data/progress.json", "r") as f:
         data = json.load(f)
     return data
@@ -36,42 +39,43 @@ def get_db_log(campaign_id: str) -> list[dict]:
         log_path = f"{ROOT}/data/outputs/{campaign_id}.jsonl"
         if os.path.exists(log_path):
             with open(log_path, "r") as f:
-                _logs[campaign_id] = [
-                    json.loads(line) for line in f.readlines()
-                ]
+                _logs[campaign_id] = [json.loads(line) for line in f.readlines()]
         else:
             _logs[campaign_id] = []
     return _logs[campaign_id]
-def get_db_log_item(campaign_id: str, user_id: str | None, item_i: int | None) -> list[dict]:
+def get_db_log_item(
+    campaign_id: str, user_id: str | None, item_i: int | str | None
+) -> list[dict]:
     """
     Returns the log item for the given campaign_id, user_id and item_i.
     Can be empty. Respects reset markers - if a reset marker is found,
     only entries after the last reset are returned.
     """
     log = get_db_log(campaign_id)
     # Filter matching entries
     matching = [
-        entry for entry in log
+        entry
+        for entry in log
         if (
-            (user_id is None or entry.get("user_id") == user_id) and
-            (item_i is None or entry.get("item_i") == item_i)
+            (user_id is None or entry.get("user_id") == user_id)
+            and (item_i is None or entry.get("item_i") == item_i)
         )
     ]
     # Find the last reset marker for this user (if any)
     last_reset_idx = -1
     for i, entry in enumerate(matching):
         if entry.get("annotation") == RESET_MARKER:
             last_reset_idx = i
     # Return only entries after the last reset
     if last_reset_idx >= 0:
-        matching = matching[last_reset_idx + 1:]
+        matching = matching[last_reset_idx + 1 :]
     return matching
@@ -87,7 +91,13 @@ def save_db_payload(campaign_id: str, payload: dict):
     log_path = f"{ROOT}/data/outputs/{campaign_id}.jsonl"
     os.makedirs(os.path.dirname(log_path), exist_ok=True)
     with open(log_path, "a") as log_file:
-        log_file.write(json.dumps(payload, ensure_ascii=False,) + "\n")
+        log_file.write(
+            json.dumps(
+                payload,
+                ensure_ascii=False,
+            )
+            + "\n"
+        )
     log.append(payload)
@@ -100,20 +110,20 @@ def check_validation_threshold(
 ) -> bool:
     """
     Check if user passes the validation threshold.
     The threshold is defined in campaign info as 'validation_threshold':
     - If integer: pass if number of failed checks <= threshold
-    - If float in [0, 1): pass if proportion of failed checks <= threshold
+    - If float in [0, 1): pass if proportion of failed checks <= threshold
     - If float >= 1: always fail
     - If None/not set: defaults to 0 (fail on any failed check)
     Returns True if validation passes, False otherwise.
     """
     threshold = tasks_data[campaign_id]["info"].get("validation_threshold", 0)
     user_progress = progress_data[campaign_id][user_id]
     validations = user_progress.get("validations", {})
     # Count failed checks (validations is dict of item_i -> list of bools)
     total_checks = 0
     failed_checks = 0
@@ -126,11 +136,11 @@ def check_validation_threshold(
     # If no validation checks exist, pass
     if total_checks == 0:
         return True
     # Float >= 1: always fail
     if isinstance(threshold, float) and threshold >= 1:
         return False
     # Check threshold based on type
     if isinstance(threshold, float):
         # Float in [0, 1): proportion-based, pass if failed proportion <= threshold
@@ -138,3 +148,12 @@ def check_validation_threshold(
     else:
         # Integer: count-based, pass if failed count <= threshold
         return failed_checks <= threshold
+def is_form_document(items):
+    """Check if a document contains form items instead of evaluation items."""
+    if not items:
+        return False
+    # Check if first item has 'text' and 'form' keys (form item)
+    first_item = items[0]
+    return "text" in first_item and "form" in first_item

{pearmut-1.0.1.dist-info → pearmut-1.0.3.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: pearmut
-Version: 1.0.1
+Version: 1.0.3
 Summary: A tool for evaluation of model outputs, primarily MT.
 Author-email: Vilém Zouhar <vilem.zouhar@gmail.com>
 License: MIT
@@ -19,7 +19,7 @@ Provides-Extra: dev
 Requires-Dist: pytest; extra == "dev"
 Dynamic: license-file
-# 🍐Pearmut &nbsp; &nbsp; [![PyPi version](https://badgen.net/pypi/v/pearmut/)](https://pypi.org/project/pearmut) [![PyPI download/month](https://img.shields.io/pypi/dm/pearmut.svg)](https://pypi.python.org/pypi/pearmut/) [![PyPi license](https://badgen.net/pypi/license/pearmut/)](https://pypi.org/project/pearmut/) [![build status](https://github.com/zouharvi/pearmut/actions/workflows/test.yml/badge.svg)](https://github.com/zouharvi/pearmut/actions/workflows/test.yml)
+# 🍐Pearmut <br> [![PyPi version](https://badgen.net/pypi/v/pearmut/)](https://pypi.org/project/pearmut) [![PyPI download/month](https://img.shields.io/pypi/dm/pearmut.svg)](https://pypi.python.org/pypi/pearmut/) [![PyPi license](https://badgen.net/pypi/license/pearmut/)](https://pypi.org/project/pearmut/) [![build status](https://github.com/zouharvi/pearmut/actions/workflows/test.yml/badge.svg)](https://github.com/zouharvi/pearmut/actions/workflows/test.yml) [![arXiv](https://img.shields.io/badge/arXiv-2601.02933-b31b1b.svg?style=flat)](https://arxiv.org/abs/2601.02933)
 **Platform for Evaluation and Reviewing of Multilingual Tasks**: Evaluate model outputs for translation and NLP tasks with support for multimodal data (text, video, audio, images) and multiple annotation protocols ([DA](https://aclanthology.org/N15-1124/), [ESA](https://aclanthology.org/2024.wmt-1.131/), [ESA<sup>AI</sup>](https://aclanthology.org/2025.naacl-long.255/), [MQM](https://doi.org/10.1162/tacl_a_00437), and more!).
@@ -35,12 +35,15 @@ Dynamic: license-file
   - [Assignment Types](#assignment-types)
 - [Advanced Features](#advanced-features)
   - [Pre-filled Error Spans (ESA<sup>AI</sup>)](#pre-filled-error-spans-esaai)
+  - [Custom MQM Taxonomy](#custom-mqm-taxonomy)
   - [Tutorial and Attention Checks](#tutorial-and-attention-checks)
+  - [Form Items for User Metadata](#form-items-for-user-metadata)
   - [Pre-defined User IDs and Tokens](#pre-defined-user-ids-and-tokens)
   - [Multimodal Annotations](#multimodal-annotations)
   - [Hosting Assets](#hosting-assets)
 - [Campaign Management](#campaign-management)
   - [Custom Completion Messages](#custom-completion-messages)
+  - [Prolific Integration](#prolific-integration)
 - [CLI Commands](#cli-commands)
 - [Terminology](#terminology)
 - [Development](#development)
@@ -141,6 +144,22 @@ The `shuffle` parameter in campaign `info` controls this behavior:
   "data": [...]
 }
 ```
+Documents in `data_welcome` are not shuffled, so they are not required to contain the same models across all documents.
+### Showing Model Names
+By default, model names are hidden to avoid biasing annotators. To display model names on top of each output block, set `show_model_names` to `true`:
+```python
+{
+  "info": {
+    "assignment": "task-based",
+    "protocol": "ESA",
+    "show_model_names": true  # Default: false.
+  },
+  "campaign_id": "my_campaign",
+  "data": [...]
+}
+```
 ### Custom Score Sliders
@@ -163,6 +182,52 @@ For multi-dimensional evaluation tasks (e.g., assessing fluency on a Likert scal
 When `sliders` is specified, only the custom sliders are shown. Each slider must have `name`, `min`, `max`, and `step` properties. All sliders must be answered before proceeding.
+### Textfield for Post-editing/Translation
+Enable a textfield for post-editing or translation tasks using the `textfield` parameter in `info`. The textfield content is stored in annotations alongside scores and error spans.
+```python
+{
+  "info": {
+    "protocol": "DA",
+    "textfield": "prefilled"  # Options: null, "hidden", "visible", "prefilled"
+  }
+}
+```
+**Textfield modes:**
+- `null` or omitted: No textfield (default)
+- `"hidden"`: Textfield hidden by default, shown by clicking a button
+- `"visible"`: Textfield always visible
+- `"prefilled"`: Textfield visible and pre-filled with model output for post-editing
+### Custom MQM Taxonomy
+For MQM protocol campaigns, you can define a custom error taxonomy instead of using the default MQM categories. Specify `mqm_categories` in the campaign `info` section as a dictionary mapping main categories to lists of subcategories:
+```python
+{
+  "info": {
+    "assignment": "task-based",
+    "protocol": "MQM",
+    "mqm_categories": {
+      "": [],                          # Empty selection option
+      "General": ["", "Accuracy", "Fluency"],
+      "Audio-specific": ["", "Inaudible", "Background noise", "Speaker overlap", "Misinterpretation"],
+      "Style": ["", "Awkward", "Embarrassing"],
+      "Unknown": []                    # Category with no subcategories
+    }
+  },
+  "campaign_id": "custom_mqm_example",
+  "data": [...]
+}
+```
+If `mqm_categories` is not provided, the default MQM taxonomy will be used. The empty string key `""` provides an unselected state in the dropdown. Categories with empty subcategory lists (e.g., `"Unknown": []`) do not require a subcategory selection.
+See [examples/custom_mqm.json](examples/custom_mqm.json) for a complete example.
 ### Custom Instructions
 Set campaign-level instructions using the `instructions` field in `info` (supports HTML).
@@ -252,6 +317,34 @@ The `score_greaterthan` field specifies the index of the candidate that must hav
 See [examples/tutorial/esa_deen.json](examples/tutorial/esa_deen.json) for a mock campaign with a fully prepared ESA tutorial.
 To use it, simply extract the `data` attribute and prefix it to each task in your campaign.
+#### Universal Tutorial Items with `data_welcome`
+Use `data_welcome` to add tutorial items that users must complete before starting regular tasks. The structure is a list of documents (same as `data`). Welcome items have IDs `welcome_0`, `welcome_1`, etc. and are tracked separately via `progress_welcome`.
+### Form Items for User Metadata
+Collect user information (demographics, expertise) before annotation tasks using form items in `data_welcome`.
+Form items have `text` (label/question) and `form` (field type: `null`, `"string"`, `"number"`, `"choices"`, and `"script"`).
+Documents must be homogeneous: all form items or all evaluation items.
+```python
+{
+  "data_welcome": [
+    [
+      {"text": "What is your native language?", "form": "string"},
+      {"text": "Rate your expertise (1-10)", "form": "number"}
+    ]
+  ]
+}
+```
+<img width="400" alt="Screenshot of a user form" src="https://github.com/user-attachments/assets/2310e8dc-98e9-4abf-8a27-6781b0094efe" />
+It is possible to automatically collect additional information from the host system using the `"script"` field type.
+Typically, such a form document (or a sequence of them) would be stored in `"data_welcome"` so that it is both mandatory and shown to all users.
+See [examples/user_info_form.json](examples/user_info_form.json).
 ### Single-stream Assignment
 All annotators draw from a shared pool with random assignment:
@@ -265,11 +358,14 @@ All annotators draw from a shared pool with random assignment:
         # ESA: error spans and scores
         "protocol": "ESA",
         "users": 50,                           # number of annotators (can also be a list, see below)
+        "docs_per_user": 10,                   # optional: show goodbye after N documents per user
     },
     "data": [...], # list of all items (shared among all annotators)
 }
 ```
+Set `docs_per_user` to limit how many documents each user annotates before seeing the goodbye message (for single-stream, this is the number of documents).
 ### Dynamic Assignment
 The `dynamic` assignment type intelligently selects items based on current model performance to focus annotation effort on top-performing models using contrastive comparisons.
@@ -286,11 +382,14 @@ All items must contain outputs from all models for this assignment type to work
         "dynamic_contrastive_models": 2,       # how many models to compare per item (optional, default: 1)
         "dynamic_first": 5,                    # annotations per model before dynamic kicks in (optional, default: 5)
         "dynamic_backoff": 0.1,                # probability of uniform sampling (optional, default: 0)
+        "docs_per_user": 20,                   # optional: show goodbye after N documents per user
     },
     "data": [...], # list of all items (shared among all annotators)
 }
 ```
+Set `docs_per_user` to limit how many documents each user annotates before seeing the goodbye message (for dynamic, this is roughly the number of documents × models).
 **How it works:**
 1. Initial phase: Each model gets `dynamic_first` annotations with fully random contrastive evaluation
 2. Dynamic phase: After the initial phase, top `dynamic_top` models (by average score) are identified
@@ -378,6 +477,14 @@ When tokens are supplied, the dashboard will try to show model rankings based on
 Customize the goodbye message shown to users when they complete all annotations using the `instructions_goodbye` field in campaign info. Supports arbitrary HTML for styling and formatting with variable replacement: `${TOKEN}` (completion token) and `${USER_ID}` (user ID). Default: `"If someone asks you for a token of completion, show them: ${TOKEN}"`.
+### Prolific Integration
+Use task-based assignment with Prolific. For each task, Pearmut generates a unique URL which can be uploaded to Prolific's interface. Add a redirect (on completion) to `instructions_goodbye`:
+```json
+"instructions_goodbye": "<a href='https://app.prolific.com/submissions/complete?cc=${TOKEN}'>Click here to return to Prolific</a>"
+```
+The `${TOKEN}` is automatically replaced based on passing attention checks (see [Attention checks](#tutorial-and-attention-checks) and [Pre-defined tokens](#pre-defined-user-ids-and-tokens)).
 ## Terminology
 - **Campaign**: An annotation project that contains configuration, data, and user assignments. Each campaign has a unique identifier and is defined in a JSON file.
@@ -401,7 +508,7 @@ Customize the goodbye message shown to users when they complete all annotations
   - **Score**: Numeric quality rating (0-100)
   - **Error Spans**: Text highlights marking errors with severity (`minor`, `major`)
   - **Error Categories**: MQM taxonomy labels for errors
-- **Template**: The annotation interface type. The `basic` template supports comparing multiple outputs simultaneously.
+- **Template**: The annotation interface type. The `annotate` template supports comparing multiple outputs simultaneously.
 - **Assignment**: The method for distributing items to users:
   - **Task-based**: Each user has predefined items
   - **Single-stream**: Users draw from a shared pool with random assignment
@@ -432,7 +539,7 @@ pearmut run
 2. Add build rule to `webpack.config.js`
 3. Reference as `info->template` in campaign JSON
-See [web/src/basic.ts](web/src/basic.ts) for example.
+See [web/src/annotate.ts](web/src/annotate.ts) for example.
 ### Deployment
@@ -443,68 +550,15 @@ Run on public server or tunnel local port to public IP/domain and run locally.
 If you use this work in your paper, please cite it as follows.
 ```bibtex
 @misc{zouhar2026pearmut,
-  author = {Zouhar, Vilém},
-  title = {Pearmut: Human Evaluation of Translation Made Trivial},
-  year = {2026}
+      title={Pearmut: Human Evaluation of Translation Made Trivial},
+      author={Vilém Zouhar and Tom Kocmi},
+      year={2026},
+      eprint={2601.02933},
+      archivePrefix={arXiv},
+      primaryClass={cs.CL},
+      url={https://arxiv.org/abs/2601.02933},
 }
 ```
 Contributions are welcome! Please reach out to [Vilém Zouhar](mailto:vilem.zouhar@gmail.com).
-# Changelog
-- v1.0.1
-  - Support RTL languages
-  - Add boxes for references
-  - Add custom score sliders for multi-dimensional evaluation
-  - Make instructions customizable and protocol-dependent
-  - Support custom sliders
-  - Purge/reset whole tasks from dashboard
-  - Fix resetting individual users in single-stream/dynamic
-  - Fix notification stacking
-  - Add campaigns from dashboard
-- v0.3.3
-  - Rename `doc_id` to `item_id`
-  - Add Typst, LaTeX, and PDF export for model ranking tables. Hide them by default.
-  - Add dynamic assignment type with contrastive model comparison
-  - Add `instructions_goodbye` field with variable substitution
-  - Add visual anchors at 33% and 66% on sliders
-  - Add German→English ESA tutorial with attention checks
-  - Validate document model consistency before shuffle
-  - Fix UI block on any interaction
-- v0.3.2
-  - Revert seeding of user IDs
-  - Set ESA (Error Span Annotation) as default
-  - Update server IP address configuration
-  - Show approximate alignment by default
-  - Unify pointwise and listwise interfaces into `basic`
-  - Refactor protocol configuration (breaking change)
-- v0.2.11
-  - Add comment field in settings panel
-  - Add `score_gt` validation for listwise comparisons
-  - Add Content-Disposition headers for proper download filenames
-  - Add model results display to dashboard with rankings
-  - Add campaign file structure validation
-  - Purge command now unlinks assets
-- v0.2.6
-  - Add frozen annotation links feature for view-only mode
-  - Add word-level annotation mode toggle for error spans
-  - Add `[missing]` token support
-  - Improve frontend speed and cleanup toolboxes on item load
-  - Host assets via symlinks
-  - Add validation threshold for success/fail tokens
-  - Implement reset masking for annotations
-  - Allow pre-defined user IDs and tokens in campaign data
-- v0.1.1
-  - Set server defaults and add VM launch scripts
-  - Add warning dialog when navigating away with unsaved work
-  - Add tutorial validation support for pointwise and listwise
-  - Add ability to preview existing annotations via progress bar
-  - Add support for ESA<sup>AI</sup> pre-filled error_spans
-  - Rename pairwise to listwise and update layout
-  - Implement single-stream assignment type
-- v0.0.3
-  - Support multimodal inputs and outputs
-  - Add dashboard
-  - Implement ESA (Error Span Annotation) and MQM support
+See changes in [CHANGELOG.md](CHANGELOG.md).

pearmut-1.0.3.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,20 @@
+pearmut/app.py,sha256=BWbzUHtE8G3jNkiSIW8MGlYWQeIu0PtN7wELO6E5M_0,13873
+pearmut/assignment.py,sha256=o_66Gq6L6f-JIX_lzIDJi1cAMrvLoqS5x4orwlu2GnI,32244
+pearmut/cli.py,sha256=OMNNc1gxX6ZplS0UoCiNN86v9nsIn9hkjzRoaity2Fg,29904
+pearmut/constants.py,sha256=iYONCk2kyYcKy3kikhSKyXRKZ1lWVaVFdcWh6kUYTrQ,4844
+pearmut/results_export.py,sha256=YoVE_mXDBNzsiv88CzZhZeWLMg5FWTOuH6NrbzUZQs4,5746
+pearmut/utils.py,sha256=a5nLLXk4SDASoArlXEvVqKXCbxdSgHTn_4fnJKaNa4A,4778
+pearmut/static/annotate.bundle.js,sha256=HwSm0RODsVnDmPD4xUBdmdLgOYF6-sRyPbC_EmN_EL8,121895
+pearmut/static/annotate.html,sha256=4e_3Ol-swrp_FISaxnLYS-iN05XgN5obuZyy-a5C4K8,5698
+pearmut/static/dashboard.bundle.js,sha256=27izHS7KUPMmQjw-rKGxxpu-RjaocyJYFwrZF8CcPFg,105264
+pearmut/static/dashboard.html,sha256=wzRKZCvV9p3FkL97GEMC2Y23lRvUDQt1EwuAVr8dehI,3456
+pearmut/static/favicon.svg,sha256=gVPxdBlyfyJVkiMfh8WLaiSyH4lpwmKZs8UiOeX8YW4,7347
+pearmut/static/index.bundle.js,sha256=-koQkaoRCei-H40wozYnvf0PnrAoZbtOXHotJcTn5OM,346
+pearmut/static/index.html,sha256=1ug6svDibld7Tl33PZ3e_VZUFjXKC86sXYLXWBH_TJg,930
+pearmut/static/style.css,sha256=kTzbun0LkbS0tn-bdCf-oajIQvda5YJcYeDrCV1PR-o,4885
+pearmut-1.0.3.dist-info/licenses/LICENSE,sha256=GtR6RcTdRn-P23h5pKFuWSLZrLPD0ytHAwSOBt7aLpI,1071
+pearmut-1.0.3.dist-info/METADATA,sha256=9k_RBzLNkrWNkWB8BsI4kvDveeCS0POANRl58sW3VaU,24332
+pearmut-1.0.3.dist-info/WHEEL,sha256=wUyA8OaulRlbfwMtmQsvNngGrxQHAvkKcvRmdizlJi0,92
+pearmut-1.0.3.dist-info/entry_points.txt,sha256=eEA9LVWsS3neQbMvL_nMvEw8I0oFudw8nQa1iqxOiWM,45
+pearmut-1.0.3.dist-info/top_level.txt,sha256=CdgtUM-SKQDt6o5g0QreO-_7XTBP9_wnHMS1P-Rl5Go,8
+pearmut-1.0.3.dist-info/RECORD,,

{pearmut-1.0.1.dist-info → pearmut-1.0.3.dist-info}/WHEEL RENAMED Viewed

@@ -1,5 +1,5 @@
 Wheel-Version: 1.0
-Generator: setuptools (80.9.0)
+Generator: setuptools (80.10.2)
 Root-Is-Purelib: true
 Tag: py3-none-any

pearmut 1.0.1__py3-none-any.whl → 1.0.3__py3-none-any.whl

pearmut 1.0.1py3-none-any.whl → 1.0.3py3-none-any.whl