PyPI - pearmut - Versions diffs - 0.2.8__py3-none-any.whl → 0.2.9__py3-none-any.whl - Mend

pearmut 0.2.8__py3-none-any.whl → 0.2.9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13)

pearmut/app.py +55 -0
pearmut/cli.py +3 -1
pearmut/static/dashboard.bundle.js +1 -1
pearmut/static/dashboard.html +28 -1
pearmut/static/listwise.bundle.js +1 -1
pearmut/static/pointwise.bundle.js +1 -1
{pearmut-0.2.8.dist-info → pearmut-0.2.9.dist-info}/METADATA +13 -3
pearmut-0.2.9.dist-info/RECORD +19 -0
pearmut-0.2.8.dist-info/RECORD +0 -19
{pearmut-0.2.8.dist-info → pearmut-0.2.9.dist-info}/WHEEL +0 -0
{pearmut-0.2.8.dist-info → pearmut-0.2.9.dist-info}/entry_points.txt +0 -0
{pearmut-0.2.8.dist-info → pearmut-0.2.9.dist-info}/licenses/LICENSE +0 -0
{pearmut-0.2.8.dist-info → pearmut-0.2.9.dist-info}/top_level.txt +0 -0

pearmut/app.py CHANGED Viewed

@@ -1,5 +1,7 @@
+import collections
 import json
 import os
+import statistics
 from typing import Any
 from fastapi import FastAPI, Query
@@ -12,6 +14,7 @@ from .assignment import get_i_item, get_next_item, reset_task, update_progress
 from .utils import (
     ROOT,
     check_validation_threshold,
+    get_db_log,
     load_progress_data,
     save_db_payload,
     save_progress_data,
@@ -191,6 +194,58 @@ async def _dashboard_data(request: DashboardDataRequest):
     )
+class DashboardResultsRequest(BaseModel):
+    campaign_id: str
+    token: str
+@app.post("/dashboard-results")
+async def _dashboard_results(request: DashboardResultsRequest):
+    campaign_id = request.campaign_id
+    token = request.token
+    if campaign_id not in progress_data:
+        return JSONResponse(content="Unknown campaign ID", status_code=400)
+    # Check if token is valid
+    if token != tasks_data[campaign_id]["token"]:
+        return JSONResponse(content="Invalid token", status_code=400)
+    # Compute model scores from annotations
+    model_scores = collections.defaultdict(dict)
+    # Iterate through all tasks to find items with 'model' field
+    log = get_db_log(campaign_id)
+    for entry in log:
+        if "item" not in entry or "annotations" not in entry:
+            continue
+        for item, annotation in zip(entry["item"], entry["annotations"]):
+            if "model" in item:
+                # pointwise
+                if "score" in annotation:
+                    # make sure to only keep the latest score for each item
+                    # json.dumps(item) creates a unique item key
+                    model_scores[item["model"]][json.dumps(item)] = annotation["score"]
+            elif "models" in item:
+                # listwise
+                for model, annotation_cand in zip(item["models"], annotation):
+                    if "score" in annotation_cand:
+                        model_scores[model][json.dumps(item)] = (
+                            annotation_cand["score"]
+                        )
+    results = [
+        {
+            "model": model,
+            "score": statistics.mean(scores.values()),
+            "count": len(scores),
+        }
+        for model, scores in model_scores.items()
+    ]
+    results.sort(key=lambda x: x["score"], reverse=True)
+    return JSONResponse(content=results, status_code=200)
 class ResetTaskRequest(BaseModel):
     campaign_id: str
     user_id: str

pearmut/cli.py CHANGED Viewed

@@ -41,7 +41,9 @@ def _run(args_unknown):
             args.server + "/dashboard.html?" + "&".join([
                 f"campaign_id={urllib.parse.quote_plus(campaign_id)}&token={campaign_data["token"]}"
                 for campaign_id, campaign_data in tasks_data.items()
-            ])
+            ]),
+            # this is important to flush
+            flush=True,
         )
     uvicorn.run(

pearmut 0.2.8__py3-none-any.whl → 0.2.9__py3-none-any.whl

pearmut 0.2.8__py3-none-any.whl → 0.2.9__py3-none-any.whl