npm - @openhands/extensions - Versions diffs - 0.1.0 → 0.2.0 - Mend

@openhands/extensions 0.1.0 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (347) hide show

package/.agents/skills/custom-codereview-guide.md +25 -0
package/.github/pull_request_template.md +38 -0
package/.github/release.yml +14 -0
package/.github/workflows/check-extensions.yml +72 -0
package/.github/workflows/npm-publish.yml +89 -0
package/.github/workflows/pr.yml +30 -0
package/.github/workflows/release.yml +24 -0
package/.github/workflows/tests.yml +25 -0
package/.github/workflows/vulnerability-scan.yml +87 -0
package/.release-please-manifest.json +3 -0
package/AGENTS.md +132 -0
package/README.md +10 -0
package/analysis_results.md +162 -0
package/marketplaces/large-codebase.json +66 -0
package/marketplaces/openhands-extensions.json +682 -0
package/package.json +4 -10
package/plugins/README.md +30 -0
package/plugins/city-weather/.plugin/plugin.json +13 -0
package/plugins/city-weather/README.md +145 -0
package/plugins/city-weather/commands/now.md +56 -0
package/plugins/cobol-modernization/.plugin/plugin.json +19 -0
package/plugins/cobol-modernization/README.md +201 -0
package/plugins/cobol-modernization/references/troubleshooting.md +18 -0
package/plugins/cobol-modernization/skills/build-setup/SKILL.md +78 -0
package/plugins/cobol-modernization/skills/build-setup/scripts/install-gnucobol.sh +32 -0
package/plugins/cobol-modernization/skills/cobol-modernization-overview/SKILL.md +113 -0
package/plugins/cobol-modernization/skills/mainfraime-removal/SKILL.md +62 -0
package/plugins/cobol-modernization/skills/mainfraime-removal/references/cics-transformation-examples.md +45 -0
package/plugins/cobol-modernization/skills/mainframe-planning/SKILL.md +78 -0
package/plugins/cobol-modernization/skills/to-java-migration/SKILL.md +59 -0
package/plugins/cobol-modernization/skills/to-java-migration/references/cobol-to-java-example.md +58 -0
package/plugins/cobol-modernization/skills/to-java-migration/references/datatype-mappings.md +19 -0
package/plugins/issue-duplicate-checker/.plugin/plugin.json +13 -0
package/plugins/issue-duplicate-checker/README.md +51 -0
package/plugins/issue-duplicate-checker/action.yml +349 -0
package/plugins/issue-duplicate-checker/scripts/auto_close_duplicate_issues.py +569 -0
package/plugins/issue-duplicate-checker/scripts/issue_duplicate_check_openhands.py +681 -0
package/plugins/issue-duplicate-checker/scripts/post_duplicate_notice.js +220 -0
package/plugins/issue-duplicate-checker/scripts/remove_duplicate_candidate_label.js +27 -0
package/plugins/magic-test/.plugin/plugin.json +13 -0
package/plugins/magic-test/skills/magic-word/SKILL.md +33 -0
package/plugins/migration-scoring/.plugin/plugin.json +19 -0
package/plugins/migration-scoring/README.md +244 -0
package/plugins/migration-scoring/skills/migration-mapping/SKILL.md +72 -0
package/plugins/migration-scoring/skills/migration-report/SKILL.md +118 -0
package/plugins/migration-scoring/skills/migration-scoring-overview/SKILL.md +126 -0
package/plugins/migration-scoring/skills/score-quality/SKILL.md +54 -0
package/plugins/migration-scoring/skills/score-quality/references/scoring-criteria.md +30 -0
package/plugins/migration-scoring/skills/score-style/SKILL.md +106 -0
package/plugins/onboarding/.plugin/plugin.json +20 -0
package/plugins/onboarding/README.md +30 -0
package/plugins/onboarding/references/criteria.md +144 -0
package/plugins/onboarding/skills/agent-readiness-report/README.md +23 -0
package/plugins/onboarding/skills/agent-readiness-report/SKILL.md +122 -0
package/plugins/onboarding/skills/agent-readiness-report/scripts/scan_agent_instructions.sh +88 -0
package/plugins/onboarding/skills/agent-readiness-report/scripts/scan_build_env.sh +114 -0
package/plugins/onboarding/skills/agent-readiness-report/scripts/scan_feedback_loops.sh +133 -0
package/plugins/onboarding/skills/agent-readiness-report/scripts/scan_policy.sh +113 -0
package/plugins/onboarding/skills/agent-readiness-report/scripts/scan_workflows.sh +127 -0
package/plugins/onboarding/skills/improve-agent-readiness/README.md +19 -0
package/plugins/onboarding/skills/improve-agent-readiness/SKILL.md +167 -0
package/plugins/onboarding/skills/setup-agents-md/README.md +15 -0
package/plugins/onboarding/skills/setup-agents-md/SKILL.md +150 -0
package/plugins/onboarding/skills/setup-openhands/README.md +20 -0
package/plugins/onboarding/skills/setup-openhands/SKILL.md +56 -0
package/plugins/onboarding/skills/setup-pr-review/README.md +23 -0
package/plugins/onboarding/skills/setup-pr-review/SKILL.md +72 -0
package/plugins/openhands/.plugin/plugin.json +13 -0
package/plugins/openhands/README.md +52 -0
package/plugins/openhands/SKILL.md +61 -0
package/plugins/openhands/commands/create.md +55 -0
package/plugins/openhands/commands/openhands-cloud.md +8 -0
package/plugins/openhands/scripts/run.sh +69 -0
package/plugins/pr-review/.plugin/plugin.json +13 -0
package/plugins/pr-review/README.md +393 -0
package/plugins/pr-review/action.yml +298 -0
package/plugins/pr-review/scripts/agent_script.py +1282 -0
package/plugins/pr-review/scripts/evaluate_review.py +655 -0
package/plugins/pr-review/scripts/prompt.py +260 -0
package/plugins/pr-review/workflows/pr-review-by-openhands.yml +51 -0
package/plugins/pr-review/workflows/pr-review-evaluation.yml +85 -0
package/plugins/qa-changes/.plugin/plugin.json +11 -0
package/plugins/qa-changes/README.md +185 -0
package/plugins/qa-changes/action.yml +181 -0
package/plugins/qa-changes/scripts/agent_script.py +406 -0
package/plugins/qa-changes/scripts/evaluate_qa_changes.py +385 -0
package/plugins/qa-changes/scripts/prompt.py +174 -0
package/plugins/qa-changes/workflows/qa-changes-by-openhands.yml +50 -0
package/plugins/qa-changes/workflows/qa-changes-evaluation.yml +85 -0
package/plugins/release-notes/.plugin/plugin.json +19 -0
package/plugins/release-notes/README.md +283 -0
package/plugins/release-notes/SKILL.md +83 -0
package/plugins/release-notes/action.yml +117 -0
package/plugins/release-notes/commands/release-notes.md +8 -0
package/plugins/release-notes/scripts/agent_script.py +292 -0
package/plugins/release-notes/scripts/generate_release_notes.py +733 -0
package/plugins/release-notes/scripts/prompt.py +90 -0
package/plugins/release-notes/scripts/validate_release_notes.py +328 -0
package/plugins/release-notes/workflows/release-notes.yml +76 -0
package/plugins/vulnerability-remediation/.plugin/plugin.json +19 -0
package/plugins/vulnerability-remediation/README.md +217 -0
package/plugins/vulnerability-remediation/action.yml +187 -0
package/plugins/vulnerability-remediation/scripts/scan_and_remediate.py +561 -0
package/plugins/vulnerability-remediation/workflows/vulnerability-scan.yml +87 -0
package/pyproject.toml +12 -0
package/release-please-config.json +16 -0
package/scripts/sync_extensions.py +494 -0
package/scripts/sync_openhands_sdk_skill.py +264 -0
package/skills/README.md +159 -0
package/skills/add-javadoc/.plugin/plugin.json +18 -0
package/skills/add-javadoc/README.md +40 -0
package/skills/add-javadoc/SKILL.md +35 -0
package/skills/add-javadoc/references/example.md +32 -0
package/skills/add-skill/.plugin/plugin.json +18 -0
package/skills/add-skill/README.md +67 -0
package/skills/add-skill/SKILL.md +47 -0
package/skills/add-skill/scripts/fetch_skill.py +259 -0
package/skills/agent-creator/.plugin/plugin.json +20 -0
package/skills/agent-creator/README.md +104 -0
package/skills/agent-creator/SKILL.md +190 -0
package/skills/agent-creator/commands/agent-creator.md +8 -0
package/skills/agent-creator/references/fallback.md +117 -0
package/skills/agent-memory/.plugin/plugin.json +18 -0
package/skills/agent-memory/README.md +35 -0
package/skills/agent-memory/SKILL.md +30 -0
package/skills/agent-memory/commands/remember.md +8 -0
package/skills/agent-sdk-builder/.plugin/plugin.json +18 -0
package/skills/agent-sdk-builder/README.md +40 -0
package/skills/agent-sdk-builder/SKILL.md +37 -0
package/skills/agent-sdk-builder/commands/agent-builder.md +8 -0
package/skills/azure-devops/.plugin/plugin.json +18 -0
package/skills/azure-devops/README.md +55 -0
package/skills/azure-devops/SKILL.md +50 -0
package/skills/bitbucket/.plugin/plugin.json +17 -0
package/skills/bitbucket/README.md +50 -0
package/skills/bitbucket/SKILL.md +45 -0
package/skills/code-review/.plugin/plugin.json +19 -0
package/skills/code-review/README.md +18 -0
package/skills/code-review/SKILL.md +208 -0
package/skills/code-review/commands/codereview-roasted.md +8 -0
package/skills/code-review/commands/codereview.md +8 -0
package/skills/code-review/references/risk-evaluation.md +41 -0
package/skills/code-review/references/supply-chain-security.md +31 -0
package/skills/code-simplifier/.plugin/plugin.json +21 -0
package/skills/code-simplifier/README.md +30 -0
package/skills/code-simplifier/SKILL.md +91 -0
package/skills/code-simplifier/commands/simplify.md +8 -0
package/skills/code-simplifier/references/code-quality-review.md +86 -0
package/skills/code-simplifier/references/code-reuse-review.md +63 -0
package/skills/code-simplifier/references/efficiency-review.md +81 -0
package/skills/datadog/.plugin/plugin.json +19 -0
package/skills/datadog/README.md +100 -0
package/skills/datadog/SKILL.md +95 -0
package/skills/deno/.plugin/plugin.json +18 -0
package/skills/deno/README.md +5 -0
package/skills/deno/SKILL.md +99 -0
package/skills/deno/references/README.md +6 -0
package/skills/discord/.plugin/plugin.json +18 -0
package/skills/discord/README.md +31 -0
package/skills/discord/SKILL.md +109 -0
package/skills/discord/__init__.py +0 -0
package/skills/discord/references/REFERENCE.md +78 -0
package/skills/discord/scripts/__init__.py +0 -0
package/skills/discord/scripts/_http.py +127 -0
package/skills/discord/scripts/post_webhook.py +106 -0
package/skills/discord/scripts/send_message.py +102 -0
package/skills/docker/.plugin/plugin.json +17 -0
package/skills/docker/README.md +34 -0
package/skills/docker/SKILL.md +29 -0
package/skills/evidence-based-citations/.plugin/plugin.json +20 -0
package/skills/evidence-based-citations/README.md +31 -0
package/skills/evidence-based-citations/SKILL.md +59 -0
package/skills/flarglebargle/.plugin/plugin.json +16 -0
package/skills/flarglebargle/README.md +14 -0
package/skills/flarglebargle/SKILL.md +9 -0
package/skills/frontend-design/.plugin/plugin.json +21 -0
package/skills/frontend-design/LICENSE.txt +177 -0
package/skills/frontend-design/README.md +42 -0
package/skills/frontend-design/SKILL.md +42 -0
package/skills/github/.plugin/plugin.json +19 -0
package/skills/github/README.md +42 -0
package/skills/github/SKILL.md +106 -0
package/skills/github-pr-review/.plugin/plugin.json +18 -0
package/skills/github-pr-review/README.md +145 -0
package/skills/github-pr-review/SKILL.md +148 -0
package/skills/github-pr-review/commands/github-pr-review.md +8 -0
package/skills/github-pr-reviewer/.plugin/plugin.json +20 -0
package/skills/github-pr-reviewer/README.md +34 -0
package/skills/github-pr-reviewer/SKILL.md +89 -0
package/skills/github-pr-reviewer/commands/pr-reviewer:setup.md +8 -0
package/skills/github-repo-monitor/.plugin/plugin.json +22 -0
package/skills/github-repo-monitor/README.md +70 -0
package/skills/github-repo-monitor/SKILL.md +316 -0
package/skills/github-repo-monitor/commands/github-monitor:poll.md +8 -0
package/skills/github-repo-monitor/references/github-api.md +241 -0
package/skills/github-repo-monitor/references/state-schema.md +160 -0
package/skills/github-repo-monitor/scripts/main.py +915 -0
package/skills/github-repo-monitor/tests/test_main.py +400 -0
package/skills/gitlab/.plugin/plugin.json +17 -0
package/skills/gitlab/README.md +37 -0
package/skills/gitlab/SKILL.md +32 -0
package/skills/incident-retrospective/.plugin/plugin.json +21 -0
package/skills/incident-retrospective/README.md +34 -0
package/skills/incident-retrospective/SKILL.md +98 -0
package/skills/incident-retrospective/commands/incident-retro:setup.md +8 -0
package/skills/iterate/.plugin/plugin.json +13 -0
package/skills/iterate/README.md +25 -0
package/skills/iterate/SKILL.md +399 -0
package/skills/iterate/commands/babysit.md +8 -0
package/skills/iterate/commands/iterate.md +8 -0
package/skills/iterate/commands/verify.md +8 -0
package/skills/iterate/references/heuristics.md +58 -0
package/skills/iterate/references/verification.md +96 -0
package/skills/jupyter/.plugin/plugin.json +18 -0
package/skills/jupyter/README.md +55 -0
package/skills/jupyter/SKILL.md +50 -0
package/skills/kubernetes/.plugin/plugin.json +18 -0
package/skills/kubernetes/README.md +53 -0
package/skills/kubernetes/SKILL.md +48 -0
package/skills/learn-from-code-review/.plugin/plugin.json +19 -0
package/skills/learn-from-code-review/README.md +64 -0
package/skills/learn-from-code-review/SKILL.md +186 -0
package/skills/learn-from-code-review/commands/learn-from-reviews.md +8 -0
package/skills/linear/.plugin/plugin.json +19 -0
package/skills/linear/README.md +58 -0
package/skills/linear/SKILL.md +213 -0
package/skills/linear-triage/.plugin/plugin.json +21 -0
package/skills/linear-triage/README.md +34 -0
package/skills/linear-triage/SKILL.md +91 -0
package/skills/linear-triage/commands/linear-triage:setup.md +8 -0
package/skills/notion/.plugin/plugin.json +17 -0
package/skills/notion/README.md +114 -0
package/skills/notion/SKILL.md +109 -0
package/skills/npm/.plugin/plugin.json +17 -0
package/skills/npm/README.md +14 -0
package/skills/npm/SKILL.md +9 -0
package/skills/openhands-api/.plugin/plugin.json +22 -0
package/skills/openhands-api/README.md +48 -0
package/skills/openhands-api/SKILL.md +399 -0
package/skills/openhands-api/references/README.md +33 -0
package/skills/openhands-api/references/TROUBLESHOOTING.md +81 -0
package/skills/openhands-api/references/example_prompt.md +12 -0
package/skills/openhands-api/scripts/openhands_api.py +606 -0
package/skills/openhands-api/scripts/openhands_api.ts +252 -0
package/skills/openhands-automation/.plugin/plugin.json +19 -0
package/skills/openhands-automation/README.md +89 -0
package/skills/openhands-automation/SKILL.md +875 -0
package/skills/openhands-automation/commands/automation:create.md +8 -0
package/skills/openhands-automation/references/ab-testing.md +185 -0
package/skills/openhands-automation/references/custom-automation.md +644 -0
package/skills/openhands-sdk/.plugin/plugin.json +20 -0
package/skills/openhands-sdk/README.md +22 -0
package/skills/openhands-sdk/SKILL.md +229 -0
package/skills/openhands-sdk/commands/sdk.md +8 -0
package/skills/pdflatex/.plugin/plugin.json +18 -0
package/skills/pdflatex/README.md +39 -0
package/skills/pdflatex/SKILL.md +34 -0
package/skills/prd/.plugin/plugin.json +19 -0
package/skills/prd/README.md +28 -0
package/skills/prd/SKILL.md +237 -0
package/skills/prd/commands/prd.md +8 -0
package/skills/qa-changes/README.md +18 -0
package/skills/qa-changes/SKILL.md +229 -0
package/skills/qa-changes/commands/qa-changes.md +8 -0
package/skills/release-notes/README.md +24 -0
package/skills/release-notes/SKILL.md +19 -0
package/skills/release-notes/commands/release-notes.md +8 -0
package/skills/research-brief/.plugin/plugin.json +20 -0
package/skills/research-brief/README.md +34 -0
package/skills/research-brief/SKILL.md +99 -0
package/skills/research-brief/commands/research-brief:setup.md +8 -0
package/skills/security/.plugin/plugin.json +18 -0
package/skills/security/README.md +38 -0
package/skills/security/SKILL.md +33 -0
package/skills/skill-creator/.plugin/plugin.json +17 -0
package/skills/skill-creator/LICENSE.txt +202 -0
package/skills/skill-creator/README.md +182 -0
package/skills/skill-creator/SKILL.md +545 -0
package/skills/skill-creator/references/output-patterns.md +82 -0
package/skills/skill-creator/references/workflows.md +28 -0
package/skills/skill-creator/scripts/init_skill.py +303 -0
package/skills/skill-creator/scripts/quick_validate.py +95 -0
package/skills/slack-channel-monitor/.plugin/plugin.json +21 -0
package/skills/slack-channel-monitor/README.md +91 -0
package/skills/slack-channel-monitor/SKILL.md +276 -0
package/skills/slack-channel-monitor/commands/slack-monitor:poll.md +8 -0
package/skills/slack-channel-monitor/references/slack-api.md +207 -0
package/skills/slack-channel-monitor/references/state-schema.md +180 -0
package/skills/slack-channel-monitor/scripts/main.py +962 -0
package/skills/slack-standup-digest/.plugin/plugin.json +21 -0
package/skills/slack-standup-digest/README.md +34 -0
package/skills/slack-standup-digest/SKILL.md +92 -0
package/skills/slack-standup-digest/commands/standup-digest:setup.md +8 -0
package/skills/spark-version-upgrade/.plugin/plugin.json +20 -0
package/skills/spark-version-upgrade/README.md +54 -0
package/skills/spark-version-upgrade/SKILL.md +233 -0
package/skills/ssh/.plugin/plugin.json +18 -0
package/skills/ssh/README.md +140 -0
package/skills/ssh/SKILL.md +135 -0
package/skills/swift-linux/.plugin/plugin.json +17 -0
package/skills/swift-linux/README.md +86 -0
package/skills/swift-linux/SKILL.md +81 -0
package/skills/theme-factory/.plugin/plugin.json +19 -0
package/skills/theme-factory/LICENSE.txt +202 -0
package/skills/theme-factory/README.md +58 -0
package/skills/theme-factory/SKILL.md +59 -0
package/skills/theme-factory/theme-showcase.pdf +0 -0
package/skills/theme-factory/themes/arctic-frost.md +19 -0
package/skills/theme-factory/themes/botanical-garden.md +19 -0
package/skills/theme-factory/themes/desert-rose.md +19 -0
package/skills/theme-factory/themes/forest-canopy.md +19 -0
package/skills/theme-factory/themes/golden-hour.md +19 -0
package/skills/theme-factory/themes/midnight-galaxy.md +19 -0
package/skills/theme-factory/themes/modern-minimalist.md +19 -0
package/skills/theme-factory/themes/ocean-depths.md +19 -0
package/skills/theme-factory/themes/sunset-boulevard.md +19 -0
package/skills/theme-factory/themes/tech-innovation.md +19 -0
package/skills/uv/.plugin/plugin.json +18 -0
package/skills/uv/README.md +5 -0
package/skills/uv/SKILL.md +95 -0
package/skills/uv/references/README.md +5 -0
package/skills/vercel/.plugin/plugin.json +18 -0
package/skills/vercel/README.md +108 -0
package/skills/vercel/SKILL.md +103 -0
package/tests/test_add_skill_installs_to_agents_dir.py +42 -0
package/tests/test_catalogs.py +109 -0
package/tests/test_code_review_risk_evaluation.py +94 -0
package/tests/test_issue_duplicate_checker.py +240 -0
package/tests/test_openhands_api_python.py +152 -0
package/tests/test_plugin_manifest.py +83 -0
package/tests/test_pr_review_diff_payload.py +202 -0
package/tests/test_pr_review_feedback.py +263 -0
package/tests/test_pr_review_prompt.py +152 -0
package/tests/test_pr_review_review_context.py +253 -0
package/tests/test_qa_changes.py +232 -0
package/tests/test_qa_changes_evaluation.py +259 -0
package/tests/test_release_notes_generator.py +990 -0
package/tests/test_sdk_loading.py +150 -0
package/tests/test_skill_plugin_loading.py +149 -0
package/tests/test_skills_have_readme.py +66 -0
package/tests/test_sync_extensions.py +292 -0
package/tests/test_workflow_sync.py +46 -0
package/utils/analysis/README.md +7 -0
package/utils/analysis/laminar_signals/README.md +211 -0
package/utils/analysis/laminar_signals/analyze.py +780 -0
package/utils/analysis/laminar_signals/templates/default.j2 +49 -0
package/utils/analysis/laminar_signals/templates/pr_review.j2 +61 -0

package/tests/test_qa_changes_evaluation.py ADDED Viewed

@@ -0,0 +1,259 @@
+"""Tests for the qa-changes evaluation script (evaluate_qa_changes.py)."""
+import importlib.util
+import json
+import sys
+import types
+from pathlib import Path
+import pytest
+# Directory holding the qa-changes plugin scripts, located relative to this
+# test file: the parent of this file's directory, then plugins/qa-changes/scripts.
+_SCRIPTS_DIR = (
+    Path(__file__).parent.parent / "plugins" / "qa-changes" / "scripts"
+)
+def _load_eval_module():
+    """Load evaluate_qa_changes.py, stubbing out lmnr which needs a project key."""
+    lmnr_mod = types.ModuleType("lmnr")
+    class _FakeLaminar:
+        @staticmethod
+        def initialize():
+            pass
+        @staticmethod
+        def get_trace_id():
+            return None
+        @staticmethod
+        def get_laminar_span_context():
+            return None
+        @staticmethod
+        def set_trace_metadata(meta):
+            pass
+        @staticmethod
+        def set_span_output(output):
+            pass
+        @staticmethod
+        def flush():
+            pass
+        @staticmethod
+        def start_as_current_span(**kwargs):
+            import contextlib
+            return contextlib.nullcontext()
+    class _FakeClient:
+        class evaluators:
+            @staticmethod
+            def score(**kwargs):
+                pass
+        class tags:
+            @staticmethod
+            def tag(trace_id, tags):
+                pass
+    lmnr_mod.Laminar = _FakeLaminar
+    lmnr_mod.LaminarClient = _FakeClient
+    saved = sys.modules.get("lmnr")
+    sys.modules["lmnr"] = lmnr_mod
+    try:
+        path = _SCRIPTS_DIR / "evaluate_qa_changes.py"
+        spec = importlib.util.spec_from_file_location("evaluate_qa_changes", path)
+        module = importlib.util.module_from_spec(spec)
+        sys.modules[spec.name] = module
+        spec.loader.exec_module(module)
+        return module
+    finally:
+        if saved is None:
+            sys.modules.pop("lmnr", None)
+        else:
+            sys.modules["lmnr"] = saved
+@pytest.fixture(scope="module")
+def eval_mod():
+    return _load_eval_module()
+# ===================================================================
+# extract_qa_report
+# ===================================================================
+class TestExtractQaReport:
+    def test_extracts_agent_comments(self, eval_mod):
+        comments = [
+            {"user": {"login": "openhands-agent"}, "id": 1, "body": "QA report", "created_at": "2024-01-01"},
+            {"user": {"login": "human-dev"}, "id": 2, "body": "looks good", "created_at": "2024-01-02"},
+            {"user": {"login": "all-hands-bot"}, "id": 3, "body": "another report", "created_at": "2024-01-03"},
+        ]
+        result = eval_mod.extract_qa_report(comments)
+        assert len(result) == 2
+        assert result[0]["id"] == 1
+        assert result[0]["type"] == "qa_report"
+        assert result[1]["id"] == 3
+    def test_empty_comments(self, eval_mod):
+        assert eval_mod.extract_qa_report([]) == []
+    def test_no_agent_comments(self, eval_mod):
+        comments = [
+            {"user": {"login": "human"}, "id": 1, "body": "test", "created_at": "2024-01-01"},
+        ]
+        assert eval_mod.extract_qa_report(comments) == []
+# ===================================================================
+# extract_human_responses
+# ===================================================================
+class TestExtractHumanResponses:
+    def test_extracts_human_comments(self, eval_mod):
+        comments = [
+            {"user": {"login": "openhands-agent"}, "id": 1, "body": "QA report", "created_at": "2024-01-01"},
+            {"user": {"login": "dev-alice"}, "id": 2, "body": "thanks", "created_at": "2024-01-02"},
+            {"user": {"login": "dev-bob"}, "id": 3, "body": "agreed", "created_at": "2024-01-03"},
+        ]
+        result = eval_mod.extract_human_responses(comments)
+        assert len(result) == 2
+        assert result[0]["user"] == "dev-alice"
+        assert result[1]["user"] == "dev-bob"
+    def test_empty_comments(self, eval_mod):
+        assert eval_mod.extract_human_responses([]) == []
+    def test_all_agent_comments(self, eval_mod):
+        comments = [
+            {"user": {"login": "openhands-agent"}, "id": 1, "body": "report", "created_at": "2024-01-01"},
+        ]
+        assert eval_mod.extract_human_responses(comments) == []
+    def test_custom_agent_users(self, eval_mod):
+        comments = [
+            {"user": {"login": "my-bot"}, "id": 1, "body": "report", "created_at": "2024-01-01"},
+            {"user": {"login": "human"}, "id": 2, "body": "ok", "created_at": "2024-01-02"},
+        ]
+        result = eval_mod.extract_human_responses(comments, agent_users={"my-bot"})
+        assert len(result) == 1
+        assert result[0]["user"] == "human"
+# ===================================================================
+# truncate_text
+# ===================================================================
+class TestTruncateText:
+    def test_short_text_unchanged(self, eval_mod):
+        assert eval_mod.truncate_text("hello") == "hello"
+    def test_exact_limit(self, eval_mod):
+        text = "x" * 100
+        assert eval_mod.truncate_text(text, max_chars=100) == text
+    def test_over_limit(self, eval_mod):
+        text = "x" * 200
+        result = eval_mod.truncate_text(text, max_chars=100)
+        assert result.startswith("x" * 100)
+        assert "truncated" in result
+        assert "200" in result
+    def test_default_limit_is_50k(self, eval_mod):
+        text = "x" * 50000
+        assert eval_mod.truncate_text(text) == text
+        text_over = "x" * 50001
+        assert "truncated" in eval_mod.truncate_text(text_over)
+# ===================================================================
+# calculate_engagement_score
+# ===================================================================
+class TestCalculateEngagementScore:
+    def test_no_comments_no_merge(self, eval_mod):
+        score = eval_mod.calculate_engagement_score([], [], False)
+        assert score == 0.0
+    def test_qa_report_posted_no_responses(self, eval_mod):
+        qa = [{"type": "qa_report", "body": "report"}]
+        score = eval_mod.calculate_engagement_score(qa, [], False)
+        assert score == pytest.approx(0.3)
+    def test_qa_report_with_responses(self, eval_mod):
+        qa = [{"type": "qa_report", "body": "report"}]
+        human = [{"type": "issue_comment", "body": "thanks"}]
+        score = eval_mod.calculate_engagement_score(qa, human, False)
+        # 0.3 (report) + 1.0 * 0.2 (response ratio capped at 1.0)
+        assert score == pytest.approx(0.5)
+    def test_merged_bonus(self, eval_mod):
+        score = eval_mod.calculate_engagement_score([], [], True)
+        assert score == pytest.approx(0.3)
+    def test_full_engagement(self, eval_mod):
+        qa = [{"type": "qa_report", "body": "report"}]
+        human = [{"type": "issue_comment", "body": "thanks"}]
+        score = eval_mod.calculate_engagement_score(qa, human, True)
+        # 0.3 (report) + 0.2 (response) + 0.3 (merged)
+        assert score == pytest.approx(0.8)
+    def test_many_responses_capped(self, eval_mod):
+        qa = [{"type": "qa_report", "body": "report"}]
+        human = [{"body": f"msg {i}"} for i in range(10)]
+        score = eval_mod.calculate_engagement_score(qa, human, False)
+        # ratio capped at 1.0 → 0.3 + 0.2
+        assert score == pytest.approx(0.5)
+    def test_multiple_qa_comments_with_fewer_responses(self, eval_mod):
+        qa = [{"body": f"qa {i}"} for i in range(4)]
+        human = [{"body": "reply"}]
+        score = eval_mod.calculate_engagement_score(qa, human, False)
+        # 0.3 + (1/4) * 0.2 = 0.35
+        assert score == pytest.approx(0.35)
+# ===================================================================
+# load_trace_info
+# ===================================================================
+class TestLoadTraceInfo:
+    def test_file_not_found_returns_empty(self, eval_mod, tmp_path):
+        result = eval_mod.load_trace_info(str(tmp_path / "nonexistent.json"))
+        assert result == {}
+    def test_loads_valid_trace_file(self, eval_mod, tmp_path):
+        trace_data = {
+            "trace_id": "abc-123",
+            "span_context": {"trace_id": "abc", "span_id": "def"},
+            "pr_number": "42",
+            "repo_name": "org/repo",
+            "commit_id": "deadbeef",
+            "model": "claude-sonnet",
+        }
+        trace_file = tmp_path / "trace.json"
+        trace_file.write_text(json.dumps(trace_data))
+        result = eval_mod.load_trace_info(str(trace_file))
+        assert result["trace_id"] == "abc-123"
+        assert result["pr_number"] == "42"
+        assert result["span_context"]["trace_id"] == "abc"
+    def test_trace_without_span_context(self, eval_mod, tmp_path):
+        trace_data = {"trace_id": "abc-123"}
+        trace_file = tmp_path / "trace.json"
+        trace_file.write_text(json.dumps(trace_data))
+        result = eval_mod.load_trace_info(str(trace_file))
+        assert result["trace_id"] == "abc-123"
+        assert result.get("span_context") is None