agentic-rubric-runner 0.5.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (81)
  1. agentic_rubric_runner-0.5.0/.devcontainer/devcontainer.json +33 -0
  2. agentic_rubric_runner-0.5.0/.env.example +3 -0
  3. agentic_rubric_runner-0.5.0/.github/workflows/ci.yml +76 -0
  4. agentic_rubric_runner-0.5.0/.github/workflows/pages.yml +33 -0
  5. agentic_rubric_runner-0.5.0/.github/workflows/publish.yml +28 -0
  6. agentic_rubric_runner-0.5.0/.gitignore +28 -0
  7. agentic_rubric_runner-0.5.0/.python-version +1 -0
  8. agentic_rubric_runner-0.5.0/.streamlit/config.toml +15 -0
  9. agentic_rubric_runner-0.5.0/.streamlit/deploy.toml +18 -0
  10. agentic_rubric_runner-0.5.0/LICENSE +21 -0
  11. agentic_rubric_runner-0.5.0/PKG-INFO +596 -0
  12. agentic_rubric_runner-0.5.0/README.md +566 -0
  13. agentic_rubric_runner-0.5.0/aarrr_agent/__init__.py +1 -0
  14. agentic_rubric_runner-0.5.0/aarrr_agent/agent.py +242 -0
  15. agentic_rubric_runner-0.5.0/aarrr_agent/assets/executive_report.css +224 -0
  16. agentic_rubric_runner-0.5.0/aarrr_agent/attachment_relevance.py +206 -0
  17. agentic_rubric_runner-0.5.0/aarrr_agent/benchmark.py +815 -0
  18. agentic_rubric_runner-0.5.0/aarrr_agent/cli.py +435 -0
  19. agentic_rubric_runner-0.5.0/aarrr_agent/config.py +33 -0
  20. agentic_rubric_runner-0.5.0/aarrr_agent/env.py +17 -0
  21. agentic_rubric_runner-0.5.0/aarrr_agent/errors.py +21 -0
  22. agentic_rubric_runner-0.5.0/aarrr_agent/evidence.py +141 -0
  23. agentic_rubric_runner-0.5.0/aarrr_agent/grader.py +253 -0
  24. agentic_rubric_runner-0.5.0/aarrr_agent/grading_calibration.py +35 -0
  25. agentic_rubric_runner-0.5.0/aarrr_agent/grading_report.py +298 -0
  26. agentic_rubric_runner-0.5.0/aarrr_agent/html_pdf.py +79 -0
  27. agentic_rubric_runner-0.5.0/aarrr_agent/html_report.py +28 -0
  28. agentic_rubric_runner-0.5.0/aarrr_agent/llm.py +47 -0
  29. agentic_rubric_runner-0.5.0/aarrr_agent/md_report_parser.py +310 -0
  30. agentic_rubric_runner-0.5.0/aarrr_agent/pdf_gen.py +437 -0
  31. agentic_rubric_runner-0.5.0/aarrr_agent/phase1_state.py +83 -0
  32. agentic_rubric_runner-0.5.0/aarrr_agent/pipeline.py +232 -0
  33. agentic_rubric_runner-0.5.0/aarrr_agent/report_models.py +45 -0
  34. agentic_rubric_runner-0.5.0/aarrr_agent/reporting.py +46 -0
  35. agentic_rubric_runner-0.5.0/aarrr_agent/retrieval.py +88 -0
  36. agentic_rubric_runner-0.5.0/aarrr_agent/schemas.py +96 -0
  37. agentic_rubric_runner-0.5.0/aarrr_agent/structured_report.py +341 -0
  38. agentic_rubric_runner-0.5.0/aarrr_agent/templates/executive_report.html +109 -0
  39. agentic_rubric_runner-0.5.0/aarrr_agent/tools.py +415 -0
  40. agentic_rubric_runner-0.5.0/aarrr_agent/validation.py +61 -0
  41. agentic_rubric_runner-0.5.0/aarrr_agent/web_app.py +548 -0
  42. agentic_rubric_runner-0.5.0/app.py +27 -0
  43. agentic_rubric_runner-0.5.0/docs/agent_scoring_upgrade.md +448 -0
  44. agentic_rubric_runner-0.5.0/docs/index.html +100 -0
  45. agentic_rubric_runner-0.5.0/docs/streamlit_deploy.md +93 -0
  46. agentic_rubric_runner-0.5.0/docs/style.css +193 -0
  47. agentic_rubric_runner-0.5.0/fixtures/attachment.pdf +0 -0
  48. agentic_rubric_runner-0.5.0/fixtures/benchmarks/agent_cases.example.json +140 -0
  49. agentic_rubric_runner-0.5.0/fixtures/query.txt +1 -0
  50. agentic_rubric_runner-0.5.0/fixtures/rubrics.json +230 -0
  51. agentic_rubric_runner-0.5.0/fonts/.gitkeep +0 -0
  52. agentic_rubric_runner-0.5.0/fonts/README.md +6 -0
  53. agentic_rubric_runner-0.5.0/fonts/msyh.ttc +0 -0
  54. agentic_rubric_runner-0.5.0/packages.txt +1 -0
  55. agentic_rubric_runner-0.5.0/pyproject.toml +41 -0
  56. agentic_rubric_runner-0.5.0/requirements-streamlit.txt +2 -0
  57. agentic_rubric_runner-0.5.0/requirements-web.txt +3 -0
  58. agentic_rubric_runner-0.5.0/requirements.txt +10 -0
  59. agentic_rubric_runner-0.5.0/solution.py +12 -0
  60. agentic_rubric_runner-0.5.0/tests/__init__.py +0 -0
  61. agentic_rubric_runner-0.5.0/tests/test_agent_loop.py +90 -0
  62. agentic_rubric_runner-0.5.0/tests/test_agent_messages.py +87 -0
  63. agentic_rubric_runner-0.5.0/tests/test_attachment_relevance.py +153 -0
  64. agentic_rubric_runner-0.5.0/tests/test_cli_import.py +169 -0
  65. agentic_rubric_runner-0.5.0/tests/test_evidence.py +29 -0
  66. agentic_rubric_runner-0.5.0/tests/test_grading_report.py +65 -0
  67. agentic_rubric_runner-0.5.0/tests/test_html_report.py +95 -0
  68. agentic_rubric_runner-0.5.0/tests/test_path_whitelist.py +25 -0
  69. agentic_rubric_runner-0.5.0/tests/test_pdf_gen.py +42 -0
  70. agentic_rubric_runner-0.5.0/tests/test_phase1_finalize.py +47 -0
  71. agentic_rubric_runner-0.5.0/tests/test_phase1_state_machine.py +38 -0
  72. agentic_rubric_runner-0.5.0/tests/test_project_urls.py +19 -0
  73. agentic_rubric_runner-0.5.0/tests/test_report_validation.py +14 -0
  74. agentic_rubric_runner-0.5.0/tests/test_retrieval.py +17 -0
  75. agentic_rubric_runner-0.5.0/tests/test_schemas.py +30 -0
  76. agentic_rubric_runner-0.5.0/tests/test_score_recalculate.py +34 -0
  77. agentic_rubric_runner-0.5.0/tests/test_structured_report.py +94 -0
  78. agentic_rubric_runner-0.5.0/tests/test_trace.py +56 -0
  79. agentic_rubric_runner-0.5.0/tests/test_validation_critic.py +40 -0
  80. agentic_rubric_runner-0.5.0/tests/test_web_entry.py +19 -0
  81. agentic_rubric_runner-0.5.0/tests/test_web_no_public_demo.py +17 -0
@@ -0,0 +1,33 @@
1
+ {
2
+ "name": "Python 3",
3
+ // Or use a Dockerfile or Docker Compose file. More info: https://containers.dev/guide/dockerfile
4
+ "image": "mcr.microsoft.com/devcontainers/python:1-3.11-bookworm",
5
+ "customizations": {
6
+ "codespaces": {
7
+ "openFiles": [
8
+ "README.md",
9
+ "app.py"
10
+ ]
11
+ },
12
+ "vscode": {
13
+ "settings": {},
14
+ "extensions": [
15
+ "ms-python.python",
16
+ "ms-python.vscode-pylance"
17
+ ]
18
+ }
19
+ },
20
+ "updateContentCommand": "[ -f packages.txt ] && sudo apt update && sudo apt upgrade -y && sudo xargs apt install -y <packages.txt; [ -f requirements-web.txt ] && pip3 install --user -r requirements-web.txt; echo '✅ Packages installed and Requirements met'",
21
+ "postAttachCommand": {
22
+ "server": "streamlit run app.py --server.enableCORS false --server.enableXsrfProtection false"
23
+ },
24
+ "portsAttributes": {
25
+ "8501": {
26
+ "label": "Application",
27
+ "onAutoForward": "openPreview"
28
+ }
29
+ },
30
+ "forwardPorts": [
31
+ 8501
32
+ ]
33
+ }
@@ -0,0 +1,3 @@
1
+ DEEPSEEK_API_KEY=sk-your-key-here
2
+ DEEPSEEK_BASE_URL=https://api.deepseek.com
3
+ DEEPSEEK_MODEL=deepseek-chat
@@ -0,0 +1,76 @@
1
+ name: CI
2
+
3
+ on:
4
+ push:
5
+ branches: [main]
6
+ pull_request:
7
+
8
+ jobs:
9
+ cli-only:
10
+ runs-on: ubuntu-latest
11
+
12
+ steps:
13
+ - uses: actions/checkout@v4
14
+
15
+ - uses: actions/setup-python@v5
16
+ with:
17
+ python-version: "3.11"
18
+
19
+ - name: Install CLI only (no [web])
20
+ run: |
21
+ python -m pip install --upgrade pip
22
+ pip install -e .
23
+
24
+ - name: CLI smoke (core commands)
25
+ run: |
26
+ agentic-rubric --help
27
+ agentic-rubric run --help
28
+ agentic-rubric phase1 --help
29
+ agentic-rubric grade --help
30
+ agentic-rubric validate --help
31
+ agentic-rubric eval-run --help
32
+ agentic-rubric bench --help
33
+ agentic-rubric inspect-trace --help
34
+ agentic-rubric init --help
35
+
36
+ test-build:
37
+ runs-on: ubuntu-latest
38
+
39
+ steps:
40
+ - uses: actions/checkout@v4
41
+
42
+ - uses: actions/setup-python@v5
43
+ with:
44
+ python-version: "3.11"
45
+
46
+ - name: Install
47
+ run: |
48
+ python -m pip install --upgrade pip
49
+ pip install -e ".[dev,web]"
50
+
51
+ - name: Ruff
52
+ run: ruff check aarrr_agent tests app.py || true
53
+
54
+ - name: Pytest
55
+ run: pytest -q
56
+
57
+ - name: CLI help (with web extra)
58
+ run: |
59
+ agentic-rubric --help
60
+ agentic-rubric run --help
61
+ agentic-rubric phase1 --help
62
+ agentic-rubric grade --help
63
+ agentic-rubric validate --help
64
+ agentic-rubric eval-run --help
65
+ agentic-rubric bench --help
66
+ agentic-rubric inspect-trace --help
67
+ agentic-rubric ui --help
68
+
69
+ - name: Build package
70
+ run: python -m build
71
+
72
+ - name: Upload dist
73
+ uses: actions/upload-artifact@v4
74
+ with:
75
+ name: dist
76
+ path: dist/
@@ -0,0 +1,33 @@
1
+ name: Deploy GitHub Pages
2
+
3
+ on:
4
+ push:
5
+ branches: [main]
6
+ workflow_dispatch:
7
+
8
+ permissions:
9
+ contents: read
10
+ pages: write
11
+ id-token: write
12
+
13
+ concurrency:
14
+ group: pages
15
+ cancel-in-progress: true
16
+
17
+ jobs:
18
+ deploy:
19
+ runs-on: ubuntu-latest
20
+ environment:
21
+ name: github-pages
22
+ url: ${{ steps.deployment.outputs.page_url }}
23
+ steps:
24
+ - uses: actions/checkout@v4
25
+
26
+ - uses: actions/configure-pages@v5
27
+
28
+ - uses: actions/upload-pages-artifact@v3
29
+ with:
30
+ path: docs
31
+
32
+ - id: deployment
33
+ uses: actions/deploy-pages@v4
@@ -0,0 +1,28 @@
1
+ name: Publish to PyPI
2
+
3
+ on:
4
+ push:
5
+ tags:
6
+ - "v*"
7
+
8
+ jobs:
9
+ build-and-publish:
10
+ runs-on: ubuntu-latest
11
+ permissions:
12
+ id-token: write
13
+
14
+ steps:
15
+ - uses: actions/checkout@v4
16
+
17
+ - uses: actions/setup-python@v5
18
+ with:
19
+ python-version: "3.11"
20
+
21
+ - name: Install build tools
22
+ run: pip install hatch
23
+
24
+ - name: Build
25
+ run: hatch build
26
+
27
+ - name: Publish to PyPI
28
+ uses: pypa/gh-action-pypi-publish@release/v1
@@ -0,0 +1,28 @@
1
+ .venv/
2
+ .venv_pip_test/
3
+ __pycache__/
4
+ .pytest_cache/
5
+ *.pyc
6
+ *.pyo
7
+ .env
8
+ outputs/
9
+ dist/
10
+ dist_check/
11
+ build/
12
+ *.egg-info/
13
+ agent_trace_emergency.jsonl
14
+ phase1_output.pdf
15
+ phase1_output.md
16
+ phase1_output.html
17
+ grading_result.json
18
+ agent_trace.jsonl
19
+ run_meta.json
20
+ fonts/*
21
+ !fonts/.gitkeep
22
+ !fonts/README.md
23
+ !fonts/msyh.ttc
24
+ samples/
25
+ *.pdf
26
+ !fixtures/attachment.pdf
27
+ .DS_Store
28
+ Thumbs.db
@@ -0,0 +1 @@
1
+ 3.11
@@ -0,0 +1,15 @@
1
+ [theme]
2
+ primaryColor = "#1e40af"
3
+ backgroundColor = "#f1f5f9"
4
+ secondaryBackgroundColor = "#ffffff"
5
+ textColor = "#0f172a"
6
+ font = "sans serif"
7
+
8
+ [server]
9
+ headless = true
10
+
11
+ [client]
12
+ toolbarMode = "minimal"
13
+
14
+ [browser]
15
+ gatherUsageStats = false
@@ -0,0 +1,18 @@
1
+ # Streamlit Community Cloud deployment manifest
2
+ # https://share.streamlit.io/
3
+
4
+ [deploy]
5
+ # Enter these values in the Streamlit console (this file is documentation only; Streamlit does not read it automatically)
6
+ repository = "bosprimigenious/agentic-rubric-runner"
7
+ branch = "main"
8
+ main_file = "app.py"
9
+ # Advanced → Requirements file: requirements-streamlit.txt
10
+ # Alternative entry point (requires requirements-web.txt / the [web] extra):
11
+ # main_file = "aarrr_agent/web_app.py"
12
+ python_version = "3.11"
13
+
14
+ # Secrets: leave empty (users enter their API key on the page)
15
+ # Advanced > Secrets: do not set DEEPSEEK_API_KEY
16
+
17
+ # App URL after deployment (current production environment):
18
+ app_url = "https://agentic-rubric-runner.streamlit.app/"
@@ -0,0 +1,21 @@
1
+ MIT License
2
+
3
+ Copyright (c) 2026 BosPrimigenious
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.