crossai-cli 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (64) hide show
  1. cross_ai/__init__.py +0 -0
  2. cross_ai/ai_error_handler.py +15 -0
  3. cross_ai/ai_handler.py +22 -0
  4. cross_ai/ai_url.py +89 -0
  5. cross_ai/base_handler.py +3 -0
  6. cross_ai/commands.py +54 -0
  7. cross_ai/cross_stones/cross-stones-10.json +57 -0
  8. cross_ai/cross_stones/domains/creative_media.prompt +18 -0
  9. cross_ai/cross_stones/domains/customer_service.prompt +12 -0
  10. cross_ai/cross_stones/domains/data_analytics.prompt +18 -0
  11. cross_ai/cross_stones/domains/education_learning.prompt +18 -0
  12. cross_ai/cross_stones/domains/finance_business.prompt +18 -0
  13. cross_ai/cross_stones/domains/healthcare_medical.prompt +18 -0
  14. cross_ai/cross_stones/domains/marketing_content.prompt +72 -0
  15. cross_ai/cross_stones/domains/research_qa.prompt +18 -0
  16. cross_ai/cross_stones/domains/software_development.prompt +19 -0
  17. cross_ai/cross_stones/domains/writing_editing.prompt +18 -0
  18. cross_ai/discourse.py +192 -0
  19. cross_ai/mmd_branding.py +42 -0
  20. cross_ai/mmd_data_analysis.py +382 -0
  21. cross_ai/mmd_for_speaking.py +225 -0
  22. cross_ai/mmd_plot.py +121 -0
  23. cross_ai/mmd_process_report.py +285 -0
  24. cross_ai/mmd_single_key.py +188 -0
  25. cross_ai/mmd_startup.py +69 -0
  26. cross_ai/mmd_util.py +234 -0
  27. cross_ai/mmd_voice.py +163 -0
  28. cross_ai/mmd_web_server.py +88 -0
  29. cross_ai/st-admin.py +791 -0
  30. cross_ai/st-analyze.py +441 -0
  31. cross_ai/st-bang.py +554 -0
  32. cross_ai/st-cat.py +122 -0
  33. cross_ai/st-cross.py +749 -0
  34. cross_ai/st-domain.py +466 -0
  35. cross_ai/st-edit.py +368 -0
  36. cross_ai/st-fact.py +657 -0
  37. cross_ai/st-fetch.py +359 -0
  38. cross_ai/st-find.py +375 -0
  39. cross_ai/st-fix.py +1926 -0
  40. cross_ai/st-gen.py +230 -0
  41. cross_ai/st-heatmap.py +394 -0
  42. cross_ai/st-ls.py +270 -0
  43. cross_ai/st-man.py +247 -0
  44. cross_ai/st-merge.py +841 -0
  45. cross_ai/st-new.py +169 -0
  46. cross_ai/st-plot.py +471 -0
  47. cross_ai/st-post.py +334 -0
  48. cross_ai/st-prep.py +242 -0
  49. cross_ai/st-print.py +497 -0
  50. cross_ai/st-read.py +155 -0
  51. cross_ai/st-rm.py +176 -0
  52. cross_ai/st-speak.py +128 -0
  53. cross_ai/st-speed.py +945 -0
  54. cross_ai/st-stones.py +1435 -0
  55. cross_ai/st-verdict.py +538 -0
  56. cross_ai/st-voice.py +237 -0
  57. cross_ai/st.py +503 -0
  58. cross_ai/template/default.prompt +10 -0
  59. crossai_cli-0.1.0.dist-info/METADATA +327 -0
  60. crossai_cli-0.1.0.dist-info/RECORD +64 -0
  61. crossai_cli-0.1.0.dist-info/WHEEL +5 -0
  62. crossai_cli-0.1.0.dist-info/entry_points.txt +30 -0
  63. crossai_cli-0.1.0.dist-info/licenses/LICENSE +26 -0
  64. crossai_cli-0.1.0.dist-info/top_level.txt +1 -0
cross_ai/__init__.py ADDED
File without changes
@@ -0,0 +1,15 @@
1
+ # ai_error_handler.py — compatibility shim
2
+ # Source of truth: cross-ai-core package (cross_ai_core.ai_error_handler)
3
+ from cross_ai_core.ai_error_handler import * # noqa: F401, F403
4
+ from cross_ai_core.ai_error_handler import ( # explicit for IDE / type checkers
5
+ handle_api_error,
6
+ is_quota_error,
7
+ is_rate_limit_error,
8
+ is_transient_error,
9
+ get_error_type,
10
+ retry_with_backoff,
11
+ CrossAIError,
12
+ QuotaExceededError,
13
+ RateLimitError,
14
+ TransientError,
15
+ )
cross_ai/ai_handler.py ADDED
@@ -0,0 +1,22 @@
1
+ # ai_handler.py — compatibility shim
2
+ # Source of truth: cross-ai-core package (cross_ai_core.ai_handler)
3
+ # This file exists so st-*.py files and tests can continue to use:
4
+ # from ai_handler import process_prompt, get_content, ...
5
+ from cross_ai_core.ai_handler import * # noqa: F401, F403
6
+ from cross_ai_core.ai_handler import ( # explicit for IDE / type checkers
7
+ AI_HANDLER_REGISTRY,
8
+ AI_LIST,
9
+ AIResponse,
10
+ _API_KEY_ENV_VARS, # private — needed by tests
11
+ check_api_key,
12
+ get_ai_list,
13
+ get_ai_make,
14
+ get_ai_model,
15
+ get_content,
16
+ get_data_content,
17
+ get_data_title,
18
+ get_default_ai,
19
+ get_usage,
20
+ process_prompt,
21
+ put_content,
22
+ )
cross_ai/ai_url.py ADDED
@@ -0,0 +1,89 @@
1
+ # Sorry, no AI here
2
+ import os
3
+ import json
4
+ import hashlib
5
+ import requests
6
+ import sys
7
+
8
+ AI_MAKE = "url"
9
+ AI_MODEL = "bs4"
10
+
11
+
12
def get_url_cached_response(tweet_id, verbose=False, use_cache=False):
    """Fetch a tweet from the X (Twitter) v2 API, optionally via a disk cache.

    Args:
        tweet_id: Identifier interpolated into the ``/2/tweets/{tweet_id}``
            endpoint URL.
        verbose: When true, print cache hit/miss and file-creation messages.
        use_cache: When true, look the response up in (and store it to)
            ``~/.cross_api_cache``; when false, always call the API.

    Returns:
        A ``(json_response, was_cached)`` tuple. ``json_response`` is the
        decoded JSON body; ``was_cached`` is True only when the body was read
        from an existing cache file.

    On the cached path, a cache miss whose API call does not return HTTP 200
    prints a message and terminates the process with ``sys.exit(1)``.
    """
    url = f"https://api.twitter.com/2/tweets/{tweet_id}"
    headers = get_url_headers()

    if not use_cache:
        response = requests.get(url, headers=headers)
        # A requests.Response cannot be passed to json.dumps(); decode the
        # body with Response.json() instead.
        return response.json(), False  # Not cached

    # Hash the full request description so every distinct request maps to
    # its own cache file.
    param = {
        "tweet_id": tweet_id,
        "headers": headers,
        "url": url,
    }
    param_str = json.dumps(param, sort_keys=True)
    md5_hash = hashlib.md5(param_str.encode('utf-8')).hexdigest()

    # Construct the cache file path
    cache_dir = os.path.expanduser("~/.cross_api_cache")
    cache_file = os.path.join(cache_dir, f"{md5_hash}.json")

    # Check if the response is already in cache
    if os.path.exists(cache_file):
        if verbose:
            print(f"api_cache: Using cache_file: {cache_file}")
        with open(cache_file, 'r', encoding='utf-8') as f:
            return json.load(f), True  # Cached

    if verbose:
        print("api_cache: cache miss, submitting API request")

    # Not in cache: fetch the response
    response = requests.get(url, headers=headers)
    # status_code is an attribute of Response, not a mapping key.
    if (status_code := response.status_code) != 200:
        print(f"x.com response failed: {status_code}")
        sys.exit(1)
    json_response = response.json()

    # Save to cache
    if not os.path.exists(cache_dir):
        # exist_ok guards against another process creating the directory
        # between the check above and this call.
        os.makedirs(cache_dir, exist_ok=True)
        if verbose:
            print(f"api_cache: api_cache/ dir created: {cache_dir}")

    try:
        with open(cache_file, 'w', encoding='utf-8') as f:
            json.dump(json_response, f)
        if verbose:
            print(f"api_cache: file created: {cache_file}")
    except OSError as e:
        # Caching is best-effort: report the failure but still return data.
        print(f"api_cache: file write error: {str(e)}")

    return json_response, False  # Fresh API call, not cached
69
+
70
+
71
def get_url_headers():
    """Build the HTTP headers used to authenticate against the X API.

    The bearer token is read from the ``X_COM_BEARER_TOKEN`` environment
    variable; the lookup result is interpolated as-is.
    """
    token = os.getenv('X_COM_BEARER_TOKEN')
    return {"Authorization": f"Bearer {token}"}
75
+
76
+
77
def get_title(data):
    """Return the ``"title"`` entry of *data*, or None when it is absent."""
    return data.get("title")
80
+
81
+
82
def get_story(data):
    """Return the ``"text"`` entry of *data*, or None when it is absent."""
    return data.get("text")
85
+
86
+
87
def get_ai_tag():
    """Return the ``cross:`` trailer naming this handler's make and model.

    The trailer is two newlines, the literal ``cross:``, then a JSON object
    built from the module-level ``AI_MAKE`` and ``AI_MODEL`` constants.
    """
    tag = {"make": AI_MAKE, "model": AI_MODEL}
    encoded = json.dumps(tag)
    return "\n\ncross:" + encoded
@@ -0,0 +1,3 @@
1
+ # base_handler.py — compatibility shim
2
+ # Source of truth: cross-ai-core package (cross_ai_core.ai_base)
3
+ from cross_ai_core.ai_base import BaseAIHandler, _get_cache_dir # noqa: F401
cross_ai/commands.py ADDED
@@ -0,0 +1,54 @@
1
+ """
2
+ commands.py — Entry-point dispatch for pyproject.toml [project.scripts].
3
+ pip generates a thin wrapper that imports and calls each function here;
4
+ runpy executes the st-*.py file directly so hyphens in filenames are never
5
+ treated as Python identifiers.
6
+ """
7
+ import os
8
+ import runpy
9
+ import sys
10
+
11
+ _HERE = os.path.dirname(os.path.abspath(__file__))
12
+
13
+ # Ensure the cross_ai/ directory is on sys.path so that st-*.py scripts can
14
+ # use bare module imports (e.g. `from mmd_startup import require_config`).
15
+ # When scripts are run directly as files, Python adds their directory to
16
+ # sys.path[0] automatically — runpy.run_path() does not, so we do it here.
17
+ if _HERE not in sys.path:
18
+ sys.path.insert(0, _HERE)
19
+
20
+
21
def _run(name: str) -> None:
    """Execute the sibling script ``<name>.py`` as if it were ``__main__``.

    The script is located next to this module (``_HERE``) and run by path,
    so hyphenated file names never have to be valid Python identifiers.
    """
    script_path = os.path.join(_HERE, f"{name}.py")
    runpy.run_path(script_path, run_name="__main__")
23
+
24
+
25
# Console-script entry points: each one runs the script of the same name
# (underscores in the function name become hyphens in the file name).
def st():
    _run("st")


def st_admin():
    _run("st-admin")


def st_analyze():
    _run("st-analyze")


def st_bang():
    _run("st-bang")


def st_cat():
    _run("st-cat")


def st_cross():
    _run("st-cross")


def st_domain():
    _run("st-domain")


def st_edit():
    _run("st-edit")


def st_fact():
    _run("st-fact")


def st_fetch():
    _run("st-fetch")


def st_find():
    _run("st-find")


def st_fix():
    _run("st-fix")


def st_gen():
    _run("st-gen")


def st_heatmap():
    _run("st-heatmap")


def st_ls():
    _run("st-ls")


def st_man():
    _run("st-man")


def st_merge():
    _run("st-merge")


def st_new():
    _run("st-new")


def st_plot():
    _run("st-plot")


def st_post():
    _run("st-post")


def st_prep():
    _run("st-prep")


def st_print():
    _run("st-print")


def st_read():
    _run("st-read")


def st_rm():
    _run("st-rm")


def st_speak():
    _run("st-speak")


def st_speed():
    _run("st-speed")


def st_stones():
    _run("st-stones")


def st_verdict():
    _run("st-verdict")


def st_voice():
    _run("st-voice")
54
+
@@ -0,0 +1,57 @@
1
+ {
2
+ "id": "cross-stones-10",
3
+ "description": "Standard 10-domain Cross-Stones benchmark set. Locked params ensure scores are directly comparable across runs over time.",
4
+ "n_claims": 10,
5
+ "max_fact_score": 200,
6
+ "domains_dir": "domains",
7
+ "domains": [
8
+ {
9
+ "id": "software_development",
10
+ "name": "Software Development & Programming"
11
+ },
12
+ {
13
+ "id": "customer_service",
14
+ "name": "Customer Service & Support"
15
+ },
16
+ {
17
+ "id": "marketing_content",
18
+ "name": "Marketing & Content Creation"
19
+ },
20
+ {
21
+ "id": "education_learning",
22
+ "name": "Education & Learning"
23
+ },
24
+ {
25
+ "id": "data_analytics",
26
+ "name": "Data Analytics & Business Intelligence"
27
+ },
28
+ {
29
+ "id": "healthcare_medical",
30
+ "name": "Healthcare & Medical Analysis"
31
+ },
32
+ {
33
+ "id": "finance_business",
34
+ "name": "Finance & Business Decision Making"
35
+ },
36
+ {
37
+ "id": "writing_editing",
38
+ "name": "Writing, Editing & Summarizing"
39
+ },
40
+ {
41
+ "id": "research_qa",
42
+ "name": "Research, Search & Q&A"
43
+ },
44
+ {
45
+ "id": "creative_media",
46
+ "name": "Creative Media (Images, Video, Audio)"
47
+ }
48
+ ],
49
+ "snapshots": [],
50
+ "speed_baseline": {
51
+ "gen_seconds": 20.07,
52
+ "fc_seconds": 91.87,
53
+ "total_seconds": 111.94,
54
+ "recorded_date": "2026-03-27",
55
+ "notes": "Baseline recorded 2026-03-27 \u2014 average across all AI providers. Future runs faster than 111.9s total will have speed_ratio > 1.0 and cross_stone_score may exceed 1.0, reflecting genuine improvement over the 2026 benchmark era."
56
+ }
57
+ }
@@ -0,0 +1,18 @@
1
+ # Cross-Stone Benchmark Prompt -- Creative Media (Images, Video, Audio)
2
+
3
+ Write exactly 10 specific, fact-checkable claims about the current state of AI in creative media production -- including image generation, video synthesis, music composition, and audio production -- as of 2025-2026.
4
+
5
+ Each claim must be a clear, declarative statement that a well-informed analyst could verify -- using publicly available sources such as company announcements, legal filings, industry reports, or reputable technology and entertainment news outlets -- as True, Partially True, Opinion, Partially False, or False.
6
+
7
+ Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named tools), and half should require consulting primary sources, legal records, or detailed technical assessments published in 2024-2025.
8
+
9
+ Claims must not be vague generalizations. Each claim should include specific data points, named tools, model versions, legal case names, revenue figures, or named organizations where relevant.
10
+
11
+ Distribute your 10 claims across the following aspects:
12
+ - Capabilities and market adoption of leading AI image and video generation tools (e.g., DALL-E 3, Midjourney v6, Sora, Runway Gen-3, Stable Diffusion)
13
+ - AI in music generation, voice cloning, and audio production: leading tools, capabilities, and commercial deployments
14
+ - Commercial deployment of AI-generated media in advertising, film, publishing, and gaming industries
15
+ - Copyright, intellectual property, and compensation disputes involving AI-generated content (specific cases or legislation)
16
+ - Regulatory responses, platform policies, and industry standards addressing AI-generated deepfakes and synthetic media
17
+
18
+ Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
@@ -0,0 +1,12 @@
1
+ # Cross-Stone Benchmark Prompt — Customer Service & Support
2
+ Write exactly 10 specific, fact-checkable claims about the current state of AI in customer service and support automation as of 2025–2026.
3
+ Each claim must be a clear, declarative statement that a well-informed analyst could verify — using publicly available sources such as industry surveys, vendor case studies, analyst reports, or reputable news outlets — as True, Partially True, Opinion, Partially False, or False.
4
+ **Difficulty calibration:** Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed performance data published in 2024–2025.
5
+ **Claims must not be vague generalizations.** Each claim should include specific data points, named platforms, percentages, benchmark metrics, or named organizations where relevant.
6
+ Distribute your 10 claims across the following aspects:
7
+ - Automation and deflection rates for AI-powered chatbots and virtual agents across industries
8
+ - Customer satisfaction (CSAT) and first-contact resolution quality compared to human agents
9
+ - Adoption rates across specific industries (retail, telecom, banking, healthcare)
10
+ - Integration of large language models (LLMs) into contact center platforms (e.g., Salesforce Einstein, Zendesk AI, AWS Connect)
11
+ - Documented cost savings, ROI metrics, and workforce impact reported by organizations deploying AI in customer service
12
+ **Format:** Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
@@ -0,0 +1,18 @@
1
+ # Cross-Stone Benchmark Prompt -- Data Analytics & Business Intelligence
2
+
3
+ Write exactly 10 specific, fact-checkable claims about the current state of AI in data analytics and business intelligence as of 2025-2026.
4
+
5
+ Each claim must be a clear, declarative statement that a well-informed analyst could verify -- using publicly available sources such as vendor documentation, industry reports, academic studies, or reputable news outlets -- as True, Partially True, Opinion, Partially False, or False.
6
+
7
+ Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed technical documentation published in 2024-2025.
8
+
9
+ Claims must not be vague generalizations. Each claim should include specific data points, named tools, percentages, benchmark results, or named organizations where relevant.
10
+
11
+ Distribute your 10 claims across the following aspects:
12
+ - Adoption of AI and ML capabilities in major business intelligence platforms (e.g., Tableau, Microsoft Power BI, Looker, Snowflake Cortex)
13
+ - Impact of large language models on natural-language querying and self-service analytics
14
+ - AI-driven anomaly detection and predictive analytics performance in enterprise settings
15
+ - Accuracy, reliability, and hallucination risks in AI-generated data insights vs. human analysts
16
+ - Data governance, privacy, and explainability challenges in AI-driven analytics deployments
17
+
18
+ Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
@@ -0,0 +1,18 @@
1
+ # Cross-Stone Benchmark Prompt -- Education & Learning
2
+
3
+ Write exactly 10 specific, fact-checkable claims about the current state of AI in education and personalized learning as of 2025-2026.
4
+
5
+ Each claim must be a clear, declarative statement that a well-informed analyst could verify -- using publicly available sources such as academic research, institutional reports, or reputable news outlets -- as True, Partially True, Opinion, Partially False, or False.
6
+
7
+ Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed institutional data published in 2024-2025.
8
+
9
+ Claims must not be vague generalizations. Each claim should include specific data points, named platforms, percentages, study findings, or named institutions where relevant.
10
+
11
+ Distribute your 10 claims across the following aspects:
12
+ - Student and educator adoption rates of generative AI tools (e.g., ChatGPT, Khanmigo, Duolingo, Coursera AI)
13
+ - Measured learning outcomes from AI-assisted instruction or tutoring systems
14
+ - Institutional and government policies on AI use in classrooms and assessments
15
+ - AI-powered adaptive learning platforms and the evidence base for their effectiveness
16
+ - Academic integrity concerns, bias, and equity issues in AI-powered education
17
+
18
+ Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
@@ -0,0 +1,18 @@
1
+ # Cross-Stone Benchmark Prompt -- Finance & Business Decision Making
2
+
3
+ Write exactly 10 specific, fact-checkable claims about the current state of AI in financial services, risk management, and business decision-making as of 2025-2026.
4
+
5
+ Each claim must be a clear, declarative statement that a well-informed analyst could verify -- using publicly available sources such as regulatory filings, industry surveys, academic research, or reputable financial news outlets -- as True, Partially True, Opinion, Partially False, or False.
6
+
7
+ Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named systems), and half should require consulting primary sources, regulatory documents, or detailed financial performance data published in 2024-2025.
8
+
9
+ Claims must not be vague generalizations. Each claim should include specific data points, named platforms, dollar figures, performance metrics, regulatory citations, or named institutions where relevant.
10
+
11
+ Distribute your 10 claims across the following aspects:
12
+ - AI investment levels and adoption rates in the financial services sector (banks, insurers, asset managers)
13
+ - Performance of AI in fraud detection, credit scoring, and AML (anti-money laundering) systems
14
+ - AI in algorithmic trading and portfolio management: market share, strategies, and performance benchmarks
15
+ - Regulatory frameworks governing AI in financial services (e.g., EU AI Act, U.S. OCC guidance, SEC rules)
16
+ - Documented ROI, productivity gains, and risk reduction achieved by financial firms deploying AI
17
+
18
+ Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
@@ -0,0 +1,18 @@
1
+ # Cross-Stone Benchmark Prompt -- Healthcare & Medical Analysis
2
+
3
+ Write exactly 10 specific, fact-checkable claims about the current state of AI in healthcare, medical diagnostics, and clinical decision support as of 2025-2026.
4
+
5
+ Each claim must be a clear, declarative statement that a well-informed analyst could verify -- using publicly available sources such as peer-reviewed journals, FDA databases, hospital system reports, or reputable health news outlets -- as True, Partially True, Opinion, Partially False, or False.
6
+
7
+ Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named tools), and half should require consulting primary clinical literature, regulatory filings, or detailed health system data published in 2024-2025.
8
+
9
+ Claims must not be vague generalizations. Each claim should include specific data points, named systems, FDA clearance details, clinical trial results, percentages, or named institutions where relevant.
10
+
11
+ Distribute your 10 claims across the following aspects:
12
+ - FDA-cleared or CE-marked AI medical devices: cumulative count, approval trends, and leading categories (radiology, pathology, cardiology)
13
+ - Clinical performance of AI in medical imaging compared to human specialists (sensitivity, specificity, AUC metrics)
14
+ - AI in drug discovery and clinical trial design: timelines, cost reductions, and named examples
15
+ - Deployment and outcomes of AI clinical decision support systems in hospital settings
16
+ - Regulatory, liability, bias, and health equity challenges in medical AI adoption
17
+
18
+ Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
@@ -0,0 +1,72 @@
1
+ # Cross-Stone Benchmark Prompt — Marketing & Content Creation
2
+ Write exactly 10 specific, fact-checkable claims about the current state of AI in marketing and content creation as of 2025–2026.
3
+ Each claim must be a clear, declarative statement that a well-informed analyst could verify — using publicly available sources such as industry surveys, vendor reports, academic studies, or reputable news outlets — as True, Partially True, Opinion, Partially False, or False.
4
+ **Difficulty calibration:** Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed performance data published in 2024–2025.
5
+ **Claims must not be vague generalizations.** Each claim should include specific data points, named platforms, percentages, benchmark metrics, or named organizations where relevant.
6
+ Write exactly 10 specific, AIWrite exactly 10 specific, fact-checkable claims about the cururEach claim must be a clear, declarative statement that a well-informed analyst could verify — using publicly available sources sdi**Difficulty calibration:** Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed performance data published in 2024–2025.
7
+ *AI**Claims must not be vague generalizations.** Each claim should include specific data points, named platforms, percentages, benchmark metriccat > /Users/Matt/github/cross-internal/st-stones/template/education_learning.prompt << 'EOF'
8
+ # Cross-Stone Benchmark Prompt — Education & Learning
9
+ Write exactly 10 specific, fact-checkable claims about the current state of AI in education and personalized learning as of 2025–2026.
10
+ Each claim must be a clear, declarative statement that a well-informed analyst could verify — using publicly available sources such as academic research, institutional reports, or reputable news outlets — as True, Partially True, Opinion, Partially False, or False.
11
+ Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed institutional data published in 2024-2025.
12
+ Claims must not be vague generalizations. Each claim should include specific data points, named platforms, percentages, study findings, or named institutions where relevant.
13
+ Distribute your 10 c# Cross-Stone Benchmark Prompt — Education & Learning
14
+ Write exactly 10 specific, fact-checooWrite exactly 10 specific, fact-checkable claims aboutMeEach claim must be a clear, declarative statement that a well-informed analyst could verify — using publicly available sources such amsDifficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed institutional data published in 2024-2n Claims must not be vague generalizationpython3 << 'PYEOF'
15
+ import os
16
+ base = "/Users/Matt/github/cross-internal/st-stones/template"
17
+ files = {
18
+ "education_learning.prompt": """# Cross-Stone Benchmark Prompt — Education & Learning
19
+ Write exactly 10 specific, fact-checkable claims about the current state of AI in education and personalized learning as of 2025-2026.
20
+ Each claim must be a clear, declarative statement that a well-informed analyst could verify — using publicly available sources such as academic research, institutional reports, or reputable news outlets — as True, Partially True, Opinion, Partially False, or False.
21
+ Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed institutional data published in 2024-2025.
22
+ Claims must not be vague generalizations. Each claim should include specific data points, named platforms, percentages, study findings, or named institutionsimport os
23
+ base = Dibase = " yfiles = {
24
+ "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable claims about the current state of AI in educasEach claim must be a clear, declarative statement that a well-informed analyst could verify — using publicly available sources suchmsDifficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed institutional data published in 2024-2n Claims must not be vague generalizations. Each claim should include specific data points, named platforms, percentages, study findings, or named institutionsimport os
25
+ base = Dibase = " yfiles = {
26
+ "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dibase = " yfiles = {
27
+ "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable claims about the current state on,"education_learning.prompt" sbase = Dibase = " yfiles = {
28
+ "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dibase = " yfiles = {
29
+ "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable claims about the current state on,"education_learning.prompt" sbase = Dibase = " yfiles = {
30
+ "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dibase = " yfiles = {
31
+ "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable claims about the current state on,"education_learning.prompt" sbase = Dibase = " yfiles = {
32
+ "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dib L"education_learning.prompt"Im"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable y "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dibase = " yfiles = {
33
+ "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,, "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dibase = " yfiles = {
34
+ "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable d "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dib L"education_learning.prompt"Im"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly jo"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,, "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dibase = " yfiles = {
35
+ "education_learning.promptar"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable d "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dib L"education_lear
36
+ D"education_learning.promptar"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable d "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dib L"education_lear
37
+ D"education_learning.promptar"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable d "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dib L"education_lear
38
+ D"education_learning.promptar"edummD"education_learning.promptar"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable d "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dib L"education_le tD"education_learning.promptar"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable d "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dib L"education_leaasD"education_learning.promptar"edummD"education_learning.promptar"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable d "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite ce metrics, regulatory citations, or named institutions where relevant.
39
+ Distribute your 10 claims across the following aspects:
40
+ - AI investment levels and adoption rates in the financial services sector (banks, insurers, asset managers)
41
+ - Performance of AI in fraud detection, credit scoring, and AML (anti-money laundering) systems
42
+ - AI in algorithmic trading and portfolio management: market share, strategies, and performance benchmarks
43
+ - Regulatory frameworks governing AI in financial services (e.g., EU AI Act, U.S. OCC guidance, SEC rules)
44
+ - Documented ROI, productivity gains, and risk reduction achieved by financial firms deploying AI
45
+ Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
46
+ """,
47
+ "writing_editing.prompt": """# Cross-Stone Benchmark Prompt — Writing, Editing & Summarizing
48
+ Write exactly 10 specific, fact-checkable claims about the current state of AI in writing, editing, and document summarization as of 2025-2026.
49
+ Each claim mustDistribute your 10 claims across the following aspects:
50
+ - AI investment levels and adoption rates in the financial services sector (banks, insurers, asset managers)
+ - Performance of AI in fraud detection, credit scoring, and AML (anti-money laundering) systems
51
+ - AI in algorithmic trading and portfolio management: market share, strategies, and performance benchmarks
+ - Regulatory frameworks governing AI in financial services (e.g., EU AI Act, U.S. OCC guidance, SEC rules)
+ - Documented ROI, productivity gains, and risk reduction achieved by financial firms deploying AI
52
+ Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
+ """,
53
+ "writing_editing.prompt": """# Cross-Stone Benchmark Prompt — Writing, Editing & Summarizing
54
+ Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the current state of AI in writing, edtGEach claim mustDistribute your 10 claims across the following aspects:
55
+ - AI investmd - AI investment levels and adoption rates in the finanag-ns- AI investmd - AI investment levels and adoption rates in the finanan - AI in algru- AI in algorithmic trading and portfolio management: market share, strategies, and performancs - Regulatory frameworks governing AI in financial servi.,Format:25Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, d """,
56
+ "writing_editing.prompt": """# Cross-Stone Benchmark Prompt — Writing, Editing & Summarizing
57
+ Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the current state of AIar"writing_editing.prompt": """# Cross-Stone Benchmark Prompt — Writing, Editing & Summarizing
58
+ Write exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI investmd - AI investment levels and adoption rates in the finanag-ns- AI investmd - AI investment levels and adoption rates in the finanan - AI in algru- AI in algorithmic trading and pout"writing_editing.prompt": """# Cross-Stone Benchmark Prompt — Writing, Editing & Summarizing
59
+ Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the current state of AIar"writing_editing.prompt": """# Cross-Stone Benchmark Prompt — Writing, Editing & Summarizing
60
+ Write exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI invests.Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentraWrite exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI investmd - AI investment levels and adoption rates in the finanag-ns- AI investmd -g Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the current state of AIar"writing_editing.prompt": """# Cross-Stone Benchmark Prompt — Writing, Editing & Summarizing
61
+ Write exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI invests.Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable clinWrite exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI invests.Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claimseaWrite exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI invests.Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable clinWrite exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI invests.Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claimseaWrite exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI invests.Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable clinWrite exactly 1f Write else.
62
+ Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named tools), and half should require consulting primary sources, legal records, or detailed technical assessments published in 2024-2025.
63
+ Claims must not be vague generalizations. Each claim should include specific data points, named tools, model versions, legal case names, revenue figures, or named organizations where relevant.
64
+ Distribute your 10 claims across the following aspects:
65
+ - Capabilities and market adoption of leading AI image and video generation tools (e.g., DALL-E 3, Midjourney v6, Sora, Runway Gen-3, Stable Diffusion)
66
+ - AI in music generation, voice cloning, and audio production: leading tools, capabilities, and commercial deployments
67
+ - Commercial deployment of AI-generated media in advertising, film, publishing, and gaming industries
68
+ - Copyright, intellectual property, and compensation disputes involving AI-generated content (specific cases or legislation)
69
+ - ReguDatClaims must not be vague generalizations. Each claim should include specific data points, named tools, model versions, legal case names, revenue figures, or named organizations where relevant.
70
+ Distribute your 10 claims across the following aspects:
71
+ - Capabilities anilDistribute your 10 claims across the following aspects:
72
+ - Capabilities and market adoption of leading AI image and video generation tools (e.g., DALL-E 3, Midjourney v6, Sora, Runway Gen-3, Stable Diffusion)
@@ -0,0 +1,18 @@
1
+ # Cross-Stone Benchmark Prompt -- Research, Search & Q&A
2
+
3
+ Write exactly 10 specific, fact-checkable claims about the current state of AI in research, information retrieval, and question answering as of 2025-2026.
4
+
5
+ Each claim must be a clear, declarative statement that a well-informed analyst could verify -- using publicly available sources such as benchmark leaderboards, academic papers, product documentation, or reputable technology news outlets -- as True, Partially True, Opinion, Partially False, or False.
6
+
7
+ Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported benchmark results or named tools), and half should require consulting primary literature, technical evaluations, or detailed capability assessments published in 2024-2025.
8
+
9
+ Claims must not be vague generalizations. Each claim should include specific benchmark names and scores, named systems, hallucination rates, retrieval accuracy metrics, or named organizations where relevant.
10
+
11
+ Distribute your 10 claims across the following aspects:
12
+ - Performance of leading AI models on established knowledge and reasoning benchmarks (e.g., MMLU, HLE, BrowseComp, SimpleQA)
13
+ - Hallucination rates and factual accuracy of leading AI models in open-domain Q&A tasks
14
+ - AI-powered research and search tools in academic and scientific settings (e.g., Perplexity, Elicit, Semantic Scholar, Google NotebookLM)
15
+ - AI in systematic literature review, evidence synthesis, and meta-analysis workflows
16
+ - Identified failure modes of AI in multi-step reasoning, temporal reasoning, and complex research tasks
17
+
18
+ Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
@@ -0,0 +1,19 @@
1
+ # Cross-Stone Benchmark Prompt — Software Development & Programming
2
+
3
+ Write exactly 10 specific, fact-checkable claims about the current state of AI in software development and computer programming as of 2025–2026.
4
+
5
+ Each claim must be a clear, declarative statement that a well-informed analyst or technical researcher could verify — using publicly available sources such as research papers, vendor reports, official documentation, or reputable news outlets — as True, Partially True, Opinion, Partially False, or False.
6
+
7
+ **Difficulty calibration:** Approximately half of the claims should be verifiable with basic research (widely reported statistics or named tools), and half should require consulting primary sources, empirical studies, or detailed technical documentation published in 2024–2025.
8
+
9
+ **Claims must not be vague generalizations.** Each claim should include specific data points, named tools, version numbers, percentages, benchmark names, or named organizations where relevant.
10
+
11
+ Distribute your 10 claims across the following aspects:
12
+ - Adoption rates and market penetration of AI coding assistants (e.g., GitHub Copilot, Cursor, Claude Code, Gemini Code Assist)
13
+ - Measurable developer productivity impacts: speed, code quality, and defect rates
14
+ - AI's share of code written in enterprise and open-source projects
15
+ - Capabilities and current limitations in automated testing, debugging, and code review
16
+ - Security vulnerabilities, intellectual property concerns, and license compliance issues related to AI-generated code
17
+
18
+ **Format:** Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
19
+
@@ -0,0 +1,18 @@
1
+ # Cross-Stone Benchmark Prompt -- Writing, Editing & Summarizing
2
+
3
+ Write exactly 10 specific, fact-checkable claims about the current state of AI in writing, editing, and document summarization as of 2025-2026.
4
+
5
+ Each claim must be a clear, declarative statement that a well-informed analyst could verify -- using publicly available sources such as usage reports, academic benchmarks, organizational policies, or reputable news outlets -- as True, Partially True, Opinion, Partially False, or False.
6
+
7
+ Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named tools), and half should require consulting primary sources, benchmark studies, or organizational policy documents published in 2024-2025.
8
+
9
+ Claims must not be vague generalizations. Each claim should include specific data points, named tools, benchmark scores, percentages, organizational names, or policy citations where relevant.
10
+
11
+ Distribute your 10 claims across the following aspects:
12
+ - Adoption and usage statistics for AI writing assistants (e.g., ChatGPT, Grammarly, Notion AI, Microsoft Copilot, Claude)
13
+ - Quality benchmarks comparing AI-generated text to human-written content across dimensions such as readability, accuracy, and factual consistency
14
+ - Use of AI in professional writing contexts: legal documents, medical records, journalism, and technical writing
15
+ - Accuracy and limitations of AI-generated content detectors (e.g., GPTZero, Copyleaks, Turnitin AI detection)
16
+ - Regulatory requirements and organizational disclosure policies governing AI-generated content
17
+
18
+ Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.