crossai-cli 0.1.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- cross_ai/__init__.py +0 -0
- cross_ai/ai_error_handler.py +15 -0
- cross_ai/ai_handler.py +22 -0
- cross_ai/ai_url.py +89 -0
- cross_ai/base_handler.py +3 -0
- cross_ai/commands.py +54 -0
- cross_ai/cross_stones/cross-stones-10.json +57 -0
- cross_ai/cross_stones/domains/creative_media.prompt +18 -0
- cross_ai/cross_stones/domains/customer_service.prompt +12 -0
- cross_ai/cross_stones/domains/data_analytics.prompt +18 -0
- cross_ai/cross_stones/domains/education_learning.prompt +18 -0
- cross_ai/cross_stones/domains/finance_business.prompt +18 -0
- cross_ai/cross_stones/domains/healthcare_medical.prompt +18 -0
- cross_ai/cross_stones/domains/marketing_content.prompt +72 -0
- cross_ai/cross_stones/domains/research_qa.prompt +18 -0
- cross_ai/cross_stones/domains/software_development.prompt +19 -0
- cross_ai/cross_stones/domains/writing_editing.prompt +18 -0
- cross_ai/discourse.py +192 -0
- cross_ai/mmd_branding.py +42 -0
- cross_ai/mmd_data_analysis.py +382 -0
- cross_ai/mmd_for_speaking.py +225 -0
- cross_ai/mmd_plot.py +121 -0
- cross_ai/mmd_process_report.py +285 -0
- cross_ai/mmd_single_key.py +188 -0
- cross_ai/mmd_startup.py +69 -0
- cross_ai/mmd_util.py +234 -0
- cross_ai/mmd_voice.py +163 -0
- cross_ai/mmd_web_server.py +88 -0
- cross_ai/st-admin.py +791 -0
- cross_ai/st-analyze.py +441 -0
- cross_ai/st-bang.py +554 -0
- cross_ai/st-cat.py +122 -0
- cross_ai/st-cross.py +749 -0
- cross_ai/st-domain.py +466 -0
- cross_ai/st-edit.py +368 -0
- cross_ai/st-fact.py +657 -0
- cross_ai/st-fetch.py +359 -0
- cross_ai/st-find.py +375 -0
- cross_ai/st-fix.py +1926 -0
- cross_ai/st-gen.py +230 -0
- cross_ai/st-heatmap.py +394 -0
- cross_ai/st-ls.py +270 -0
- cross_ai/st-man.py +247 -0
- cross_ai/st-merge.py +841 -0
- cross_ai/st-new.py +169 -0
- cross_ai/st-plot.py +471 -0
- cross_ai/st-post.py +334 -0
- cross_ai/st-prep.py +242 -0
- cross_ai/st-print.py +497 -0
- cross_ai/st-read.py +155 -0
- cross_ai/st-rm.py +176 -0
- cross_ai/st-speak.py +128 -0
- cross_ai/st-speed.py +945 -0
- cross_ai/st-stones.py +1435 -0
- cross_ai/st-verdict.py +538 -0
- cross_ai/st-voice.py +237 -0
- cross_ai/st.py +503 -0
- cross_ai/template/default.prompt +10 -0
- crossai_cli-0.1.0.dist-info/METADATA +327 -0
- crossai_cli-0.1.0.dist-info/RECORD +64 -0
- crossai_cli-0.1.0.dist-info/WHEEL +5 -0
- crossai_cli-0.1.0.dist-info/entry_points.txt +30 -0
- crossai_cli-0.1.0.dist-info/licenses/LICENSE +26 -0
- crossai_cli-0.1.0.dist-info/top_level.txt +1 -0
cross_ai/__init__.py
ADDED
|
File without changes
|
|
@@ -0,0 +1,15 @@
|
|
|
1
|
+
# ai_error_handler.py — compatibility shim
|
|
2
|
+
# Source of truth: cross-ai-core package (cross_ai_core.ai_error_handler)
|
|
3
|
+
from cross_ai_core.ai_error_handler import * # noqa: F401, F403
|
|
4
|
+
from cross_ai_core.ai_error_handler import ( # explicit for IDE / type checkers
|
|
5
|
+
handle_api_error,
|
|
6
|
+
is_quota_error,
|
|
7
|
+
is_rate_limit_error,
|
|
8
|
+
is_transient_error,
|
|
9
|
+
get_error_type,
|
|
10
|
+
retry_with_backoff,
|
|
11
|
+
CrossAIError,
|
|
12
|
+
QuotaExceededError,
|
|
13
|
+
RateLimitError,
|
|
14
|
+
TransientError,
|
|
15
|
+
)
|
cross_ai/ai_handler.py
ADDED
|
@@ -0,0 +1,22 @@
|
|
|
1
|
+
# ai_handler.py — compatibility shim
|
|
2
|
+
# Source of truth: cross-ai-core package (cross_ai_core.ai_handler)
|
|
3
|
+
# This file exists so st-*.py files and tests can continue to use:
|
|
4
|
+
# from ai_handler import process_prompt, get_content, ...
|
|
5
|
+
from cross_ai_core.ai_handler import * # noqa: F401, F403
|
|
6
|
+
from cross_ai_core.ai_handler import ( # explicit for IDE / type checkers
|
|
7
|
+
AI_HANDLER_REGISTRY,
|
|
8
|
+
AI_LIST,
|
|
9
|
+
AIResponse,
|
|
10
|
+
_API_KEY_ENV_VARS, # private — needed by tests
|
|
11
|
+
check_api_key,
|
|
12
|
+
get_ai_list,
|
|
13
|
+
get_ai_make,
|
|
14
|
+
get_ai_model,
|
|
15
|
+
get_content,
|
|
16
|
+
get_data_content,
|
|
17
|
+
get_data_title,
|
|
18
|
+
get_default_ai,
|
|
19
|
+
get_usage,
|
|
20
|
+
process_prompt,
|
|
21
|
+
put_content,
|
|
22
|
+
)
|
cross_ai/ai_url.py
ADDED
|
@@ -0,0 +1,89 @@
|
|
|
1
|
+
# Sorry, no AI here
|
|
2
|
+
import os
|
|
3
|
+
import json
|
|
4
|
+
import hashlib
|
|
5
|
+
import requests
|
|
6
|
+
import sys
|
|
7
|
+
|
|
8
|
+
AI_MAKE = "url"
|
|
9
|
+
AI_MODEL = "bs4"
|
|
10
|
+
|
|
11
|
+
|
|
12
|
+
def get_url_cached_response(tweet_id, verbose=False, use_cache=False):
    """Fetch a tweet from the X (Twitter) v2 API, optionally via a disk cache.

    Args:
        tweet_id: ID interpolated into
            ``https://api.twitter.com/2/tweets/{tweet_id}``.
        verbose: When true, print cache hit/miss and cache-write progress.
        use_cache: When true, look the response up under
            ``~/.cross_api_cache`` first and store a freshly fetched
            response there.

    Returns:
        A ``(json_response, was_cached)`` tuple. ``json_response`` is the
        decoded JSON body; ``was_cached`` is ``True`` only when the data
        was read from the cache file.

    Raises:
        SystemExit: With status 1 when, on the caching path, the API
            answers with a status code other than 200.
    """
    url = f"https://api.twitter.com/2/tweets/{tweet_id}"
    headers = get_url_headers()

    if not use_cache:
        response = requests.get(url, headers=headers)
        # A requests.Response object is not JSON-serializable, so decode the
        # body directly instead of round-tripping the object through json.
        # As before, this path does not inspect the HTTP status code.
        return response.json(), False  # Not cached

    # Hash everything that identifies the request to get a stable file name.
    param = {
        "tweet_id": tweet_id,
        "headers": headers,
        "url": url,
    }
    param_str = json.dumps(param, sort_keys=True)
    md5_hash = hashlib.md5(param_str.encode('utf-8')).hexdigest()

    # Construct the cache file path
    cache_dir = os.path.expanduser("~/.cross_api_cache")
    cache_file = os.path.join(cache_dir, f"{md5_hash}.json")

    # Serve from the cache when a matching file already exists.
    if os.path.exists(cache_file):
        if verbose:
            print(f"api_cache: Using cache_file: {cache_file}")
        with open(cache_file, 'r', encoding='utf-8') as f:
            return json.load(f), True  # Cached

    if verbose:
        print("api_cache: cache miss, submitting API request")

    # Not in cache: fetch the response. The status lives on an attribute;
    # a Response object cannot be subscripted.
    response = requests.get(url, headers=headers)
    if (status_code := response.status_code) != 200:
        print(f"x.com response failed: {status_code}")
        sys.exit(1)
    json_response = response.json()

    # Save to cache. exist_ok guards against another process creating the
    # directory between the existence check and makedirs().
    if not os.path.exists(cache_dir):
        os.makedirs(cache_dir, exist_ok=True)
        if verbose:
            print(f"api_cache: api_cache/ dir created: {cache_dir}")

    # Writing the cache is best-effort: report the failure but still return
    # the freshly fetched data.
    try:
        with open(cache_file, 'w', encoding='utf-8') as f:
            json.dump(json_response, f)
        if verbose:
            print(f"api_cache: file created: {cache_file}")
    except (OSError, TypeError, ValueError) as e:
        print(f"api_cache: file write error: {str(e)}")

    return json_response, False  # Fresh API call, not cached
|
|
69
|
+
|
|
70
|
+
|
|
71
|
+
def get_url_headers():
    """Return the HTTP headers used for API requests.

    The ``Authorization`` value is ``"Bearer "`` followed by the contents of
    the ``X_COM_BEARER_TOKEN`` environment variable. No check is made that
    the variable is set; an unset variable is formatted as ``None``.
    """
    return {"Authorization": f"Bearer {os.environ.get('X_COM_BEARER_TOKEN')}"}
|
|
75
|
+
|
|
76
|
+
|
|
77
|
+
def get_title(data):
    """Return the value stored under ``"title"`` in *data*, or ``None`` if absent."""
    return data.get("title")
|
|
80
|
+
|
|
81
|
+
|
|
82
|
+
def get_story(data):
    """Return the value stored under ``"text"`` in *data*, or ``None`` if absent."""
    return data.get("text")
|
|
85
|
+
|
|
86
|
+
|
|
87
|
+
def get_ai_tag():
    """Return the ``cross:`` tag naming this module's make and model.

    The result is two newlines, the literal ``cross:``, and a JSON object
    with the keys ``make`` and ``model`` taken from the module constants
    ``AI_MAKE`` and ``AI_MODEL``.
    """
    tag = {"make": AI_MAKE, "model": AI_MODEL}
    return "\n\ncross:" + json.dumps(tag)
|
cross_ai/base_handler.py
ADDED
cross_ai/commands.py
ADDED
|
@@ -0,0 +1,54 @@
|
|
|
1
|
+
"""
|
|
2
|
+
commands.py — Entry-point dispatch for pyproject.toml [project.scripts].
|
|
3
|
+
pip generates a thin wrapper that imports and calls each function here;
|
|
4
|
+
runpy executes the st-*.py file directly so hyphens in filenames are never
|
|
5
|
+
treated as Python identifiers.
|
|
6
|
+
"""
|
|
7
|
+
import os
|
|
8
|
+
import runpy
|
|
9
|
+
import sys
|
|
10
|
+
|
|
11
|
+
# Absolute path of the directory that contains this module.
_HERE = os.path.dirname(os.path.abspath(__file__))

# The st-*.py scripts rely on bare module imports
# (e.g. `from mmd_startup import require_config`). Running a script file
# directly puts its directory at sys.path[0]; runpy.run_path() does not,
# so the directory is added here, once, if it is not already present.
if _HERE not in sys.path:
    sys.path.insert(0, _HERE)
|
|
19
|
+
|
|
20
|
+
|
|
21
|
+
def _run(name: str) -> None:
    """Execute ``<name>.py`` from this module's directory as ``__main__``.

    Args:
        name: Script file name without the ``.py`` suffix; hyphens are
            allowed because the file is run by path, not imported.
    """
    script_path = os.path.join(_HERE, f"{name}.py")
    runpy.run_path(script_path, run_name="__main__")
|
|
23
|
+
|
|
24
|
+
|
|
25
|
+
def st():
    """Run ``st.py`` as ``__main__``."""
    _run("st")


def st_admin():
    """Run ``st-admin.py`` as ``__main__``."""
    _run("st-admin")


def st_analyze():
    """Run ``st-analyze.py`` as ``__main__``."""
    _run("st-analyze")


def st_bang():
    """Run ``st-bang.py`` as ``__main__``."""
    _run("st-bang")


def st_cat():
    """Run ``st-cat.py`` as ``__main__``."""
    _run("st-cat")


def st_cross():
    """Run ``st-cross.py`` as ``__main__``."""
    _run("st-cross")


def st_domain():
    """Run ``st-domain.py`` as ``__main__``."""
    _run("st-domain")


def st_edit():
    """Run ``st-edit.py`` as ``__main__``."""
    _run("st-edit")


def st_fact():
    """Run ``st-fact.py`` as ``__main__``."""
    _run("st-fact")


def st_fetch():
    """Run ``st-fetch.py`` as ``__main__``."""
    _run("st-fetch")


def st_find():
    """Run ``st-find.py`` as ``__main__``."""
    _run("st-find")


def st_fix():
    """Run ``st-fix.py`` as ``__main__``."""
    _run("st-fix")


def st_gen():
    """Run ``st-gen.py`` as ``__main__``."""
    _run("st-gen")


def st_heatmap():
    """Run ``st-heatmap.py`` as ``__main__``."""
    _run("st-heatmap")


def st_ls():
    """Run ``st-ls.py`` as ``__main__``."""
    _run("st-ls")


def st_man():
    """Run ``st-man.py`` as ``__main__``."""
    _run("st-man")


def st_merge():
    """Run ``st-merge.py`` as ``__main__``."""
    _run("st-merge")


def st_new():
    """Run ``st-new.py`` as ``__main__``."""
    _run("st-new")


def st_plot():
    """Run ``st-plot.py`` as ``__main__``."""
    _run("st-plot")


def st_post():
    """Run ``st-post.py`` as ``__main__``."""
    _run("st-post")


def st_prep():
    """Run ``st-prep.py`` as ``__main__``."""
    _run("st-prep")


def st_print():
    """Run ``st-print.py`` as ``__main__``."""
    _run("st-print")


def st_read():
    """Run ``st-read.py`` as ``__main__``."""
    _run("st-read")


def st_rm():
    """Run ``st-rm.py`` as ``__main__``."""
    _run("st-rm")


def st_speak():
    """Run ``st-speak.py`` as ``__main__``."""
    _run("st-speak")


def st_speed():
    """Run ``st-speed.py`` as ``__main__``."""
    _run("st-speed")


def st_stones():
    """Run ``st-stones.py`` as ``__main__``."""
    _run("st-stones")


def st_verdict():
    """Run ``st-verdict.py`` as ``__main__``."""
    _run("st-verdict")


def st_voice():
    """Run ``st-voice.py`` as ``__main__``."""
    _run("st-voice")
|
|
54
|
+
|
|
@@ -0,0 +1,57 @@
|
|
|
1
|
+
{
|
|
2
|
+
"id": "cross-stones-10",
|
|
3
|
+
"description": "Standard 10-domain Cross-Stones benchmark set. Locked params ensure scores are directly comparable across runs over time.",
|
|
4
|
+
"n_claims": 10,
|
|
5
|
+
"max_fact_score": 200,
|
|
6
|
+
"domains_dir": "domains",
|
|
7
|
+
"domains": [
|
|
8
|
+
{
|
|
9
|
+
"id": "software_development",
|
|
10
|
+
"name": "Software Development & Programming"
|
|
11
|
+
},
|
|
12
|
+
{
|
|
13
|
+
"id": "customer_service",
|
|
14
|
+
"name": "Customer Service & Support"
|
|
15
|
+
},
|
|
16
|
+
{
|
|
17
|
+
"id": "marketing_content",
|
|
18
|
+
"name": "Marketing & Content Creation"
|
|
19
|
+
},
|
|
20
|
+
{
|
|
21
|
+
"id": "education_learning",
|
|
22
|
+
"name": "Education & Learning"
|
|
23
|
+
},
|
|
24
|
+
{
|
|
25
|
+
"id": "data_analytics",
|
|
26
|
+
"name": "Data Analytics & Business Intelligence"
|
|
27
|
+
},
|
|
28
|
+
{
|
|
29
|
+
"id": "healthcare_medical",
|
|
30
|
+
"name": "Healthcare & Medical Analysis"
|
|
31
|
+
},
|
|
32
|
+
{
|
|
33
|
+
"id": "finance_business",
|
|
34
|
+
"name": "Finance & Business Decision Making"
|
|
35
|
+
},
|
|
36
|
+
{
|
|
37
|
+
"id": "writing_editing",
|
|
38
|
+
"name": "Writing, Editing & Summarizing"
|
|
39
|
+
},
|
|
40
|
+
{
|
|
41
|
+
"id": "research_qa",
|
|
42
|
+
"name": "Research, Search & Q&A"
|
|
43
|
+
},
|
|
44
|
+
{
|
|
45
|
+
"id": "creative_media",
|
|
46
|
+
"name": "Creative Media (Images, Video, Audio)"
|
|
47
|
+
}
|
|
48
|
+
],
|
|
49
|
+
"snapshots": [],
|
|
50
|
+
"speed_baseline": {
|
|
51
|
+
"gen_seconds": 20.07,
|
|
52
|
+
"fc_seconds": 91.87,
|
|
53
|
+
"total_seconds": 111.94,
|
|
54
|
+
"recorded_date": "2026-03-27",
|
|
55
|
+
"notes": "Baseline recorded 2026-03-27 \u2014 average across all AI providers. Future runs faster than 111.9s total will have speed_ratio > 1.0 and cross_stone_score may exceed 1.0, reflecting genuine improvement over the 2026 benchmark era."
|
|
56
|
+
}
|
|
57
|
+
}
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
# Cross-Stone Benchmark Prompt -- Creative Media (Images, Video, Audio)
|
|
2
|
+
|
|
3
|
+
Write exactly 10 specific, fact-checkable claims about the current state of AI in creative media production -- including image generation, video synthesis, music composition, and audio production -- as of 2025-2026.
|
|
4
|
+
|
|
5
|
+
Each claim must be a clear, declarative statement that a well-informed analyst could verify -- using publicly available sources such as company announcements, legal filings, industry reports, or reputable technology and entertainment news outlets -- as True, Partially True, Opinion, Partially False, or False.
|
|
6
|
+
|
|
7
|
+
Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named tools), and half should require consulting primary sources, legal records, or detailed technical assessments published in 2024-2025.
|
|
8
|
+
|
|
9
|
+
Claims must not be vague generalizations. Each claim should include specific data points, named tools, model versions, legal case names, revenue figures, or named organizations where relevant.
|
|
10
|
+
|
|
11
|
+
Distribute your 10 claims across the following aspects:
|
|
12
|
+
- Capabilities and market adoption of leading AI image and video generation tools (e.g., DALL-E 3, Midjourney v6, Sora, Runway Gen-3, Stable Diffusion)
|
|
13
|
+
- AI in music generation, voice cloning, and audio production: leading tools, capabilities, and commercial deployments
|
|
14
|
+
- Commercial deployment of AI-generated media in advertising, film, publishing, and gaming industries
|
|
15
|
+
- Copyright, intellectual property, and compensation disputes involving AI-generated content (specific cases or legislation)
|
|
16
|
+
- Regulatory responses, platform policies, and industry standards addressing AI-generated deepfakes and synthetic media
|
|
17
|
+
|
|
18
|
+
Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
|
|
@@ -0,0 +1,12 @@
|
|
|
1
|
+
# Cross-Stone Benchmark Prompt — Customer Service & Support
|
|
2
|
+
Write exactly 10 specific, fact-checkable claims about the current state of AI in customer service and support automation as of 2025–2026.
|
|
3
|
+
Each claim must be a clear, declarative statement that a well-informed analyst could verify — using publicly available sources such as industry surveys, vendor case studies, analyst reports, or reputable news outlets — as True, Partially True, Opinion, Partially False, or False.
|
|
4
|
+
**Difficulty calibration:** Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed performance data published in 2024–2025.
|
|
5
|
+
**Claims must not be vague generalizations.** Each claim should include specific data points, named platforms, percentages, benchmark metrics, or named organizations where relevant.
|
|
6
|
+
Distribute your 10 claims across the following aspects:
|
|
7
|
+
- Automation and deflection rates for AI-powered chatbots and virtual agents across industries
|
|
8
|
+
- Customer satisfaction (CSAT) and first-contact resolution quality compared to human agents
|
|
9
|
+
- Adoption rates across specific industries (retail, telecom, banking, healthcare)
|
|
10
|
+
- Integration of large language models (LLMs) into contact center platforms (e.g., Salesforce Einstein, Zendesk AI, AWS Connect)
|
|
11
|
+
- Documented cost savings, ROI metrics, and workforce impact reported by organizations deploying AI in customer service
|
|
12
|
+
**Format:** Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
# Cross-Stone Benchmark Prompt -- Data Analytics & Business Intelligence
|
|
2
|
+
|
|
3
|
+
Write exactly 10 specific, fact-checkable claims about the current state of AI in data analytics and business intelligence as of 2025-2026.
|
|
4
|
+
|
|
5
|
+
Each claim must be a clear, declarative statement that a well-informed analyst could verify -- using publicly available sources such as vendor documentation, industry reports, academic studies, or reputable news outlets -- as True, Partially True, Opinion, Partially False, or False.
|
|
6
|
+
|
|
7
|
+
Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed technical documentation published in 2024-2025.
|
|
8
|
+
|
|
9
|
+
Claims must not be vague generalizations. Each claim should include specific data points, named tools, percentages, benchmark results, or named organizations where relevant.
|
|
10
|
+
|
|
11
|
+
Distribute your 10 claims across the following aspects:
|
|
12
|
+
- Adoption of AI and ML capabilities in major business intelligence platforms (e.g., Tableau, Microsoft Power BI, Looker, Snowflake Cortex)
|
|
13
|
+
- Impact of large language models on natural-language querying and self-service analytics
|
|
14
|
+
- AI-driven anomaly detection and predictive analytics performance in enterprise settings
|
|
15
|
+
- Accuracy, reliability, and hallucination risks in AI-generated data insights vs. human analysts
|
|
16
|
+
- Data governance, privacy, and explainability challenges in AI-driven analytics deployments
|
|
17
|
+
|
|
18
|
+
Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
# Cross-Stone Benchmark Prompt -- Education & Learning
|
|
2
|
+
|
|
3
|
+
Write exactly 10 specific, fact-checkable claims about the current state of AI in education and personalized learning as of 2025-2026.
|
|
4
|
+
|
|
5
|
+
Each claim must be a clear, declarative statement that a well-informed analyst could verify -- using publicly available sources such as academic research, institutional reports, or reputable news outlets -- as True, Partially True, Opinion, Partially False, or False.
|
|
6
|
+
|
|
7
|
+
Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed institutional data published in 2024-2025.
|
|
8
|
+
|
|
9
|
+
Claims must not be vague generalizations. Each claim should include specific data points, named platforms, percentages, study findings, or named institutions where relevant.
|
|
10
|
+
|
|
11
|
+
Distribute your 10 claims across the following aspects:
|
|
12
|
+
- Student and educator adoption rates of generative AI tools (e.g., ChatGPT, Khanmigo, Duolingo, Coursera AI)
|
|
13
|
+
- Measured learning outcomes from AI-assisted instruction or tutoring systems
|
|
14
|
+
- Institutional and government policies on AI use in classrooms and assessments
|
|
15
|
+
- AI-powered adaptive learning platforms and the evidence base for their effectiveness
|
|
16
|
+
- Academic integrity concerns, bias, and equity issues in AI-powered education
|
|
17
|
+
|
|
18
|
+
Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
# Cross-Stone Benchmark Prompt -- Finance & Business Decision Making
|
|
2
|
+
|
|
3
|
+
Write exactly 10 specific, fact-checkable claims about the current state of AI in financial services, risk management, and business decision-making as of 2025-2026.
|
|
4
|
+
|
|
5
|
+
Each claim must be a clear, declarative statement that a well-informed analyst could verify -- using publicly available sources such as regulatory filings, industry surveys, academic research, or reputable financial news outlets -- as True, Partially True, Opinion, Partially False, or False.
|
|
6
|
+
|
|
7
|
+
Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named systems), and half should require consulting primary sources, regulatory documents, or detailed financial performance data published in 2024-2025.
|
|
8
|
+
|
|
9
|
+
Claims must not be vague generalizations. Each claim should include specific data points, named platforms, dollar figures, performance metrics, regulatory citations, or named institutions where relevant.
|
|
10
|
+
|
|
11
|
+
Distribute your 10 claims across the following aspects:
|
|
12
|
+
- AI investment levels and adoption rates in the financial services sector (banks, insurers, asset managers)
|
|
13
|
+
- Performance of AI in fraud detection, credit scoring, and AML (anti-money laundering) systems
|
|
14
|
+
- AI in algorithmic trading and portfolio management: market share, strategies, and performance benchmarks
|
|
15
|
+
- Regulatory frameworks governing AI in financial services (e.g., EU AI Act, U.S. OCC guidance, SEC rules)
|
|
16
|
+
- Documented ROI, productivity gains, and risk reduction achieved by financial firms deploying AI
|
|
17
|
+
|
|
18
|
+
Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
# Cross-Stone Benchmark Prompt -- Healthcare & Medical Analysis
|
|
2
|
+
|
|
3
|
+
Write exactly 10 specific, fact-checkable claims about the current state of AI in healthcare, medical diagnostics, and clinical decision support as of 2025-2026.
|
|
4
|
+
|
|
5
|
+
Each claim must be a clear, declarative statement that a well-informed analyst could verify -- using publicly available sources such as peer-reviewed journals, FDA databases, hospital system reports, or reputable health news outlets -- as True, Partially True, Opinion, Partially False, or False.
|
|
6
|
+
|
|
7
|
+
Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named tools), and half should require consulting primary clinical literature, regulatory filings, or detailed health system data published in 2024-2025.
|
|
8
|
+
|
|
9
|
+
Claims must not be vague generalizations. Each claim should include specific data points, named systems, FDA clearance details, clinical trial results, percentages, or named institutions where relevant.
|
|
10
|
+
|
|
11
|
+
Distribute your 10 claims across the following aspects:
|
|
12
|
+
- FDA-cleared or CE-marked AI medical devices: cumulative count, approval trends, and leading categories (radiology, pathology, cardiology)
|
|
13
|
+
- Clinical performance of AI in medical imaging compared to human specialists (sensitivity, specificity, AUC metrics)
|
|
14
|
+
- AI in drug discovery and clinical trial design: timelines, cost reductions, and named examples
|
|
15
|
+
- Deployment and outcomes of AI clinical decision support systems in hospital settings
|
|
16
|
+
- Regulatory, liability, bias, and health equity challenges in medical AI adoption
|
|
17
|
+
|
|
18
|
+
Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
|
|
@@ -0,0 +1,72 @@
|
|
|
1
|
+
# Cross-Stone Benchmark Prompt — Marketing & Content Creation
|
|
2
|
+
Write exactly 10 specific, fact-checkable claims about the current state of AI in marketing and content creation as of 2025–2026.
|
|
3
|
+
Each claim must be a clear, declarative statement that a well-informed analyst could verify — using publicly available sources such as industry surveys, vendor reports, academic studies, or reputable news outlets — as True, Partially True, Opinion, Partially False, or False.
|
|
4
|
+
**Difficulty calibration:** Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed performance data published in 2024–2025.
|
|
5
|
+
**Claims must not be vague generalizations.** Each claim should include specific data points, named platforms, percentages, benchmark metrics, or named organizations where relevant.
|
|
6
|
+
Write exactly 10 specific, AIWrite exactly 10 specific, fact-checkable claims about the cururEach claim must be a clear, declarative statement that a well-informed analyst could verify — using publicly available sources sdi**Difficulty calibration:** Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed performance data published in 2024–2025.
|
|
7
|
+
*AI**Claims must not be vague generalizations.** Each claim should include specific data points, named platforms, percentages, benchmark metriccat > /Users/Matt/github/cross-internal/st-stones/template/education_learning.prompt << 'EOF'
|
|
8
|
+
# Cross-Stone Benchmark Prompt — Education & Learning
|
|
9
|
+
Write exactly 10 specific, fact-checkable claims about the current state of AI in education and personalized learning as of 2025–2026.
|
|
10
|
+
Each claim must be a clear, declarative statement that a well-informed analyst could verify — using publicly available sources such as academic research, institutional reports, or reputable news outlets — as True, Partially True, Opinion, Partially False, or False.
|
|
11
|
+
Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed institutional data published in 2024-2025.
|
|
12
|
+
Claims must not be vague generalizations. Each claim should include specific data points, named platforms, percentages, study findings, or named institutions where relevant.
|
|
13
|
+
Distribute your 10 c# Cross-Stone Benchmark Prompt — Education & Learning
|
|
14
|
+
Write exactly 10 specific, fact-checooWrite exactly 10 specific, fact-checkable claims aboutMeEach claim must be a clear, declarative statement that a well-informed analyst could verify — using publicly available sources such amsDifficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed institutional data published in 2024-2n Claims must not be vague generalizationpython3 << 'PYEOF'
|
|
15
|
+
import os
|
|
16
|
+
base = "/Users/Matt/github/cross-internal/st-stones/template"
|
|
17
|
+
files = {
|
|
18
|
+
"education_learning.prompt": """# Cross-Stone Benchmark Prompt — Education & Learning
|
|
19
|
+
Write exactly 10 specific, fact-checkable claims about the current state of AI in education and personalized learning as of 2025-2026.
|
|
20
|
+
Each claim must be a clear, declarative statement that a well-informed analyst could verify — using publicly available sources such as academic research, institutional reports, or reputable news outlets — as True, Partially True, Opinion, Partially False, or False.
|
|
21
|
+
Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed institutional data published in 2024-2025.
|
|
22
|
+
Claims must not be vague generalizations. Each claim should include specific data points, named platforms, percentages, study findings, or named institutions where relevant.
|
|
23
|
+
base = Dibase = " yfiles = {
|
|
24
|
+
"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable claims about the current state of AI in educasEach claim must be a clear, declarative statement that a well-informed analyst could verify — using publicly available sources suchmsDifficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named platforms), and half should require consulting primary sources, empirical studies, or detailed institutional data published in 2024-2n Claims must not be vague generalizations. Each claim should include specific data points, named platforms, percentages, study findings, or named institutionsimport os
|
|
25
|
+
base = Dibase = " yfiles = {
|
|
26
|
+
"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dibase = " yfiles = {
|
|
27
|
+
"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable claims about the current state on,"education_learning.prompt" sbase = Dibase = " yfiles = {
|
|
28
|
+
"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dibase = " yfiles = {
|
|
29
|
+
"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable claims about the current state on,"education_learning.prompt" sbase = Dibase = " yfiles = {
|
|
30
|
+
"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dibase = " yfiles = {
|
|
31
|
+
"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable claims about the current state on,"education_learning.prompt" sbase = Dibase = " yfiles = {
|
|
32
|
+
"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dib L"education_learning.prompt"Im"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable y "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dibase = " yfiles = {
|
|
33
|
+
"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,, "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dibase = " yfiles = {
|
|
34
|
+
"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable d "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dib L"education_learning.prompt"Im"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly jo"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,, "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dibase = " yfiles = {
|
|
35
|
+
"education_learning.promptar"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable d "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dib L"education_lear
|
|
36
|
+
D"education_learning.promptar"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable d "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dib L"education_lear
|
|
37
|
+
D"education_learning.promptar"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable d "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dib L"education_lear
|
|
38
|
+
D"education_learning.promptar"edummD"education_learning.promptar"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable d "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dib L"education_le tD"education_learning.promptar"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable d "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly20base = Dib L"education_leaasD"education_learning.promptar"edummD"education_learning.promptar"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific,ly"education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite exactly 10 specific, fact-checkable d "education_learning.prompt": """# Cross-Stone Bencuc"educatiptWrite ce metrics, regulatory citations, or named institutions where relevant.
|
|
39
|
+
Distribute your 10 claims across the following aspects:
|
|
40
|
+
- AI investment levels and adoption rates in the financial services sector (banks, insurers, asset managers)
|
|
41
|
+
- Performance of AI in fraud detection, credit scoring, and AML (anti-money laundering) systems
|
|
42
|
+
- AI in algorithmic trading and portfolio management: market share, strategies, and performance benchmarks
|
|
43
|
+
- Regulatory frameworks governing AI in financial services (e.g., EU AI Act, U.S. OCC guidance, SEC rules)
|
|
44
|
+
- Documented ROI, productivity gains, and risk reduction achieved by financial firms deploying AI
|
|
45
|
+
Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
|
|
46
|
+
""",
|
|
47
|
+
"writing_editing.prompt": """# Cross-Stone Benchmark Prompt — Writing, Editing & Summarizing
|
|
48
|
+
Write exactly 10 specific, fact-checkable claims about the current state of AI in writing, editing, and document summarization as of 2025-2026.
|
|
49
|
+
Each claim mustDistribute your 10 claims across the following aspects:
|
|
50
|
+
- AI investmd - AI investment levels and adoption rates in the finanag- Performance of AI in fraud detection, credit scoring, and AML (anti-money laundering) systems
|
|
51
|
+
- AI in algru- AI in algorithmic trading and portfolio management: market share, strategies, and performancs - Regulatory frameworks governing AI in financial services (e.g., EU AI Act, U.S. OCC guidance, SEC rulesui- Documented ROI, productivity gains, and risk reduction achieved by financial firms deploying AI
|
|
52
|
+
Format:25Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, d """,
|
|
53
|
+
"writing_editing.prompt": """# Cross-Stone Benchmark Prompt — Writing, Editing & Summarizing
|
|
54
|
+
Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the current state of AI in writing, edtGEach claim mustDistribute your 10 claims across the following aspects:
|
|
55
|
+
- AI investmd - AI investment levels and adoption rates in the finanag-ns- AI investmd - AI investment levels and adoption rates in the finanan - AI in algru- AI in algorithmic trading and portfolio management: market share, strategies, and performancs - Regulatory frameworks governing AI in financial servi.,Format:25Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, d """,
|
|
56
|
+
"writing_editing.prompt": """# Cross-Stone Benchmark Prompt — Writing, Editing & Summarizing
|
|
57
|
+
Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the current state of AIar"writing_editing.prompt": """# Cross-Stone Benchmark Prompt — Writing, Editing & Summarizing
|
|
58
|
+
Write exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI investmd - AI investment levels and adoption rates in the finanag-ns- AI investmd - AI investment levels and adoption rates in the finanan - AI in algru- AI in algorithmic trading and pout"writing_editing.prompt": """# Cross-Stone Benchmark Prompt — Writing, Editing & Summarizing
|
|
59
|
+
Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the current state of AIar"writing_editing.prompt": """# Cross-Stone Benchmark Prompt — Writing, Editing & Summarizing
|
|
60
|
+
Write exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI invests.Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentraWrite exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI investmd - AI investment levels and adoption rates in the finanag-ns- AI investmd -g Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the current state of AIar"writing_editing.prompt": """# Cross-Stone Benchmark Prompt — Writing, Editing & Summarizing
|
|
61
|
+
Write exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI invests.Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable clinWrite exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI invests.Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claimseaWrite exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI invests.Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable clinWrite exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI invests.Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claimseaWrite exactly 1f Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable claims about the currentt - AI invests.Write exactly 10 spes "wrosWrite exactly 10 specific, fact-checkable clinWrite exactly 1f Write else.
|
|
62
|
+
Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named tools), and half should require consulting primary sources, legal records, or detailed technical assessments published in 2024-2025.
|
|
63
|
+
Claims must not be vague generalizations. Each claim should include specific data points, named tools, model versions, legal case names, revenue figures, or named organizations where relevant.
|
|
64
|
+
Distribute your 10 claims across the following aspects:
|
|
65
|
+
- Capabilities and market adoption of leading AI image and video generation tools (e.g., DALL-E 3, Midjourney v6, Sora, Runway Gen-3, Stable Diffusion)
|
|
66
|
+
- AI in music generation, voice cloning, and audio production: leading tools, capabilities, and commercial deployments
|
|
67
|
+
- Commercial deployment of AI-generated media in advertising, film, publishing, and gaming industries
|
|
68
|
+
- Copyright, intellectual property, and compensation disputes involving AI-generated content (specific cases or legislation)
|
|
69
|
+
- ReguDatClaims must not be vague generalizations. Each claim should include specific data points, named tools, model versions, legal case names, revenue figures, or named organizations where relevant.
|
|
70
|
+
Distribute your 10 claims across the following aspects:
|
|
71
|
+
Distribute your 10 claims across the following aspects:
|
|
72
|
+
- Capabilities and market adoption of leading AI image and video generation tools (e.g., DALL-E 3, Midjourney v6, Spython3 /Users/Matt/github/cross-internal/st-stones/create_prompts.py
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
# Cross-Stone Benchmark Prompt -- Research, Search & Q&A
|
|
2
|
+
|
|
3
|
+
Write exactly 10 specific, fact-checkable claims about the current state of AI in research, information retrieval, and question answering as of 2025-2026.
|
|
4
|
+
|
|
5
|
+
Each claim must be a clear, declarative statement that a well-informed analyst could verify -- using publicly available sources such as benchmark leaderboards, academic papers, product documentation, or reputable technology news outlets -- as True, Partially True, Opinion, Partially False, or False.
|
|
6
|
+
|
|
7
|
+
Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported benchmark results or named tools), and half should require consulting primary literature, technical evaluations, or detailed capability assessments published in 2024-2025.
|
|
8
|
+
|
|
9
|
+
Claims must not be vague generalizations. Each claim should include specific benchmark names and scores, named systems, hallucination rates, retrieval accuracy metrics, or named organizations where relevant.
|
|
10
|
+
|
|
11
|
+
Distribute your 10 claims across the following aspects:
|
|
12
|
+
- Performance of leading AI models on established knowledge and reasoning benchmarks (e.g., MMLU, HLE, BrowseComp, SimpleQA)
|
|
13
|
+
- Hallucination rates and factual accuracy of leading AI models in open-domain Q&A tasks
|
|
14
|
+
- AI-powered research and search tools in academic and scientific settings (e.g., Perplexity, Elicit, Semantic Scholar, Google NotebookLM)
|
|
15
|
+
- AI in systematic literature review, evidence synthesis, and meta-analysis workflows
|
|
16
|
+
- Identified failure modes of AI in multi-step reasoning, temporal reasoning, and complex research tasks
|
|
17
|
+
|
|
18
|
+
Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
|
|
@@ -0,0 +1,19 @@
|
|
|
1
|
+
# Cross-Stone Benchmark Prompt — Software Development & Programming
|
|
2
|
+
|
|
3
|
+
Write exactly 10 specific, fact-checkable claims about the current state of AI in software development and computer programming as of 2025–2026.
|
|
4
|
+
|
|
5
|
+
Each claim must be a clear, declarative statement that a well-informed analyst or technical researcher could verify — using publicly available sources such as research papers, vendor reports, official documentation, or reputable news outlets — as True, Partially True, Opinion, Partially False, or False.
|
|
6
|
+
|
|
7
|
+
**Difficulty calibration:** Approximately half of the claims should be verifiable with basic research (widely reported statistics or named tools), and half should require consulting primary sources, empirical studies, or detailed technical documentation published in 2024–2025.
|
|
8
|
+
|
|
9
|
+
**Claims must not be vague generalizations.** Each claim should include specific data points, named tools, version numbers, percentages, benchmark names, or named organizations where relevant.
|
|
10
|
+
|
|
11
|
+
Distribute your 10 claims across the following aspects:
|
|
12
|
+
- Adoption rates and market penetration of AI coding assistants (e.g., GitHub Copilot, Cursor, Claude Code, Gemini Code Assist)
|
|
13
|
+
- Measurable developer productivity impacts: speed, code quality, and defect rates
|
|
14
|
+
- AI's share of code written in enterprise and open-source projects
|
|
15
|
+
- Capabilities and current limitations in automated testing, debugging, and code review
|
|
16
|
+
- Security vulnerabilities, intellectual property concerns, and license compliance issues related to AI-generated code
|
|
17
|
+
|
|
18
|
+
**Format:** Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
|
|
19
|
+
|
|
@@ -0,0 +1,18 @@
|
|
|
1
|
+
# Cross-Stone Benchmark Prompt -- Writing, Editing & Summarizing
|
|
2
|
+
|
|
3
|
+
Write exactly 10 specific, fact-checkable claims about the current state of AI in writing, editing, and document summarization as of 2025-2026.
|
|
4
|
+
|
|
5
|
+
Each claim must be a clear, declarative statement that a well-informed analyst could verify -- using publicly available sources such as usage reports, academic benchmarks, organizational policies, or reputable news outlets -- as True, Partially True, Opinion, Partially False, or False.
|
|
6
|
+
|
|
7
|
+
Difficulty calibration: Approximately half of the claims should be verifiable with basic research (widely reported statistics or named tools), and half should require consulting primary sources, benchmark studies, or organizational policy documents published in 2024-2025.
|
|
8
|
+
|
|
9
|
+
Claims must not be vague generalizations. Each claim should include specific data points, named tools, benchmark scores, percentages, organizational names, or policy citations where relevant.
|
|
10
|
+
|
|
11
|
+
Distribute your 10 claims across the following aspects:
|
|
12
|
+
- Adoption and usage statistics for AI writing assistants (e.g., ChatGPT, Grammarly, Notion AI, Microsoft Copilot, Claude)
|
|
13
|
+
- Quality benchmarks comparing AI-generated text to human-written content across dimensions such as readability, accuracy, and factual consistency
|
|
14
|
+
- Use of AI in professional writing contexts: legal documents, medical records, journalism, and technical writing
|
|
15
|
+
- Accuracy and limitations of AI-generated content detectors (e.g., GPTZero, Copyleaks, Turnitin AI detection)
|
|
16
|
+
- Regulatory requirements and organizational disclosure policies governing AI-generated content
|
|
17
|
+
|
|
18
|
+
Format: Return a numbered list of exactly 10 claims with no introductory text, section headers, summaries, or commentary.
|