@wentorai/research-plugins 1.2.2 → 1.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +16 -8
- package/openclaw.plugin.json +10 -3
- package/package.json +2 -5
- package/skills/analysis/dataviz/SKILL.md +25 -0
- package/skills/analysis/dataviz/chart-image-generator/SKILL.md +1 -1
- package/skills/analysis/econometrics/SKILL.md +23 -0
- package/skills/analysis/econometrics/robustness-checks/SKILL.md +1 -1
- package/skills/analysis/statistics/SKILL.md +21 -0
- package/skills/analysis/statistics/data-anomaly-detection/SKILL.md +1 -1
- package/skills/analysis/statistics/ml-experiment-tracker/SKILL.md +1 -1
- package/skills/analysis/statistics/{senior-data-scientist-guide → modeling-strategy-guide}/SKILL.md +5 -5
- package/skills/analysis/wrangling/SKILL.md +21 -0
- package/skills/analysis/wrangling/csv-data-analyzer/SKILL.md +1 -1
- package/skills/analysis/wrangling/data-cog-guide/SKILL.md +1 -1
- package/skills/domains/ai-ml/SKILL.md +37 -0
- package/skills/domains/biomedical/SKILL.md +28 -0
- package/skills/domains/biomedical/genomas-guide/SKILL.md +1 -1
- package/skills/domains/biomedical/med-researcher-guide/SKILL.md +1 -1
- package/skills/domains/biomedical/medgeclaw-guide/SKILL.md +1 -1
- package/skills/domains/business/SKILL.md +17 -0
- package/skills/domains/business/architecture-design-guide/SKILL.md +1 -1
- package/skills/domains/chemistry/SKILL.md +19 -0
- package/skills/domains/chemistry/computational-chemistry-guide/SKILL.md +1 -1
- package/skills/domains/cs/SKILL.md +21 -0
- package/skills/domains/ecology/SKILL.md +16 -0
- package/skills/domains/economics/SKILL.md +20 -0
- package/skills/domains/economics/post-labor-economics/SKILL.md +1 -1
- package/skills/domains/economics/pricing-psychology-guide/SKILL.md +1 -1
- package/skills/domains/education/SKILL.md +19 -0
- package/skills/domains/education/academic-study-methods/SKILL.md +1 -1
- package/skills/domains/education/edumcp-guide/SKILL.md +1 -1
- package/skills/domains/finance/SKILL.md +19 -0
- package/skills/domains/finance/akshare-finance-data/SKILL.md +1 -1
- package/skills/domains/finance/options-analytics-agent-guide/SKILL.md +1 -1
- package/skills/domains/finance/stata-accounting-research/SKILL.md +1 -1
- package/skills/domains/geoscience/SKILL.md +17 -0
- package/skills/domains/humanities/SKILL.md +16 -0
- package/skills/domains/humanities/history-research-guide/SKILL.md +1 -1
- package/skills/domains/humanities/political-history-guide/SKILL.md +1 -1
- package/skills/domains/law/SKILL.md +19 -0
- package/skills/domains/math/SKILL.md +17 -0
- package/skills/domains/pharma/SKILL.md +17 -0
- package/skills/domains/physics/SKILL.md +16 -0
- package/skills/domains/social-science/SKILL.md +17 -0
- package/skills/domains/social-science/sociology-research-methods/SKILL.md +1 -1
- package/skills/literature/discovery/SKILL.md +20 -0
- package/skills/literature/discovery/paper-recommendation-guide/SKILL.md +1 -1
- package/skills/literature/discovery/semantic-paper-radar/SKILL.md +1 -1
- package/skills/literature/fulltext/SKILL.md +26 -0
- package/skills/literature/metadata/SKILL.md +35 -0
- package/skills/literature/metadata/doi-content-negotiation/SKILL.md +4 -0
- package/skills/literature/metadata/doi-resolution-guide/SKILL.md +4 -0
- package/skills/literature/metadata/orcid-api/SKILL.md +4 -0
- package/skills/literature/metadata/orcid-integration-guide/SKILL.md +4 -0
- package/skills/literature/search/SKILL.md +43 -0
- package/skills/literature/search/paper-search-mcp-guide/SKILL.md +1 -1
- package/skills/research/automation/SKILL.md +21 -0
- package/skills/research/deep-research/SKILL.md +24 -0
- package/skills/research/deep-research/auto-deep-research-guide/SKILL.md +1 -1
- package/skills/research/deep-research/in-depth-research-guide/SKILL.md +1 -1
- package/skills/research/funding/SKILL.md +20 -0
- package/skills/research/methodology/SKILL.md +24 -0
- package/skills/research/paper-review/SKILL.md +19 -0
- package/skills/research/paper-review/paper-critique-framework/SKILL.md +1 -1
- package/skills/tools/code-exec/SKILL.md +18 -0
- package/skills/tools/diagram/SKILL.md +20 -0
- package/skills/tools/document/SKILL.md +21 -0
- package/skills/tools/knowledge-graph/SKILL.md +21 -0
- package/skills/tools/ocr-translate/SKILL.md +18 -0
- package/skills/tools/ocr-translate/handwriting-recognition-guide/SKILL.md +2 -0
- package/skills/tools/ocr-translate/latex-ocr-guide/SKILL.md +2 -0
- package/skills/tools/scraping/SKILL.md +17 -0
- package/skills/writing/citation/SKILL.md +33 -0
- package/skills/writing/citation/zotfile-attachment-guide/SKILL.md +2 -0
- package/skills/writing/composition/SKILL.md +22 -0
- package/skills/writing/composition/research-paper-writer/SKILL.md +1 -1
- package/skills/writing/composition/scientific-writing-wrapper/SKILL.md +1 -1
- package/skills/writing/latex/SKILL.md +22 -0
- package/skills/writing/latex/academic-writing-latex/SKILL.md +1 -1
- package/skills/writing/latex/latex-drawing-guide/SKILL.md +1 -1
- package/skills/writing/polish/SKILL.md +20 -0
- package/skills/writing/polish/chinese-text-humanizer/SKILL.md +1 -1
- package/skills/writing/templates/SKILL.md +22 -0
- package/skills/writing/templates/beamer-presentation-guide/SKILL.md +1 -1
- package/skills/writing/templates/scientific-article-pdf/SKILL.md +1 -1
- package/skills/analysis/dataviz/citation-map-guide/SKILL.md +0 -184
- package/skills/analysis/dataviz/data-visualization-principles/SKILL.md +0 -171
- package/skills/analysis/econometrics/empirical-paper-analysis/SKILL.md +0 -192
- package/skills/analysis/econometrics/panel-data-regression-workflow/SKILL.md +0 -267
- package/skills/analysis/econometrics/stata-regression/SKILL.md +0 -117
- package/skills/analysis/statistics/general-statistics-guide/SKILL.md +0 -226
- package/skills/analysis/statistics/infiagent-benchmark-guide/SKILL.md +0 -106
- package/skills/analysis/statistics/pywayne-statistics-guide/SKILL.md +0 -192
- package/skills/analysis/statistics/quantitative-methods-guide/SKILL.md +0 -193
- package/skills/analysis/wrangling/claude-data-analysis-guide/SKILL.md +0 -100
- package/skills/analysis/wrangling/open-data-scientist-guide/SKILL.md +0 -197
- package/skills/domains/ai-ml/annotated-dl-papers-guide/SKILL.md +0 -159
- package/skills/domains/humanities/digital-humanities-methods/SKILL.md +0 -232
- package/skills/domains/law/legal-research-methods/SKILL.md +0 -190
- package/skills/domains/social-science/sociology-research-guide/SKILL.md +0 -238
- package/skills/literature/discovery/arxiv-paper-monitoring/SKILL.md +0 -233
- package/skills/literature/discovery/paper-tracking-guide/SKILL.md +0 -211
- package/skills/literature/fulltext/zotero-scihub-guide/SKILL.md +0 -168
- package/skills/literature/search/arxiv-osiris/SKILL.md +0 -199
- package/skills/literature/search/deepgit-search-guide/SKILL.md +0 -147
- package/skills/literature/search/multi-database-literature-search/SKILL.md +0 -198
- package/skills/literature/search/papers-chat-guide/SKILL.md +0 -194
- package/skills/literature/search/pasa-paper-search-guide/SKILL.md +0 -138
- package/skills/literature/search/scientify-literature-survey/SKILL.md +0 -203
- package/skills/research/automation/ai-scientist-guide/SKILL.md +0 -228
- package/skills/research/automation/coexist-ai-guide/SKILL.md +0 -149
- package/skills/research/automation/foam-agent-guide/SKILL.md +0 -203
- package/skills/research/automation/research-paper-orchestrator/SKILL.md +0 -254
- package/skills/research/deep-research/academic-deep-research/SKILL.md +0 -190
- package/skills/research/deep-research/cognitive-kernel-guide/SKILL.md +0 -200
- package/skills/research/deep-research/corvus-research-guide/SKILL.md +0 -132
- package/skills/research/deep-research/deep-research-pro/SKILL.md +0 -213
- package/skills/research/deep-research/deep-research-work/SKILL.md +0 -204
- package/skills/research/deep-research/research-cog/SKILL.md +0 -153
- package/skills/research/methodology/academic-mentor-guide/SKILL.md +0 -169
- package/skills/research/methodology/deep-innovator-guide/SKILL.md +0 -242
- package/skills/research/methodology/research-pipeline-units-guide/SKILL.md +0 -169
- package/skills/research/paper-review/paper-compare-guide/SKILL.md +0 -238
- package/skills/research/paper-review/paper-digest-guide/SKILL.md +0 -240
- package/skills/research/paper-review/paper-research-assistant/SKILL.md +0 -231
- package/skills/research/paper-review/research-quality-filter/SKILL.md +0 -261
- package/skills/tools/code-exec/contextplus-mcp-guide/SKILL.md +0 -110
- package/skills/tools/diagram/clawphd-guide/SKILL.md +0 -149
- package/skills/tools/diagram/scientific-graphical-abstract/SKILL.md +0 -201
- package/skills/tools/document/md2pdf-xelatex/SKILL.md +0 -212
- package/skills/tools/document/openpaper-guide/SKILL.md +0 -232
- package/skills/tools/document/weknora-guide/SKILL.md +0 -216
- package/skills/tools/knowledge-graph/mimir-memory-guide/SKILL.md +0 -135
- package/skills/tools/knowledge-graph/open-webui-tools-guide/SKILL.md +0 -156
- package/skills/tools/ocr-translate/formula-recognition-guide/SKILL.md +0 -367
- package/skills/tools/ocr-translate/math-equation-renderer/SKILL.md +0 -198
- package/skills/tools/scraping/api-data-collection-guide/SKILL.md +0 -301
- package/skills/writing/citation/academic-citation-manager-guide/SKILL.md +0 -182
- package/skills/writing/composition/opendraft-thesis-guide/SKILL.md +0 -200
- package/skills/writing/composition/paper-debugger-guide/SKILL.md +0 -143
- package/skills/writing/composition/paperforge-guide/SKILL.md +0 -205
|
@@ -1,228 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
name: ai-scientist-guide
|
|
3
|
-
description: "End-to-end automated scientific discovery with AI Scientist v2"
|
|
4
|
-
metadata:
|
|
5
|
-
openclaw:
|
|
6
|
-
emoji: "🤖"
|
|
7
|
-
category: "research"
|
|
8
|
-
subcategory: "automation"
|
|
9
|
-
keywords: ["ai-scientist", "research automation", "scientific workflow", "AI experiment design"]
|
|
10
|
-
source: "https://github.com/SakanaAI/AI-Scientist-v2"
|
|
11
|
-
---
|
|
12
|
-
|
|
13
|
-
# AI Scientist Guide
|
|
14
|
-
|
|
15
|
-
## Overview
|
|
16
|
-
|
|
17
|
-
The AI Scientist v2 is a fully autonomous scientific research system developed by Sakana AI that can generate hypotheses, run experiments, analyze data, and write complete scientific manuscripts. It represents the cutting edge of AI-driven research automation, having produced the first workshop paper written entirely by AI and accepted through peer review at ICLR 2025.
|
|
18
|
-
|
|
19
|
-
Unlike its predecessor (v1), the AI Scientist v2 removes reliance on human-authored templates, generalizes across machine learning domains, and employs a progressive agentic tree search guided by an experiment manager agent. This guide explains how to set up, configure, and use the system effectively, as well as how to integrate its principles into your own research workflows.
|
|
20
|
-
|
|
21
|
-
This skill is relevant for researchers interested in accelerating their experimental cycles, exploring automated hypothesis generation, or understanding how agentic AI systems approach scientific discovery. Even if you do not use AI Scientist v2 directly, the concepts behind its design -- structured ideation, tree-based experiment exploration, automated writing -- can inform how you organize your own research.
|
|
22
|
-
|
|
23
|
-
## System Architecture
|
|
24
|
-
|
|
25
|
-
The AI Scientist v2 operates through a multi-stage pipeline:
|
|
26
|
-
|
|
27
|
-
```
|
|
28
|
-
Topic Description (.md)
|
|
29
|
-
|
|
|
30
|
-
v
|
|
31
|
-
[Ideation Stage] --> Research Ideas (.json)
|
|
32
|
-
|
|
|
33
|
-
v
|
|
34
|
-
[Experiment Stage] --> Best-First Tree Search (BFTS)
|
|
35
|
-
| - Multiple parallel workers
|
|
36
|
-
| - Automatic debugging
|
|
37
|
-
| - Experiment manager agent
|
|
38
|
-
v
|
|
39
|
-
[Analysis Stage] --> Results + Figures
|
|
40
|
-
|
|
|
41
|
-
v
|
|
42
|
-
[Writing Stage] --> Complete Paper (.pdf)
|
|
43
|
-
|
|
|
44
|
-
v
|
|
45
|
-
[Review Stage] --> Automated Peer Review
|
|
46
|
-
```
|
|
47
|
-
|
|
48
|
-
### Key Components
|
|
49
|
-
|
|
50
|
-
| Component | Role | Model Used |
|
|
51
|
-
|-----------|------|------------|
|
|
52
|
-
| Ideation Agent | Generates research hypotheses | Configurable (GPT-4o, Claude) |
|
|
53
|
-
| Experiment Manager | Guides tree search exploration | Claude 3.5 Sonnet (default) |
|
|
54
|
-
| Analysis Agent | Interprets results, creates figures | Same as experiment |
|
|
55
|
-
| Writing Agent | Drafts full paper with LaTeX | o1-preview (default) |
|
|
56
|
-
| Citation Agent | Finds and integrates references | GPT-4o (default) |
|
|
57
|
-
| Review Agent | Simulates peer review | GPT-4o (default) |
|
|
58
|
-
|
|
59
|
-
## Installation and Setup
|
|
60
|
-
|
|
61
|
-
### Prerequisites
|
|
62
|
-
|
|
63
|
-
- Linux with NVIDIA GPU (CUDA support required)
|
|
64
|
-
- Python 3.11+
|
|
65
|
-
- conda or mamba package manager
|
|
66
|
-
|
|
67
|
-
### Step-by-Step Installation
|
|
68
|
-
|
|
69
|
-
```bash
|
|
70
|
-
# 1. Create and activate environment
|
|
71
|
-
conda create -n ai_scientist python=3.11
|
|
72
|
-
conda activate ai_scientist
|
|
73
|
-
|
|
74
|
-
# 2. Install PyTorch with CUDA
|
|
75
|
-
conda install pytorch torchvision torchaudio pytorch-cuda=12.4 \
|
|
76
|
-
-c pytorch -c nvidia
|
|
77
|
-
|
|
78
|
-
# 3. Install PDF and LaTeX tools
|
|
79
|
-
conda install anaconda::poppler conda-forge::chktex
|
|
80
|
-
|
|
81
|
-
# 4. Clone and install
|
|
82
|
-
git clone https://github.com/SakanaAI/AI-Scientist-v2.git
|
|
83
|
-
cd AI-Scientist-v2
|
|
84
|
-
pip install -r requirements.txt
|
|
85
|
-
|
|
86
|
-
# 5. Set API keys
|
|
87
|
-
export OPENAI_API_KEY=<key>
|
|
88
|
-
export S2_API_KEY=<key> # Optional but recommended
|
|
89
|
-
```
|
|
90
|
-
|
|
91
|
-
## Running the Pipeline
|
|
92
|
-
|
|
93
|
-
### Stage 1: Ideation
|
|
94
|
-
|
|
95
|
-
Create a topic description file following this structure:
|
|
96
|
-
|
|
97
|
-
```markdown
|
|
98
|
-
# Title
|
|
99
|
-
Exploring Efficient Fine-Tuning Methods for Large Language Models
|
|
100
|
-
|
|
101
|
-
# Keywords
|
|
102
|
-
LoRA, parameter-efficient fine-tuning, LLM adaptation, low-rank
|
|
103
|
-
|
|
104
|
-
# TL;DR
|
|
105
|
-
Investigate novel parameter-efficient methods for adapting LLMs to
|
|
106
|
-
domain-specific tasks with minimal compute.
|
|
107
|
-
|
|
108
|
-
# Abstract
|
|
109
|
-
Large language models require substantial resources for full fine-tuning.
|
|
110
|
-
Parameter-efficient methods like LoRA reduce this cost but may sacrifice
|
|
111
|
-
performance. We seek to explore new approaches that balance efficiency
|
|
112
|
-
and effectiveness across diverse downstream tasks.
|
|
113
|
-
```
|
|
114
|
-
|
|
115
|
-
Run ideation:
|
|
116
|
-
|
|
117
|
-
```bash
|
|
118
|
-
python ai_scientist/perform_ideation_temp_free.py \
|
|
119
|
-
--workshop-file "ai_scientist/ideas/my_topic.md" \
|
|
120
|
-
--model gpt-4o-2024-05-13 \
|
|
121
|
-
--max-num-generations 20 \
|
|
122
|
-
--num-reflections 5
|
|
123
|
-
```
|
|
124
|
-
|
|
125
|
-
This produces a JSON file with structured research ideas including hypotheses, proposed experiments, and related work.
|
|
126
|
-
|
|
127
|
-
### Stage 2: Experiment and Paper Generation
|
|
128
|
-
|
|
129
|
-
```bash
|
|
130
|
-
python launch_scientist_bfts.py \
|
|
131
|
-
--load_ideas "ai_scientist/ideas/my_topic.json" \
|
|
132
|
-
--load_code \
|
|
133
|
-
--add_dataset_ref \
|
|
134
|
-
--model_writeup o1-preview-2024-09-12 \
|
|
135
|
-
--model_citation gpt-4o-2024-11-20 \
|
|
136
|
-
--model_review gpt-4o-2024-11-20 \
|
|
137
|
-
--model_agg_plots o3-mini-2025-01-31 \
|
|
138
|
-
--num_cite_rounds 20
|
|
139
|
-
```
|
|
140
|
-
|
|
141
|
-
### Configuration: bfts_config.yaml
|
|
142
|
-
|
|
143
|
-
Key parameters to tune:
|
|
144
|
-
|
|
145
|
-
```yaml
|
|
146
|
-
agent:
|
|
147
|
-
num_workers: 3 # Parallel exploration paths
|
|
148
|
-
steps: 21 # Maximum nodes to explore
|
|
149
|
-
num_seeds: 3 # Initial root nodes
|
|
150
|
-
|
|
151
|
-
search:
|
|
152
|
-
max_debug_depth: 3 # Max debug attempts per failing node
|
|
153
|
-
debug_prob: 0.5 # Probability of debugging vs. abandoning
|
|
154
|
-
num_drafts: 3 # Number of independent search trees
|
|
155
|
-
```
|
|
156
|
-
|
|
157
|
-
## Cost and Performance Estimates
|
|
158
|
-
|
|
159
|
-
| Phase | Typical Cost | Duration |
|
|
160
|
-
|-------|-------------|----------|
|
|
161
|
-
| Ideation (20 ideas) | $2-5 | 15-30 min |
|
|
162
|
-
| Experimentation (BFTS) | $15-20 | 2-6 hours |
|
|
163
|
-
| Writing + Citation | $5 | 20-30 min |
|
|
164
|
-
| Review | $1-2 | 5-10 min |
|
|
165
|
-
| **Total per run** | **$23-32** | **3-7 hours** |
|
|
166
|
-
|
|
167
|
-
## Integrating AI Scientist Principles Into Your Research
|
|
168
|
-
|
|
169
|
-
Even without running the full system, you can adopt its methodological ideas:
|
|
170
|
-
|
|
171
|
-
### Structured Ideation
|
|
172
|
-
|
|
173
|
-
Use LLMs to brainstorm research directions systematically:
|
|
174
|
-
|
|
175
|
-
```python
|
|
176
|
-
prompt = """
|
|
177
|
-
Given the research area of [TOPIC], generate 5 research ideas.
|
|
178
|
-
For each idea, provide:
|
|
179
|
-
1. Hypothesis (one sentence)
|
|
180
|
-
2. Key experiment to test it
|
|
181
|
-
3. Expected outcome if hypothesis is true
|
|
182
|
-
4. Expected outcome if hypothesis is false
|
|
183
|
-
5. Why this matters (impact)
|
|
184
|
-
"""
|
|
185
|
-
```
|
|
186
|
-
|
|
187
|
-
### Tree-Based Experiment Design
|
|
188
|
-
|
|
189
|
-
Instead of running experiments linearly, structure them as a tree:
|
|
190
|
-
|
|
191
|
-
1. Start with 2-3 seed experiments (broad exploration)
|
|
192
|
-
2. Evaluate results at each node
|
|
193
|
-
3. Expand the most promising branches
|
|
194
|
-
4. Prune branches that show diminishing returns
|
|
195
|
-
5. Debug failures before abandoning (up to a depth limit)
|
|
196
|
-
|
|
197
|
-
### Automated Literature Checks
|
|
198
|
-
|
|
199
|
-
Use the Semantic Scholar API to check novelty before investing in an idea:
|
|
200
|
-
|
|
201
|
-
```python
|
|
202
|
-
import requests
|
|
203
|
-
|
|
204
|
-
def check_novelty(query, max_results=10):
|
|
205
|
-
url = "https://api.semanticscholar.org/graph/v1/paper/search"
|
|
206
|
-
params = {"query": query, "limit": max_results,
|
|
207
|
-
"fields": "title,year,citationCount"}
|
|
208
|
-
resp = requests.get(url, params=params)
|
|
209
|
-
papers = resp.json().get('data', [])
|
|
210
|
-
return papers
|
|
211
|
-
```
|
|
212
|
-
|
|
213
|
-
## Best Practices
|
|
214
|
-
|
|
215
|
-
- **Always disclose AI involvement.** If AI Scientist generates any part of your paper, disclose this clearly in the methods section.
|
|
216
|
-
- **Validate all generated results.** Automated systems can produce plausible but incorrect code. Review experiments manually.
|
|
217
|
-
- **Use sandboxed environments.** The system executes LLM-generated code. Run it in Docker containers.
|
|
218
|
-
- **Start with well-defined topics.** Narrow, concrete research questions produce better results than broad ones.
|
|
219
|
-
- **Iterate on the topic description.** The quality of the input topic file strongly influences output quality.
|
|
220
|
-
- **Combine with human judgment.** Use AI Scientist for ideation and draft generation, but apply human expertise for final decisions.
|
|
221
|
-
|
|
222
|
-
## References
|
|
223
|
-
|
|
224
|
-
- [AI-Scientist-v2 Repository](https://github.com/SakanaAI/AI-Scientist-v2) -- Source code (2,229+ stars)
|
|
225
|
-
- [AI Scientist v2 Paper](https://pub.sakana.ai/ai-scientist-v2/paper) -- Workshop-Level Automated Scientific Discovery via Agentic Tree Search
|
|
226
|
-
- [AI Scientist Blog Post](https://sakana.ai/ai-scientist-first-publication/) -- Sakana AI announcement
|
|
227
|
-
- [AIDE: ML Engineering Agent](https://github.com/WecoAI/aideml) -- Foundation for the tree search component
|
|
228
|
-
- [Semantic Scholar API](https://api.semanticscholar.org/) -- Literature search API
|
|
@@ -1,149 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
name: coexist-ai-guide
|
|
3
|
-
description: "Modular MCP-based research assistant framework"
|
|
4
|
-
metadata:
|
|
5
|
-
openclaw:
|
|
6
|
-
emoji: "🧩"
|
|
7
|
-
category: "research"
|
|
8
|
-
subcategory: "automation"
|
|
9
|
-
keywords: ["CoexistAI", "MCP", "research assistant", "modular agents", "academic workflow", "framework"]
|
|
10
|
-
source: "https://github.com/SPThole/CoexistAI"
|
|
11
|
-
---
|
|
12
|
-
|
|
13
|
-
# CoexistAI Research Assistant Guide
|
|
14
|
-
|
|
15
|
-
## Overview
|
|
16
|
-
|
|
17
|
-
CoexistAI is a modular research assistant framework built on MCP (Model Context Protocol) that provides composable academic research capabilities. It offers MCP servers for paper search, citation management, data analysis, and writing assistance that can be mixed and matched with any MCP-compatible LLM client. It is designed for researchers who want customizable, extensible AI research tooling.
|
|
18
|
-
|
|
19
|
-
## Architecture
|
|
20
|
-
|
|
21
|
-
```
|
|
22
|
-
LLM Client (Claude Code / Open WebUI / etc.)
|
|
23
|
-
↓ MCP Protocol
|
|
24
|
-
CoexistAI MCP Servers
|
|
25
|
-
├── paper-search (arXiv, S2, PubMed)
|
|
26
|
-
├── citation-manager (BibTeX, formatting)
|
|
27
|
-
├── data-analysis (Python execution)
|
|
28
|
-
├── writing-assist (drafting, revision)
|
|
29
|
-
├── note-taker (structured notes)
|
|
30
|
-
└── custom modules (extend as needed)
|
|
31
|
-
```
|
|
32
|
-
|
|
33
|
-
## Installation
|
|
34
|
-
|
|
35
|
-
```bash
|
|
36
|
-
# Install CoexistAI
|
|
37
|
-
npm install -g @coexistai/mcp-servers
|
|
38
|
-
|
|
39
|
-
# Or individual modules
|
|
40
|
-
npm install -g @coexistai/paper-search
|
|
41
|
-
npm install -g @coexistai/citation-manager
|
|
42
|
-
npm install -g @coexistai/data-analysis
|
|
43
|
-
```
|
|
44
|
-
|
|
45
|
-
## MCP Configuration
|
|
46
|
-
|
|
47
|
-
```json
|
|
48
|
-
{
|
|
49
|
-
"mcpServers": {
|
|
50
|
-
"coexist-paper-search": {
|
|
51
|
-
"command": "npx",
|
|
52
|
-
"args": ["@coexistai/paper-search"],
|
|
53
|
-
"env": {}
|
|
54
|
-
},
|
|
55
|
-
"coexist-citation": {
|
|
56
|
-
"command": "npx",
|
|
57
|
-
"args": ["@coexistai/citation-manager"],
|
|
58
|
-
"env": {
|
|
59
|
-
"BIB_FILE": "./references.bib"
|
|
60
|
-
}
|
|
61
|
-
},
|
|
62
|
-
"coexist-analysis": {
|
|
63
|
-
"command": "npx",
|
|
64
|
-
"args": ["@coexistai/data-analysis"],
|
|
65
|
-
"env": {
|
|
66
|
-
"SANDBOX": "true"
|
|
67
|
-
}
|
|
68
|
-
}
|
|
69
|
-
}
|
|
70
|
-
}
|
|
71
|
-
```
|
|
72
|
-
|
|
73
|
-
## Module: Paper Search
|
|
74
|
-
|
|
75
|
-
```markdown
|
|
76
|
-
### Available Tools
|
|
77
|
-
- `search_papers(query, source, limit)` — Search academic DBs
|
|
78
|
-
- `get_paper_details(id)` — Fetch full metadata
|
|
79
|
-
- `find_related(id, limit)` — Find related papers
|
|
80
|
-
- `get_citations(id)` — List citing papers
|
|
81
|
-
- `get_references(id)` — List referenced papers
|
|
82
|
-
|
|
83
|
-
### Example Usage
|
|
84
|
-
"Search for papers on contrastive learning in NLP from 2023"
|
|
85
|
-
→ Returns top results with title, authors, abstract, DOI
|
|
86
|
-
```
|
|
87
|
-
|
|
88
|
-
## Module: Citation Manager
|
|
89
|
-
|
|
90
|
-
```markdown
|
|
91
|
-
### Available Tools
|
|
92
|
-
- `add_citation(doi)` — Add to .bib file from DOI
|
|
93
|
-
- `format_citation(id, style)` — Format in APA/MLA/etc
|
|
94
|
-
- `search_bib(query)` — Search existing bibliography
|
|
95
|
-
- `check_duplicates()` — Find duplicate entries
|
|
96
|
-
- `export_bib(format)` — Export in various formats
|
|
97
|
-
|
|
98
|
-
### Example Usage
|
|
99
|
-
"Add the BERT paper to my bibliography"
|
|
100
|
-
→ Fetches metadata, generates BibTeX, appends to references.bib
|
|
101
|
-
```
|
|
102
|
-
|
|
103
|
-
## Module: Data Analysis
|
|
104
|
-
|
|
105
|
-
```markdown
|
|
106
|
-
### Available Tools
|
|
107
|
-
- `run_python(code)` — Execute Python in sandbox
|
|
108
|
-
- `analyze_csv(path, task)` — Auto-analyze data file
|
|
109
|
-
- `generate_plot(data, type)` — Create visualizations
|
|
110
|
-
- `run_statistics(data, test)` — Statistical tests
|
|
111
|
-
|
|
112
|
-
### Example Usage
|
|
113
|
-
"Run a t-test comparing groups A and B in experiment.csv"
|
|
114
|
-
→ Loads data, runs scipy.stats.ttest_ind, returns results
|
|
115
|
-
```
|
|
116
|
-
|
|
117
|
-
## Custom Module Development
|
|
118
|
-
|
|
119
|
-
```typescript
|
|
120
|
-
// Create a custom MCP module
|
|
121
|
-
import { McpServer } from "@modelcontextprotocol/sdk/server/mcp.js";
|
|
122
|
-
|
|
123
|
-
const server = new McpServer({
|
|
124
|
-
name: "my-research-tool",
|
|
125
|
-
version: "1.0.0",
|
|
126
|
-
});
|
|
127
|
-
|
|
128
|
-
server.tool(
|
|
129
|
-
"custom_analysis",
|
|
130
|
-
{ description: "Run custom research analysis" },
|
|
131
|
-
async (args) => {
|
|
132
|
-
// Your custom logic
|
|
133
|
-
return { result: "Analysis complete" };
|
|
134
|
-
}
|
|
135
|
-
);
|
|
136
|
-
```
|
|
137
|
-
|
|
138
|
-
## Use Cases
|
|
139
|
-
|
|
140
|
-
1. **Modular research**: Pick-and-choose research capabilities
|
|
141
|
-
2. **Custom pipelines**: Build tailored research workflows
|
|
142
|
-
3. **Tool integration**: Connect to existing research infrastructure
|
|
143
|
-
4. **Team standardization**: Shared MCP modules across lab
|
|
144
|
-
5. **Extension**: Add domain-specific research tools
|
|
145
|
-
|
|
146
|
-
## References
|
|
147
|
-
|
|
148
|
-
- [CoexistAI GitHub](https://github.com/SPThole/CoexistAI)
|
|
149
|
-
- [MCP Specification](https://modelcontextprotocol.io/)
|
|
@@ -1,203 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
name: foam-agent-guide
|
|
3
|
-
description: "Agent for automated knowledge graph building from research notes"
|
|
4
|
-
metadata:
|
|
5
|
-
openclaw:
|
|
6
|
-
emoji: "🫧"
|
|
7
|
-
category: "research"
|
|
8
|
-
subcategory: "automation"
|
|
9
|
-
keywords: ["Foam", "knowledge graph", "Zettelkasten", "research notes", "linked notes", "PKM agent"]
|
|
10
|
-
source: "https://github.com/foambubble/foam"
|
|
11
|
-
---
|
|
12
|
-
|
|
13
|
-
# Foam Agent Guide
|
|
14
|
-
|
|
15
|
-
## Overview
|
|
16
|
-
|
|
17
|
-
Foam is a personal knowledge management and note-sharing system built on VS Code, inspired by Roam Research. This guide covers using AI agents to automate Foam-based research workflows — extracting concepts from papers, building knowledge graphs, discovering connections between notes, and maintaining a Zettelkasten-style research knowledge base. This approach is particularly useful for researchers managing large literature collections.
|
|
18
|
-
|
|
19
|
-
## Foam Basics
|
|
20
|
-
|
|
21
|
-
### Workspace Structure
|
|
22
|
-
|
|
23
|
-
```
|
|
24
|
-
research-foam/
|
|
25
|
-
├── .foam/
|
|
26
|
-
│ └── config.json # Foam configuration
|
|
27
|
-
├── .vscode/
|
|
28
|
-
│ └── settings.json # VS Code settings
|
|
29
|
-
├── inbox/ # Unprocessed notes
|
|
30
|
-
├── literature/ # Paper notes (one per paper)
|
|
31
|
-
├── concepts/ # Concept/topic notes
|
|
32
|
-
├── projects/ # Project-specific notes
|
|
33
|
-
├── daily/ # Daily research journal
|
|
34
|
-
└── README.md # Graph entry point
|
|
35
|
-
```
|
|
36
|
-
|
|
37
|
-
### Note Format
|
|
38
|
-
|
|
39
|
-
```markdown
|
|
40
|
-
# Attention Mechanism
|
|
41
|
-
|
|
42
|
-
Tags: #transformer #nlp #deep-learning
|
|
43
|
-
|
|
44
|
-
## Summary
|
|
45
|
-
The attention mechanism allows models to focus on relevant parts
|
|
46
|
-
of the input sequence when producing output.
|
|
47
|
-
|
|
48
|
-
## Key Concepts
|
|
49
|
-
- [[self-attention]] computes relationships within a sequence
|
|
50
|
-
- [[cross-attention]] relates two different sequences
|
|
51
|
-
- [[multi-head-attention]] runs parallel attention functions
|
|
52
|
-
|
|
53
|
-
## References
|
|
54
|
-
- [[vaswani-2017-attention]] — original Transformer paper
|
|
55
|
-
- [[bahdanau-2015-attention]] — attention for NMT
|
|
56
|
-
|
|
57
|
-
## Related
|
|
58
|
-
- [[transformer-architecture]]
|
|
59
|
-
- [[positional-encoding]]
|
|
60
|
-
```
|
|
61
|
-
|
|
62
|
-
## Automated Note Generation
|
|
63
|
-
|
|
64
|
-
```python
|
|
65
|
-
from foam_agent import FoamAgent
|
|
66
|
-
|
|
67
|
-
agent = FoamAgent(
|
|
68
|
-
workspace="./research-foam",
|
|
69
|
-
llm_provider="anthropic",
|
|
70
|
-
)
|
|
71
|
-
|
|
72
|
-
# Generate literature note from PDF
|
|
73
|
-
note = agent.process_paper(
|
|
74
|
-
pdf_path="papers/vaswani2017attention.pdf",
|
|
75
|
-
template="literature",
|
|
76
|
-
)
|
|
77
|
-
# Creates: literature/vaswani-2017-attention.md
|
|
78
|
-
# - Extracts title, authors, year, venue
|
|
79
|
-
# - Summarizes key contributions
|
|
80
|
-
# - Identifies main concepts → [[wikilinks]]
|
|
81
|
-
# - Adds BibTeX reference
|
|
82
|
-
|
|
83
|
-
# Batch process papers directory
|
|
84
|
-
agent.process_papers_batch(
|
|
85
|
-
input_dir="papers/",
|
|
86
|
-
output_dir="literature/",
|
|
87
|
-
skip_existing=True,
|
|
88
|
-
)
|
|
89
|
-
```
|
|
90
|
-
|
|
91
|
-
## Knowledge Graph Building
|
|
92
|
-
|
|
93
|
-
```python
|
|
94
|
-
# Discover connections between notes
|
|
95
|
-
connections = agent.discover_connections(
|
|
96
|
-
scope="literature/",
|
|
97
|
-
min_similarity=0.7,
|
|
98
|
-
)
|
|
99
|
-
|
|
100
|
-
for conn in connections:
|
|
101
|
-
print(f"{conn.source} ↔ {conn.target}")
|
|
102
|
-
print(f" Reason: {conn.reason}")
|
|
103
|
-
print(f" Similarity: {conn.score:.2f}")
|
|
104
|
-
|
|
105
|
-
# Auto-insert wikilinks for discovered connections
|
|
106
|
-
agent.link_notes(connections, mode="suggest")
|
|
107
|
-
# Adds [[suggested-link]] with <!-- foam:auto --> comment
|
|
108
|
-
|
|
109
|
-
# Build concept map from literature notes
|
|
110
|
-
concept_map = agent.build_concept_map(
|
|
111
|
-
scope="literature/",
|
|
112
|
-
min_mentions=3,
|
|
113
|
-
)
|
|
114
|
-
for concept in concept_map.nodes:
|
|
115
|
-
print(f"{concept.name}: mentioned in {concept.count} papers")
|
|
116
|
-
```
|
|
117
|
-
|
|
118
|
-
## Daily Research Journal
|
|
119
|
-
|
|
120
|
-
```python
|
|
121
|
-
# Generate daily note with research context
|
|
122
|
-
agent.create_daily_note(
|
|
123
|
-
include=[
|
|
124
|
-
"recent_papers", # Papers read recently
|
|
125
|
-
"open_questions", # Unresolved questions from notes
|
|
126
|
-
"stale_notes", # Notes not updated in 30+ days
|
|
127
|
-
"orphan_notes", # Notes with no incoming links
|
|
128
|
-
"suggested_reading", # Papers related to recent work
|
|
129
|
-
],
|
|
130
|
-
)
|
|
131
|
-
|
|
132
|
-
# Output: daily/2025-03-10.md
|
|
133
|
-
# ## Recently Added
|
|
134
|
-
# - [[vaswani-2017-attention]] (added yesterday)
|
|
135
|
-
#
|
|
136
|
-
# ## Open Questions
|
|
137
|
-
# - How does [[rotary-position-embedding]] compare to [[alibi]]?
|
|
138
|
-
#
|
|
139
|
-
# ## Suggested Reading
|
|
140
|
-
# Based on recent notes on [[flash-attention]], consider:
|
|
141
|
-
# - "FlashAttention-2: Faster Attention" (Dao, 2023)
|
|
142
|
-
```
|
|
143
|
-
|
|
144
|
-
## Graph Analysis
|
|
145
|
-
|
|
146
|
-
```python
|
|
147
|
-
# Analyze knowledge graph structure
|
|
148
|
-
stats = agent.analyze_graph()
|
|
149
|
-
|
|
150
|
-
print(f"Total notes: {stats.total_notes}")
|
|
151
|
-
print(f"Total links: {stats.total_links}")
|
|
152
|
-
print(f"Orphan notes: {stats.orphan_count}")
|
|
153
|
-
print(f"Most connected: {stats.top_nodes[:5]}")
|
|
154
|
-
print(f"Clusters: {stats.cluster_count}")
|
|
155
|
-
|
|
156
|
-
# Identify research gaps
|
|
157
|
-
gaps = agent.find_gaps()
|
|
158
|
-
for gap in gaps:
|
|
159
|
-
print(f"Gap: {gap.description}")
|
|
160
|
-
print(f" Between clusters: {gap.cluster_a} ↔ {gap.cluster_b}")
|
|
161
|
-
print(f" Suggested topics: {gap.suggested_topics}")
|
|
162
|
-
```
|
|
163
|
-
|
|
164
|
-
## Configuration
|
|
165
|
-
|
|
166
|
-
```json
|
|
167
|
-
{
|
|
168
|
-
"foam.agent": {
|
|
169
|
-
"llm_provider": "anthropic",
|
|
170
|
-
"templates": {
|
|
171
|
-
"literature": "templates/literature.md",
|
|
172
|
-
"concept": "templates/concept.md",
|
|
173
|
-
"daily": "templates/daily.md"
|
|
174
|
-
},
|
|
175
|
-
"auto_link": {
|
|
176
|
-
"enabled": true,
|
|
177
|
-
"min_similarity": 0.75,
|
|
178
|
-
"max_suggestions_per_note": 5
|
|
179
|
-
},
|
|
180
|
-
"graph": {
|
|
181
|
-
"exclude_patterns": ["daily/*", "templates/*"],
|
|
182
|
-
"tag_colors": {
|
|
183
|
-
"transformer": "#3B82F6",
|
|
184
|
-
"nlp": "#10B981"
|
|
185
|
-
}
|
|
186
|
-
}
|
|
187
|
-
}
|
|
188
|
-
}
|
|
189
|
-
```
|
|
190
|
-
|
|
191
|
-
## Use Cases
|
|
192
|
-
|
|
193
|
-
1. **Literature management**: Auto-generate linked notes from papers
|
|
194
|
-
2. **Concept mapping**: Build and visualize research concept graphs
|
|
195
|
-
3. **Research journaling**: AI-assisted daily research summaries
|
|
196
|
-
4. **Gap discovery**: Find under-explored connections between topics
|
|
197
|
-
5. **Collaborative wikis**: Shared team research knowledge bases
|
|
198
|
-
|
|
199
|
-
## References
|
|
200
|
-
|
|
201
|
-
- [Foam GitHub](https://github.com/foambubble/foam)
|
|
202
|
-
- [Foam Documentation](https://foambubble.github.io/foam/)
|
|
203
|
-
- [Zettelkasten Method](https://zettelkasten.de/introduction/)
|