@happycastle/oh-my-openclaw 0.15.2 → 0.15.3
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/tools/look-at.js +2 -2
- package/dist/tools/web-search.js +2 -2
- package/openclaw.plugin.json +1 -1
- package/package.json +1 -1
- package/skills/gemini-look-at.md +21 -15
package/dist/tools/look-at.js
CHANGED
|
@@ -12,11 +12,11 @@ export function registerLookAtTool(api) {
|
|
|
12
12
|
goal: Type.String({ description: 'What to analyze or look for' }),
|
|
13
13
|
model: Type.Optional(Type.String({
|
|
14
14
|
description: 'Gemini model to use',
|
|
15
|
-
default: 'gemini-3-flash',
|
|
15
|
+
default: 'gemini-3-flash-preview',
|
|
16
16
|
})),
|
|
17
17
|
}),
|
|
18
18
|
execute: async (_toolCallId, params) => {
|
|
19
|
-
const model = params.model ?? 'gemini-3-flash';
|
|
19
|
+
const model = params.model ?? 'gemini-3-flash-preview';
|
|
20
20
|
try {
|
|
21
21
|
const stdout = await new Promise((resolve, reject) => {
|
|
22
22
|
execFile('gemini', ['-m', model, '--prompt', params.goal, '-f', params.file_path, '-o', 'text'], { timeout: GEMINI_TIMEOUT_MS, maxBuffer: 10 * 1024 * 1024 }, (error, stdout, stderr) => {
|
package/dist/tools/web-search.js
CHANGED
|
@@ -11,7 +11,7 @@ export function registerWebSearchTool(api) {
|
|
|
11
11
|
query: Type.String({ description: 'Search query or question to answer using web search' }),
|
|
12
12
|
model: Type.Optional(Type.String({
|
|
13
13
|
description: 'Gemini model to use',
|
|
14
|
-
default: 'gemini-3-flash',
|
|
14
|
+
default: 'gemini-3-flash-preview',
|
|
15
15
|
})),
|
|
16
16
|
}),
|
|
17
17
|
execute: async (_toolCallId, params) => {
|
|
@@ -19,7 +19,7 @@ export function registerWebSearchTool(api) {
|
|
|
19
19
|
if (!query) {
|
|
20
20
|
return toolError('Query is required and must not be empty');
|
|
21
21
|
}
|
|
22
|
-
const model = params.model ?? 'gemini-3-flash';
|
|
22
|
+
const model = params.model ?? 'gemini-3-flash-preview';
|
|
23
23
|
return new Promise((resolve) => {
|
|
24
24
|
execFile('gemini', ['-m', model, '--prompt', query, '-o', 'text'], { timeout: GEMINI_TIMEOUT_MS, maxBuffer: 10 * 1024 * 1024 }, (error, stdout, stderr) => {
|
|
25
25
|
if (error) {
|
package/openclaw.plugin.json
CHANGED
|
@@ -2,7 +2,7 @@
|
|
|
2
2
|
"id": "oh-my-openclaw",
|
|
3
3
|
"name": "Oh-My-OpenClaw",
|
|
4
4
|
"description": "Multi-agent orchestration plugin \u2014 11 agents, category-based model routing, todo enforcer, ralph loop, agent setup CLI, and custom tools",
|
|
5
|
-
"version": "0.
|
|
5
|
+
"version": "0.15.3",
|
|
6
6
|
"skills": ["skills"],
|
|
7
7
|
"configSchema": {
|
|
8
8
|
"type": "object",
|
package/package.json
CHANGED
package/skills/gemini-look-at.md
CHANGED
|
@@ -2,6 +2,7 @@
|
|
|
2
2
|
name: gemini-look-at
|
|
3
3
|
description: Gemini CLI-based multimodal analysis skill. Analyzes PDFs, images, screenshots, and diagrams using Gemini's native multimodal capabilities. Executed via tmux gemini session.
|
|
4
4
|
---
|
|
5
|
+
|
|
5
6
|
# Gemini Look-At — Multimodal Analysis via Gemini CLI
|
|
6
7
|
|
|
7
8
|
OmO's `look-at` tool reimplemented with Gemini CLI + tmux.
|
|
@@ -46,7 +47,7 @@ SESSION="gemini"
|
|
|
46
47
|
|
|
47
48
|
# Single file analysis
|
|
48
49
|
tmux -S "$SOCKET" send-keys -t "$SESSION":0.0 -l -- \
|
|
49
|
-
"gemini -m gemini-3-flash --prompt 'Analyze this file. Evaluate layout, design, and content quality, and suggest improvements.' -f /path/to/file.pdf -o text" \
|
|
50
|
+
"gemini -m gemini-3-flash-preview --prompt 'Analyze this file. Evaluate layout, design, and content quality, and suggest improvements.' -f /path/to/file.pdf -o text" \
|
|
50
51
|
&& sleep 0.1 && tmux -S "$SOCKET" send-keys -t "$SESSION":0.0 Enter
|
|
51
52
|
|
|
52
53
|
# Check results (wait 10-30 seconds)
|
|
@@ -60,7 +61,7 @@ When analysis results are long, redirect to file:
|
|
|
60
61
|
|
|
61
62
|
```bash
|
|
62
63
|
tmux -S "$SOCKET" send-keys -t "$SESSION":0.0 -l -- \
|
|
63
|
-
"gemini -m gemini-3-flash --prompt 'Detailed analysis' -f /path/to/file.pdf -o text > /tmp/gemini-analysis.md 2>&1" \
|
|
64
|
+
"gemini -m gemini-3-flash-preview --prompt 'Detailed analysis' -f /path/to/file.pdf -o text > /tmp/gemini-analysis.md 2>&1" \
|
|
64
65
|
&& sleep 0.1 && tmux -S "$SOCKET" send-keys -t "$SESSION":0.0 Enter
|
|
65
66
|
|
|
66
67
|
# Read results file
|
|
@@ -72,13 +73,14 @@ cat /tmp/gemini-analysis.md
|
|
|
72
73
|
|
|
73
74
|
```bash
|
|
74
75
|
tmux -S "$SOCKET" send-keys -t "$SESSION":0.0 -l -- \
|
|
75
|
-
"gemini -m gemini-3-flash --prompt 'Compare these two files' -f /path/to/before.png -f /path/to/after.png -o text" \
|
|
76
|
+
"gemini -m gemini-3-flash-preview --prompt 'Compare these two files' -f /path/to/before.png -f /path/to/after.png -o text" \
|
|
76
77
|
&& sleep 0.1 && tmux -S "$SOCKET" send-keys -t "$SESSION":0.0 Enter
|
|
77
78
|
```
|
|
78
79
|
|
|
79
80
|
## Analysis Prompts by Pattern
|
|
80
81
|
|
|
81
82
|
### PDF Layout/Design Review
|
|
83
|
+
|
|
82
84
|
```
|
|
83
85
|
Evaluate this PDF's layout, line breaks, and design.
|
|
84
86
|
If there are unnatural parts, tell me specifically.
|
|
@@ -86,6 +88,7 @@ In particular, check: margins, font size, line spacing, page breaks, table/image
|
|
|
86
88
|
```
|
|
87
89
|
|
|
88
90
|
### Screenshot UI Review
|
|
91
|
+
|
|
89
92
|
```
|
|
90
93
|
Analyze this web UI screenshot.
|
|
91
94
|
1. Layout alignment and spacing consistency
|
|
@@ -97,6 +100,7 @@ Provide specific improvement suggestions.
|
|
|
97
100
|
```
|
|
98
101
|
|
|
99
102
|
### Architecture Diagram Interpretation
|
|
103
|
+
|
|
100
104
|
```
|
|
101
105
|
Analyze this architecture diagram.
|
|
102
106
|
- Identify the role of each component
|
|
@@ -106,6 +110,7 @@ Analyze this architecture diagram.
|
|
|
106
110
|
```
|
|
107
111
|
|
|
108
112
|
### Before/After Comparison
|
|
113
|
+
|
|
109
114
|
```
|
|
110
115
|
Compare these two images.
|
|
111
116
|
- List specific changes
|
|
@@ -114,6 +119,7 @@ Compare these two images.
|
|
|
114
119
|
```
|
|
115
120
|
|
|
116
121
|
### Error Screenshot Debugging
|
|
122
|
+
|
|
117
123
|
```
|
|
118
124
|
Analyze this error screenshot.
|
|
119
125
|
- Read the error message accurately
|
|
@@ -123,21 +129,21 @@ Analyze this error screenshot.
|
|
|
123
129
|
|
|
124
130
|
## Model Selection Guide
|
|
125
131
|
|
|
126
|
-
| Use Case
|
|
127
|
-
|
|
128
|
-
| Quick check
|
|
129
|
-
| Detailed analysis | `gemini-3-pro`
|
|
130
|
-
| Best quality
|
|
132
|
+
| Use Case | Recommended Model | Reason |
|
|
133
|
+
| ----------------- | ----------------- | -------------------------------------- |
|
|
134
|
+
| Quick check | `gemini-3-flash` | Fast, sufficient multimodal capability |
|
|
135
|
+
| Detailed analysis | `gemini-3-pro` | Deeper analysis, longer content |
|
|
136
|
+
| Best quality | `gemini-3.1-pro` | Latest model, best multimodal |
|
|
131
137
|
|
|
132
138
|
## OpenClaw read vs Gemini CLI
|
|
133
139
|
|
|
134
|
-
| Feature
|
|
135
|
-
|
|
136
|
-
| Images (PNG/JPG)
|
|
137
|
-
| PDF
|
|
138
|
-
| Video
|
|
139
|
-
| Multiple files simultaneously | ❌ One at a time
|
|
140
|
-
| Authentication
|
|
140
|
+
| Feature | OpenClaw `read` | Gemini CLI |
|
|
141
|
+
| ----------------------------- | --------------------- | ---------------------------- |
|
|
142
|
+
| Images (PNG/JPG) | ✅ Send as attachment | ✅ Native analysis |
|
|
143
|
+
| PDF | ❌ Text only | ✅ Layout-inclusive analysis |
|
|
144
|
+
| Video | ❌ | ✅ Frame analysis |
|
|
145
|
+
| Multiple files simultaneously | ❌ One at a time | ✅ Multiple `-f` flags |
|
|
146
|
+
| Authentication | Not required | tmux session required |
|
|
141
147
|
|
|
142
148
|
## Workflow: OpenCode + Gemini CLI Integration
|
|
143
149
|
|