aidevops 2.52.1 → 2.53.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +1 -1
- package/VERSION +1 -1
- package/aidevops.sh +15 -9
- package/package.json +4 -4
- package/scripts/npm-postinstall.js +6 -7
- package/setup.sh +1 -1
- package/templates/deploy-templates.sh +144 -0
- package/templates/home/.agent/README.md +33 -0
- package/templates/home/AGENTS.md +96 -0
- package/templates/home/git/.agent/README.md +48 -0
- package/templates/home/git/AGENTS.md +97 -0
- package/templates/standard-functions.sh +179 -0
- package/templates/wordpress-performance-workflow.md +217 -0
- package/.agent/AGENTS.md +0 -614
- package/.agent/accounts.md +0 -65
- package/.agent/aidevops/add-new-mcp-to-aidevops.md +0 -456
- package/.agent/aidevops/api-integrations.md +0 -335
- package/.agent/aidevops/architecture.md +0 -510
- package/.agent/aidevops/configs.md +0 -274
- package/.agent/aidevops/docs.md +0 -244
- package/.agent/aidevops/extension.md +0 -311
- package/.agent/aidevops/mcp-integrations.md +0 -340
- package/.agent/aidevops/mcp-troubleshooting.md +0 -162
- package/.agent/aidevops/memory-patterns.md +0 -172
- package/.agent/aidevops/providers.md +0 -217
- package/.agent/aidevops/recommendations.md +0 -321
- package/.agent/aidevops/requirements.md +0 -301
- package/.agent/aidevops/resources.md +0 -214
- package/.agent/aidevops/security-requirements.md +0 -174
- package/.agent/aidevops/security.md +0 -350
- package/.agent/aidevops/service-links.md +0 -400
- package/.agent/aidevops/services.md +0 -357
- package/.agent/aidevops/setup.md +0 -153
- package/.agent/aidevops/troubleshooting.md +0 -389
- package/.agent/aidevops.md +0 -124
- package/.agent/build-plus.md +0 -244
- package/.agent/content/guidelines.md +0 -109
- package/.agent/content.md +0 -87
- package/.agent/health.md +0 -59
- package/.agent/legal.md +0 -59
- package/.agent/loop-state/full-loop.local.md +0 -16
- package/.agent/loop-state/ralph-loop.local.md +0 -10
- package/.agent/marketing.md +0 -440
- package/.agent/memory/README.md +0 -260
- package/.agent/onboarding.md +0 -796
- package/.agent/plan-plus.md +0 -245
- package/.agent/research.md +0 -100
- package/.agent/sales.md +0 -333
- package/.agent/scripts/101domains-helper.sh +0 -701
- package/.agent/scripts/add-missing-returns.sh +0 -140
- package/.agent/scripts/agent-browser-helper.sh +0 -311
- package/.agent/scripts/agno-setup.sh +0 -712
- package/.agent/scripts/ahrefs-mcp-wrapper.js +0 -168
- package/.agent/scripts/aidevops-update-check.sh +0 -71
- package/.agent/scripts/ampcode-cli.sh +0 -522
- package/.agent/scripts/auto-version-bump.sh +0 -156
- package/.agent/scripts/autogen-helper.sh +0 -512
- package/.agent/scripts/beads-sync-helper.sh +0 -596
- package/.agent/scripts/closte-helper.sh +0 -5
- package/.agent/scripts/cloudron-helper.sh +0 -321
- package/.agent/scripts/codacy-cli-chunked.sh +0 -581
- package/.agent/scripts/codacy-cli.sh +0 -442
- package/.agent/scripts/code-audit-helper.sh +0 -5
- package/.agent/scripts/coderabbit-cli.sh +0 -417
- package/.agent/scripts/coderabbit-pro-analysis.sh +0 -238
- package/.agent/scripts/commands/code-simplifier.md +0 -86
- package/.agent/scripts/commands/full-loop.md +0 -246
- package/.agent/scripts/commands/postflight-loop.md +0 -103
- package/.agent/scripts/commands/recall.md +0 -182
- package/.agent/scripts/commands/remember.md +0 -132
- package/.agent/scripts/commands/save-todo.md +0 -175
- package/.agent/scripts/commands/session-review.md +0 -154
- package/.agent/scripts/comprehensive-quality-fix.sh +0 -106
- package/.agent/scripts/context-builder-helper.sh +0 -522
- package/.agent/scripts/coolify-cli-helper.sh +0 -674
- package/.agent/scripts/coolify-helper.sh +0 -380
- package/.agent/scripts/crawl4ai-examples.sh +0 -401
- package/.agent/scripts/crawl4ai-helper.sh +0 -1078
- package/.agent/scripts/crewai-helper.sh +0 -681
- package/.agent/scripts/dev-browser-helper.sh +0 -513
- package/.agent/scripts/dns-helper.sh +0 -396
- package/.agent/scripts/domain-research-helper.sh +0 -917
- package/.agent/scripts/dspy-helper.sh +0 -285
- package/.agent/scripts/dspyground-helper.sh +0 -291
- package/.agent/scripts/eeat-score-helper.sh +0 -1242
- package/.agent/scripts/efficient-return-fix.sh +0 -92
- package/.agent/scripts/extract-opencode-prompts.sh +0 -128
- package/.agent/scripts/find-missing-returns.sh +0 -113
- package/.agent/scripts/fix-auth-headers.sh +0 -104
- package/.agent/scripts/fix-common-strings.sh +0 -254
- package/.agent/scripts/fix-content-type.sh +0 -100
- package/.agent/scripts/fix-error-messages.sh +0 -130
- package/.agent/scripts/fix-misplaced-returns.sh +0 -74
- package/.agent/scripts/fix-remaining-literals.sh +0 -152
- package/.agent/scripts/fix-return-statements.sh +0 -41
- package/.agent/scripts/fix-s131-default-cases.sh +0 -249
- package/.agent/scripts/fix-sc2155-simple.sh +0 -102
- package/.agent/scripts/fix-shellcheck-critical.sh +0 -187
- package/.agent/scripts/fix-string-literals.sh +0 -273
- package/.agent/scripts/full-loop-helper.sh +0 -773
- package/.agent/scripts/generate-opencode-agents.sh +0 -497
- package/.agent/scripts/generate-opencode-commands.sh +0 -1629
- package/.agent/scripts/generate-skills.sh +0 -366
- package/.agent/scripts/git-platforms-helper.sh +0 -640
- package/.agent/scripts/gitea-cli-helper.sh +0 -743
- package/.agent/scripts/github-cli-helper.sh +0 -702
- package/.agent/scripts/gitlab-cli-helper.sh +0 -682
- package/.agent/scripts/gsc-add-user-helper.sh +0 -325
- package/.agent/scripts/gsc-sitemap-helper.sh +0 -678
- package/.agent/scripts/hetzner-helper.sh +0 -485
- package/.agent/scripts/hostinger-helper.sh +0 -229
- package/.agent/scripts/keyword-research-helper.sh +0 -1815
- package/.agent/scripts/langflow-helper.sh +0 -544
- package/.agent/scripts/linkedin-automation.py +0 -241
- package/.agent/scripts/linter-manager.sh +0 -599
- package/.agent/scripts/linters-local.sh +0 -434
- package/.agent/scripts/list-keys-helper.sh +0 -488
- package/.agent/scripts/local-browser-automation.py +0 -339
- package/.agent/scripts/localhost-helper.sh +0 -744
- package/.agent/scripts/loop-common.sh +0 -806
- package/.agent/scripts/mainwp-helper.sh +0 -728
- package/.agent/scripts/markdown-formatter.sh +0 -338
- package/.agent/scripts/markdown-lint-fix.sh +0 -311
- package/.agent/scripts/mass-fix-returns.sh +0 -58
- package/.agent/scripts/mcp-diagnose.sh +0 -167
- package/.agent/scripts/mcp-inspector-helper.sh +0 -449
- package/.agent/scripts/memory-helper.sh +0 -650
- package/.agent/scripts/monitor-code-review.sh +0 -255
- package/.agent/scripts/onboarding-helper.sh +0 -706
- package/.agent/scripts/opencode-github-setup-helper.sh +0 -797
- package/.agent/scripts/opencode-test-helper.sh +0 -213
- package/.agent/scripts/pagespeed-helper.sh +0 -464
- package/.agent/scripts/pandoc-helper.sh +0 -362
- package/.agent/scripts/postflight-check.sh +0 -555
- package/.agent/scripts/pre-commit-hook.sh +0 -259
- package/.agent/scripts/pre-edit-check.sh +0 -169
- package/.agent/scripts/qlty-cli.sh +0 -356
- package/.agent/scripts/quality-cli-manager.sh +0 -525
- package/.agent/scripts/quality-feedback-helper.sh +0 -462
- package/.agent/scripts/quality-fix.sh +0 -263
- package/.agent/scripts/quality-loop-helper.sh +0 -1108
- package/.agent/scripts/ralph-loop-helper.sh +0 -836
- package/.agent/scripts/ralph-upstream-check.sh +0 -341
- package/.agent/scripts/secretlint-helper.sh +0 -847
- package/.agent/scripts/servers-helper.sh +0 -241
- package/.agent/scripts/ses-helper.sh +0 -619
- package/.agent/scripts/session-review-helper.sh +0 -404
- package/.agent/scripts/setup-linters-wizard.sh +0 -379
- package/.agent/scripts/setup-local-api-keys.sh +0 -330
- package/.agent/scripts/setup-mcp-integrations.sh +0 -472
- package/.agent/scripts/shared-constants.sh +0 -246
- package/.agent/scripts/site-crawler-helper.sh +0 -1487
- package/.agent/scripts/snyk-helper.sh +0 -940
- package/.agent/scripts/sonarcloud-autofix.sh +0 -193
- package/.agent/scripts/sonarcloud-cli.sh +0 -191
- package/.agent/scripts/sonarscanner-cli.sh +0 -455
- package/.agent/scripts/spaceship-helper.sh +0 -747
- package/.agent/scripts/stagehand-helper.sh +0 -321
- package/.agent/scripts/stagehand-python-helper.sh +0 -321
- package/.agent/scripts/stagehand-python-setup.sh +0 -441
- package/.agent/scripts/stagehand-setup.sh +0 -439
- package/.agent/scripts/system-cleanup.sh +0 -340
- package/.agent/scripts/terminal-title-helper.sh +0 -388
- package/.agent/scripts/terminal-title-setup.sh +0 -549
- package/.agent/scripts/test-stagehand-both-integration.sh +0 -317
- package/.agent/scripts/test-stagehand-integration.sh +0 -309
- package/.agent/scripts/test-stagehand-python-integration.sh +0 -341
- package/.agent/scripts/todo-ready.sh +0 -263
- package/.agent/scripts/tool-version-check.sh +0 -362
- package/.agent/scripts/toon-helper.sh +0 -469
- package/.agent/scripts/twilio-helper.sh +0 -917
- package/.agent/scripts/updown-helper.sh +0 -279
- package/.agent/scripts/validate-mcp-integrations.sh +0 -250
- package/.agent/scripts/validate-version-consistency.sh +0 -131
- package/.agent/scripts/vaultwarden-helper.sh +0 -597
- package/.agent/scripts/vercel-cli-helper.sh +0 -816
- package/.agent/scripts/verify-mirrors.sh +0 -169
- package/.agent/scripts/version-manager.sh +0 -831
- package/.agent/scripts/webhosting-helper.sh +0 -471
- package/.agent/scripts/webhosting-verify.sh +0 -238
- package/.agent/scripts/wordpress-mcp-helper.sh +0 -508
- package/.agent/scripts/worktree-helper.sh +0 -595
- package/.agent/scripts/worktree-sessions.sh +0 -577
- package/.agent/seo/dataforseo.md +0 -215
- package/.agent/seo/domain-research.md +0 -532
- package/.agent/seo/eeat-score.md +0 -659
- package/.agent/seo/google-search-console.md +0 -366
- package/.agent/seo/gsc-sitemaps.md +0 -282
- package/.agent/seo/keyword-research.md +0 -521
- package/.agent/seo/serper.md +0 -278
- package/.agent/seo/site-crawler.md +0 -387
- package/.agent/seo.md +0 -236
- package/.agent/services/accounting/quickfile.md +0 -159
- package/.agent/services/communications/telfon.md +0 -470
- package/.agent/services/communications/twilio.md +0 -569
- package/.agent/services/crm/fluentcrm.md +0 -449
- package/.agent/services/email/ses.md +0 -399
- package/.agent/services/hosting/101domains.md +0 -378
- package/.agent/services/hosting/closte.md +0 -177
- package/.agent/services/hosting/cloudflare.md +0 -251
- package/.agent/services/hosting/cloudron.md +0 -478
- package/.agent/services/hosting/dns-providers.md +0 -335
- package/.agent/services/hosting/domain-purchasing.md +0 -344
- package/.agent/services/hosting/hetzner.md +0 -327
- package/.agent/services/hosting/hostinger.md +0 -287
- package/.agent/services/hosting/localhost.md +0 -419
- package/.agent/services/hosting/spaceship.md +0 -353
- package/.agent/services/hosting/webhosting.md +0 -330
- package/.agent/social-media.md +0 -69
- package/.agent/templates/plans-template.md +0 -114
- package/.agent/templates/prd-template.md +0 -129
- package/.agent/templates/tasks-template.md +0 -108
- package/.agent/templates/todo-template.md +0 -89
- package/.agent/tools/ai-assistants/agno.md +0 -471
- package/.agent/tools/ai-assistants/capsolver.md +0 -326
- package/.agent/tools/ai-assistants/configuration.md +0 -221
- package/.agent/tools/ai-assistants/overview.md +0 -209
- package/.agent/tools/ai-assistants/status.md +0 -171
- package/.agent/tools/ai-assistants/windsurf.md +0 -193
- package/.agent/tools/ai-orchestration/autogen.md +0 -406
- package/.agent/tools/ai-orchestration/crewai.md +0 -445
- package/.agent/tools/ai-orchestration/langflow.md +0 -405
- package/.agent/tools/ai-orchestration/openprose.md +0 -487
- package/.agent/tools/ai-orchestration/overview.md +0 -362
- package/.agent/tools/ai-orchestration/packaging.md +0 -647
- package/.agent/tools/browser/agent-browser.md +0 -464
- package/.agent/tools/browser/browser-automation.md +0 -400
- package/.agent/tools/browser/chrome-devtools.md +0 -282
- package/.agent/tools/browser/crawl4ai-integration.md +0 -422
- package/.agent/tools/browser/crawl4ai-resources.md +0 -277
- package/.agent/tools/browser/crawl4ai-usage.md +0 -416
- package/.agent/tools/browser/crawl4ai.md +0 -585
- package/.agent/tools/browser/dev-browser.md +0 -341
- package/.agent/tools/browser/pagespeed.md +0 -260
- package/.agent/tools/browser/playwright.md +0 -266
- package/.agent/tools/browser/playwriter.md +0 -310
- package/.agent/tools/browser/stagehand-examples.md +0 -456
- package/.agent/tools/browser/stagehand-python.md +0 -483
- package/.agent/tools/browser/stagehand.md +0 -421
- package/.agent/tools/build-agent/agent-review.md +0 -224
- package/.agent/tools/build-agent/build-agent.md +0 -784
- package/.agent/tools/build-mcp/aidevops-plugin.md +0 -476
- package/.agent/tools/build-mcp/api-wrapper.md +0 -445
- package/.agent/tools/build-mcp/build-mcp.md +0 -240
- package/.agent/tools/build-mcp/deployment.md +0 -401
- package/.agent/tools/build-mcp/server-patterns.md +0 -632
- package/.agent/tools/build-mcp/transports.md +0 -366
- package/.agent/tools/code-review/auditing.md +0 -383
- package/.agent/tools/code-review/automation.md +0 -219
- package/.agent/tools/code-review/best-practices.md +0 -203
- package/.agent/tools/code-review/codacy.md +0 -151
- package/.agent/tools/code-review/code-simplifier.md +0 -174
- package/.agent/tools/code-review/code-standards.md +0 -309
- package/.agent/tools/code-review/coderabbit.md +0 -101
- package/.agent/tools/code-review/management.md +0 -155
- package/.agent/tools/code-review/qlty.md +0 -248
- package/.agent/tools/code-review/secretlint.md +0 -565
- package/.agent/tools/code-review/setup.md +0 -250
- package/.agent/tools/code-review/snyk.md +0 -563
- package/.agent/tools/code-review/tools.md +0 -230
- package/.agent/tools/content/summarize.md +0 -353
- package/.agent/tools/context/augment-context-engine.md +0 -468
- package/.agent/tools/context/context-builder-agent.md +0 -76
- package/.agent/tools/context/context-builder.md +0 -375
- package/.agent/tools/context/context7.md +0 -371
- package/.agent/tools/context/dspy.md +0 -302
- package/.agent/tools/context/dspyground.md +0 -374
- package/.agent/tools/context/llm-tldr.md +0 -219
- package/.agent/tools/context/osgrep.md +0 -488
- package/.agent/tools/context/prompt-optimization.md +0 -338
- package/.agent/tools/context/toon.md +0 -292
- package/.agent/tools/conversion/pandoc.md +0 -304
- package/.agent/tools/credentials/api-key-management.md +0 -154
- package/.agent/tools/credentials/api-key-setup.md +0 -224
- package/.agent/tools/credentials/environment-variables.md +0 -180
- package/.agent/tools/credentials/vaultwarden.md +0 -382
- package/.agent/tools/data-extraction/outscraper.md +0 -974
- package/.agent/tools/deployment/coolify-cli.md +0 -388
- package/.agent/tools/deployment/coolify-setup.md +0 -353
- package/.agent/tools/deployment/coolify.md +0 -345
- package/.agent/tools/deployment/vercel.md +0 -390
- package/.agent/tools/git/authentication.md +0 -132
- package/.agent/tools/git/gitea-cli.md +0 -193
- package/.agent/tools/git/github-actions.md +0 -207
- package/.agent/tools/git/github-cli.md +0 -223
- package/.agent/tools/git/gitlab-cli.md +0 -190
- package/.agent/tools/git/opencode-github-security.md +0 -350
- package/.agent/tools/git/opencode-github.md +0 -328
- package/.agent/tools/git/opencode-gitlab.md +0 -252
- package/.agent/tools/git/security.md +0 -196
- package/.agent/tools/git.md +0 -207
- package/.agent/tools/opencode/oh-my-opencode.md +0 -375
- package/.agent/tools/opencode/opencode-anthropic-auth.md +0 -446
- package/.agent/tools/opencode/opencode.md +0 -651
- package/.agent/tools/social-media/bird.md +0 -437
- package/.agent/tools/task-management/beads.md +0 -336
- package/.agent/tools/terminal/terminal-title.md +0 -251
- package/.agent/tools/ui/shadcn.md +0 -196
- package/.agent/tools/ui/ui-skills.md +0 -115
- package/.agent/tools/wordpress/localwp.md +0 -311
- package/.agent/tools/wordpress/mainwp.md +0 -391
- package/.agent/tools/wordpress/scf.md +0 -527
- package/.agent/tools/wordpress/wp-admin.md +0 -729
- package/.agent/tools/wordpress/wp-dev.md +0 -940
- package/.agent/tools/wordpress/wp-preferred.md +0 -398
- package/.agent/tools/wordpress.md +0 -95
- package/.agent/workflows/branch/bugfix.md +0 -63
- package/.agent/workflows/branch/chore.md +0 -95
- package/.agent/workflows/branch/experiment.md +0 -115
- package/.agent/workflows/branch/feature.md +0 -59
- package/.agent/workflows/branch/hotfix.md +0 -98
- package/.agent/workflows/branch/refactor.md +0 -92
- package/.agent/workflows/branch/release.md +0 -96
- package/.agent/workflows/branch.md +0 -347
- package/.agent/workflows/bug-fixing.md +0 -267
- package/.agent/workflows/changelog.md +0 -129
- package/.agent/workflows/code-audit-remote.md +0 -279
- package/.agent/workflows/conversation-starter.md +0 -69
- package/.agent/workflows/error-feedback.md +0 -578
- package/.agent/workflows/feature-development.md +0 -355
- package/.agent/workflows/git-workflow.md +0 -702
- package/.agent/workflows/multi-repo-workspace.md +0 -268
- package/.agent/workflows/plans.md +0 -709
- package/.agent/workflows/postflight.md +0 -604
- package/.agent/workflows/pr.md +0 -571
- package/.agent/workflows/preflight.md +0 -278
- package/.agent/workflows/ralph-loop.md +0 -773
- package/.agent/workflows/release.md +0 -498
- package/.agent/workflows/session-manager.md +0 -254
- package/.agent/workflows/session-review.md +0 -311
- package/.agent/workflows/sql-migrations.md +0 -631
- package/.agent/workflows/version-bump.md +0 -283
- package/.agent/workflows/wiki-update.md +0 -333
- package/.agent/workflows/worktree.md +0 -477
package/.agent/seo/serper.md
DELETED
|
@@ -1,278 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
description: Serper MCP for Google Search API integration
|
|
3
|
-
mode: subagent
|
|
4
|
-
tools:
|
|
5
|
-
read: true
|
|
6
|
-
write: false
|
|
7
|
-
edit: false
|
|
8
|
-
bash: true
|
|
9
|
-
glob: true
|
|
10
|
-
grep: true
|
|
11
|
-
webfetch: true
|
|
12
|
-
---
|
|
13
|
-
|
|
14
|
-
# Serper MCP Integration
|
|
15
|
-
|
|
16
|
-
<!-- AI-CONTEXT-START -->
|
|
17
|
-
|
|
18
|
-
## Quick Reference
|
|
19
|
-
|
|
20
|
-
- **Purpose**: Google Search results via Serper API
|
|
21
|
-
- **MCP Package**: `serper-mcp-server` (Python, community)
|
|
22
|
-
- **Auth**: API Key (stored in `~/.config/aidevops/mcp-env.sh`)
|
|
23
|
-
- **Env Var**: `SERPER_API_KEY`
|
|
24
|
-
- **API Dashboard**: https://serper.dev/
|
|
25
|
-
- **GitHub**: https://github.com/garylab/serper-mcp-server
|
|
26
|
-
|
|
27
|
-
**Available Tools**:
|
|
28
|
-
|
|
29
|
-
| Tool | Purpose |
|
|
30
|
-
|------|---------|
|
|
31
|
-
| `google_search` | Web search results |
|
|
32
|
-
| `google_search_images` | Image search results |
|
|
33
|
-
| `google_search_videos` | Video search results |
|
|
34
|
-
| `google_search_places` | Local business/place search |
|
|
35
|
-
| `google_search_maps` | Map search results |
|
|
36
|
-
| `google_search_reviews` | Business reviews |
|
|
37
|
-
| `google_search_news` | News search results |
|
|
38
|
-
| `google_search_shopping` | Shopping/product search |
|
|
39
|
-
| `google_search_lens` | Visual search (Google Lens) |
|
|
40
|
-
| `google_search_scholar` | Academic/scholarly search |
|
|
41
|
-
| `google_search_patents` | Patent search |
|
|
42
|
-
| `google_search_autocomplete` | Search suggestions |
|
|
43
|
-
| `webpage_scrape` | Scrape webpage content |
|
|
44
|
-
|
|
45
|
-
<!-- AI-CONTEXT-END -->
|
|
46
|
-
|
|
47
|
-
## Installation
|
|
48
|
-
|
|
49
|
-
### Via setup.sh (Recommended)
|
|
50
|
-
|
|
51
|
-
The aidevops `setup.sh` script automatically configures the Serper MCP server.
|
|
52
|
-
|
|
53
|
-
### Manual Installation
|
|
54
|
-
|
|
55
|
-
```bash
|
|
56
|
-
# Using uv (recommended)
|
|
57
|
-
uvx serper-mcp-server
|
|
58
|
-
|
|
59
|
-
# Using pip
|
|
60
|
-
pip install serper-mcp-server
|
|
61
|
-
|
|
62
|
-
# Or install globally
|
|
63
|
-
pip3 install serper-mcp-server
|
|
64
|
-
```text
|
|
65
|
-
|
|
66
|
-
## Configuration
|
|
67
|
-
|
|
68
|
-
### Store Credentials
|
|
69
|
-
|
|
70
|
-
```bash
|
|
71
|
-
# Using the secure key management script
|
|
72
|
-
bash ~/.aidevops/agents/scripts/setup-local-api-keys.sh set SERPER_API_KEY "your_api_key"
|
|
73
|
-
```text
|
|
74
|
-
|
|
75
|
-
### OpenCode Configuration
|
|
76
|
-
|
|
77
|
-
Add to `~/.config/opencode/opencode.json`:
|
|
78
|
-
|
|
79
|
-
```json
|
|
80
|
-
{
|
|
81
|
-
"mcp": {
|
|
82
|
-
"serper": {
|
|
83
|
-
"type": "local",
|
|
84
|
-
"command": [
|
|
85
|
-
"/bin/bash",
|
|
86
|
-
"-c",
|
|
87
|
-
"source ~/.config/aidevops/mcp-env.sh && SERPER_API_KEY=$SERPER_API_KEY uvx serper-mcp-server"
|
|
88
|
-
],
|
|
89
|
-
"enabled": true
|
|
90
|
-
}
|
|
91
|
-
}
|
|
92
|
-
}
|
|
93
|
-
```text
|
|
94
|
-
|
|
95
|
-
### Claude Desktop Configuration
|
|
96
|
-
|
|
97
|
-
Add to `~/Library/Application Support/Claude/claude_desktop_config.json`:
|
|
98
|
-
|
|
99
|
-
```json
|
|
100
|
-
{
|
|
101
|
-
"mcpServers": {
|
|
102
|
-
"serper": {
|
|
103
|
-
"command": "uvx",
|
|
104
|
-
"args": ["serper-mcp-server"],
|
|
105
|
-
"env": {
|
|
106
|
-
"SERPER_API_KEY": "your_api_key"
|
|
107
|
-
}
|
|
108
|
-
}
|
|
109
|
-
}
|
|
110
|
-
}
|
|
111
|
-
```text
|
|
112
|
-
|
|
113
|
-
### Cursor Configuration
|
|
114
|
-
|
|
115
|
-
Add to `~/.cursor/mcp.json`:
|
|
116
|
-
|
|
117
|
-
```json
|
|
118
|
-
{
|
|
119
|
-
"mcpServers": {
|
|
120
|
-
"serper": {
|
|
121
|
-
"command": "uvx",
|
|
122
|
-
"args": ["serper-mcp-server"],
|
|
123
|
-
"env": {
|
|
124
|
-
"SERPER_API_KEY": "your_api_key"
|
|
125
|
-
}
|
|
126
|
-
}
|
|
127
|
-
}
|
|
128
|
-
}
|
|
129
|
-
```text
|
|
130
|
-
|
|
131
|
-
### Alternative: Using pip
|
|
132
|
-
|
|
133
|
-
If you prefer pip over uv:
|
|
134
|
-
|
|
135
|
-
```json
|
|
136
|
-
{
|
|
137
|
-
"mcpServers": {
|
|
138
|
-
"serper": {
|
|
139
|
-
"command": "python3",
|
|
140
|
-
"args": ["-m", "serper_mcp_server"],
|
|
141
|
-
"env": {
|
|
142
|
-
"SERPER_API_KEY": "your_api_key"
|
|
143
|
-
}
|
|
144
|
-
}
|
|
145
|
-
}
|
|
146
|
-
}
|
|
147
|
-
```text
|
|
148
|
-
|
|
149
|
-
## Usage Examples
|
|
150
|
-
|
|
151
|
-
### Web Search
|
|
152
|
-
|
|
153
|
-
```javascript
|
|
154
|
-
// Basic Google search
|
|
155
|
-
await serper.google_search({
|
|
156
|
-
q: "best seo tools 2024",
|
|
157
|
-
gl: "us", // Country code
|
|
158
|
-
hl: "en", // Language
|
|
159
|
-
num: 10 // Number of results
|
|
160
|
-
});
|
|
161
|
-
```text
|
|
162
|
-
|
|
163
|
-
### Image Search
|
|
164
|
-
|
|
165
|
-
```javascript
|
|
166
|
-
// Search for images
|
|
167
|
-
await serper.google_search_images({
|
|
168
|
-
q: "seo infographic",
|
|
169
|
-
gl: "us",
|
|
170
|
-
num: 20
|
|
171
|
-
});
|
|
172
|
-
```text
|
|
173
|
-
|
|
174
|
-
### News Search
|
|
175
|
-
|
|
176
|
-
```javascript
|
|
177
|
-
// Get latest news
|
|
178
|
-
await serper.google_search_news({
|
|
179
|
-
q: "google algorithm update",
|
|
180
|
-
gl: "us",
|
|
181
|
-
tbs: "qdr:w" // Past week
|
|
182
|
-
});
|
|
183
|
-
```text
|
|
184
|
-
|
|
185
|
-
### Local/Places Search
|
|
186
|
-
|
|
187
|
-
```javascript
|
|
188
|
-
// Find local businesses
|
|
189
|
-
await serper.google_search_places({
|
|
190
|
-
q: "seo agency",
|
|
191
|
-
location: "New York, NY"
|
|
192
|
-
});
|
|
193
|
-
```text
|
|
194
|
-
|
|
195
|
-
### Shopping Search
|
|
196
|
-
|
|
197
|
-
```javascript
|
|
198
|
-
// Product search
|
|
199
|
-
await serper.google_search_shopping({
|
|
200
|
-
q: "seo software",
|
|
201
|
-
gl: "us"
|
|
202
|
-
});
|
|
203
|
-
```text
|
|
204
|
-
|
|
205
|
-
### Scholar Search
|
|
206
|
-
|
|
207
|
-
```javascript
|
|
208
|
-
// Academic papers
|
|
209
|
-
await serper.google_search_scholar({
|
|
210
|
-
q: "search engine optimization research",
|
|
211
|
-
num: 10
|
|
212
|
-
});
|
|
213
|
-
```text
|
|
214
|
-
|
|
215
|
-
### Webpage Scraping
|
|
216
|
-
|
|
217
|
-
```javascript
|
|
218
|
-
// Scrape a webpage
|
|
219
|
-
await serper.webpage_scrape({
|
|
220
|
-
url: "https://example.com/article"
|
|
221
|
-
});
|
|
222
|
-
```text
|
|
223
|
-
|
|
224
|
-
## Search Parameters
|
|
225
|
-
|
|
226
|
-
Common parameters for all search tools:
|
|
227
|
-
|
|
228
|
-
| Parameter | Description | Example |
|
|
229
|
-
|-----------|-------------|---------|
|
|
230
|
-
| `q` | Search query | `"seo tools"` |
|
|
231
|
-
| `gl` | Country code | `"us"`, `"uk"`, `"de"` |
|
|
232
|
-
| `hl` | Language code | `"en"`, `"es"`, `"fr"` |
|
|
233
|
-
| `num` | Number of results | `10`, `20`, `100` |
|
|
234
|
-
| `page` | Page number | `1`, `2`, `3` |
|
|
235
|
-
| `tbs` | Time filter | `"qdr:d"` (day), `"qdr:w"` (week), `"qdr:m"` (month) |
|
|
236
|
-
|
|
237
|
-
## Verification
|
|
238
|
-
|
|
239
|
-
Test the integration:
|
|
240
|
-
|
|
241
|
-
```text
|
|
242
|
-
Use the Serper MCP to search for "best seo tools 2024" in the United States
|
|
243
|
-
```text
|
|
244
|
-
|
|
245
|
-
Expected: Google search results with titles, URLs, snippets, and related data.
|
|
246
|
-
|
|
247
|
-
## Debugging
|
|
248
|
-
|
|
249
|
-
```bash
|
|
250
|
-
# Using MCP inspector with uvx
|
|
251
|
-
npx @modelcontextprotocol/inspector uvx serper-mcp-server
|
|
252
|
-
|
|
253
|
-
# Or with local development
|
|
254
|
-
git clone https://github.com/garylab/serper-mcp-server.git
|
|
255
|
-
cd serper-mcp-server
|
|
256
|
-
npx @modelcontextprotocol/inspector uv run serper-mcp-server -e SERPER_API_KEY=your_key
|
|
257
|
-
```text
|
|
258
|
-
|
|
259
|
-
## Comparison with DataForSEO
|
|
260
|
-
|
|
261
|
-
| Feature | Serper | DataForSEO |
|
|
262
|
-
|---------|--------|------------|
|
|
263
|
-
| **Focus** | Google Search API | Comprehensive SEO data |
|
|
264
|
-
| **SERP Data** | Yes | Yes |
|
|
265
|
-
| **Keyword Research** | No | Yes |
|
|
266
|
-
| **Backlinks** | No | Yes |
|
|
267
|
-
| **On-Page Analysis** | No | Yes |
|
|
268
|
-
| **Pricing** | Pay-per-search | Subscription |
|
|
269
|
-
| **Best For** | Quick searches | Full SEO workflows |
|
|
270
|
-
|
|
271
|
-
Use Serper for quick Google searches; use DataForSEO for comprehensive SEO analysis.
|
|
272
|
-
|
|
273
|
-
## Resources
|
|
274
|
-
|
|
275
|
-
- **API Dashboard**: https://serper.dev/
|
|
276
|
-
- **GitHub**: https://github.com/garylab/serper-mcp-server
|
|
277
|
-
- **PyPI**: https://pypi.org/project/serper-mcp-server/
|
|
278
|
-
- **API Docs**: https://serper.dev/docs
|
|
package/.agent/seo/site-crawler.md
DELETED
|
@@ -1,387 +0,0 @@
|
|
|
1
|
-
---
|
|
2
|
-
description: SEO site crawler with Screaming Frog-like capabilities
|
|
3
|
-
mode: subagent
|
|
4
|
-
tools:
|
|
5
|
-
read: true
|
|
6
|
-
write: true
|
|
7
|
-
edit: true
|
|
8
|
-
bash: true
|
|
9
|
-
glob: true
|
|
10
|
-
grep: true
|
|
11
|
-
webfetch: true
|
|
12
|
-
task: true
|
|
13
|
-
---
|
|
14
|
-
|
|
15
|
-
# Site Crawler - SEO Spider Agent
|
|
16
|
-
|
|
17
|
-
<!-- AI-CONTEXT-START -->
|
|
18
|
-
|
|
19
|
-
## Quick Reference
|
|
20
|
-
|
|
21
|
-
- **Purpose**: Comprehensive SEO site auditing like Screaming Frog
|
|
22
|
-
- **Helper**: `~/.aidevops/agents/scripts/site-crawler-helper.sh`
|
|
23
|
-
- **Browser Tools**: `tools/browser/crawl4ai.md`, `tools/browser/playwriter.md`
|
|
24
|
-
- **Output**: `~/Downloads/{domain}/{datestamp}/` with `_latest` symlink
|
|
25
|
-
- **Formats**: CSV, XLSX, JSON, HTML reports
|
|
26
|
-
|
|
27
|
-
**Commands**:
|
|
28
|
-
|
|
29
|
-
```bash
|
|
30
|
-
# Full site crawl
|
|
31
|
-
site-crawler-helper.sh crawl https://example.com
|
|
32
|
-
|
|
33
|
-
# Crawl with depth limit
|
|
34
|
-
site-crawler-helper.sh crawl https://example.com --depth 3 --max-urls 500
|
|
35
|
-
|
|
36
|
-
# Specific audits
|
|
37
|
-
site-crawler-helper.sh audit-links https://example.com
|
|
38
|
-
site-crawler-helper.sh audit-meta https://example.com
|
|
39
|
-
site-crawler-helper.sh audit-redirects https://example.com
|
|
40
|
-
|
|
41
|
-
# Export formats
|
|
42
|
-
site-crawler-helper.sh crawl https://example.com --format xlsx
|
|
43
|
-
site-crawler-helper.sh crawl https://example.com --format csv
|
|
44
|
-
|
|
45
|
-
# JavaScript rendering
|
|
46
|
-
site-crawler-helper.sh crawl https://example.com --render-js
|
|
47
|
-
```text
|
|
48
|
-
|
|
49
|
-
**Key Features**:
|
|
50
|
-
|
|
51
|
-
- Broken link detection (4XX, 5XX errors)
|
|
52
|
-
- Redirect chain analysis
|
|
53
|
-
- Meta data auditing (titles, descriptions, robots)
|
|
54
|
-
- Duplicate content detection
|
|
55
|
-
- Structured data extraction
|
|
56
|
-
- XML sitemap generation
|
|
57
|
-
- Internal linking analysis
|
|
58
|
-
- JavaScript rendering support
|
|
59
|
-
|
|
60
|
-
<!-- AI-CONTEXT-END -->
|
|
61
|
-
|
|
62
|
-
## Overview
|
|
63
|
-
|
|
64
|
-
The Site Crawler agent provides Screaming Frog-like SEO auditing capabilities using
|
|
65
|
-
Crawl4AI, Playwriter, and custom scripts. It crawls websites to identify technical
|
|
66
|
-
SEO issues and exports findings to spreadsheets for analysis.
|
|
67
|
-
|
|
68
|
-
## Crawl Capabilities
|
|
69
|
-
|
|
70
|
-
### Core SEO Data Collection
|
|
71
|
-
|
|
72
|
-
| Category | Data Collected |
|
|
73
|
-
|----------|----------------|
|
|
74
|
-
| **URLs** | Address, status code, content type, response time, file size |
|
|
75
|
-
| **Page Titles** | Title text, length, missing/duplicate detection |
|
|
76
|
-
| **Meta Descriptions** | Description text, length, missing/duplicate detection |
|
|
77
|
-
| **Meta Robots** | Index/noindex, follow/nofollow, canonical, robots directives |
|
|
78
|
-
| **Headings** | H1, H2 content, missing/duplicate/multiple detection |
|
|
79
|
-
| **Links** | Internal/external, follow/nofollow, anchor text, broken links |
|
|
80
|
-
| **Images** | URL, alt text, file size, missing alt detection |
|
|
81
|
-
| **Redirects** | Type (301/302/307), chains, loops, final destination |
|
|
82
|
-
| **Canonicals** | Canonical URL, self-referencing, conflicts |
|
|
83
|
-
| **Hreflang** | Language codes, return links, conflicts |
|
|
84
|
-
| **Structured Data** | JSON-LD, Microdata, RDFa extraction and validation |
|
|
85
|
-
|
|
86
|
-
### Advanced Features
|
|
87
|
-
|
|
88
|
-
| Feature | Description |
|
|
89
|
-
|---------|-------------|
|
|
90
|
-
| **JavaScript Rendering** | Crawl SPAs (React, Vue, Angular) via Chromium |
|
|
91
|
-
| **Custom Extraction** | XPath, CSS selectors, regex for any HTML data |
|
|
92
|
-
| **Robots.txt Analysis** | Blocked URLs, directives, crawl delays |
|
|
93
|
-
| **XML Sitemap Analysis** | Parse sitemaps, find orphan/missing pages |
|
|
94
|
-
| **Duplicate Detection** | MD5 hash for exact duplicates, similarity scoring |
|
|
95
|
-
| **Crawl Depth** | Track URL depth in site architecture |
|
|
96
|
-
| **Word Count** | Content length analysis per page |
|
|
97
|
-
|
|
98
|
-
## Usage
|
|
99
|
-
|
|
100
|
-
### Basic Site Crawl
|
|
101
|
-
|
|
102
|
-
```bash
|
|
103
|
-
# Crawl entire site (respects robots.txt)
|
|
104
|
-
site-crawler-helper.sh crawl https://example.com
|
|
105
|
-
|
|
106
|
-
# Output: ~/Downloads/example.com/2025-01-15_143022/
|
|
107
|
-
# - crawl-data.csv
|
|
108
|
-
# - crawl-data.xlsx
|
|
109
|
-
# - broken-links.csv
|
|
110
|
-
# - redirects.csv
|
|
111
|
-
# - meta-issues.csv
|
|
112
|
-
# - summary.json
|
|
113
|
-
```text
|
|
114
|
-
|
|
115
|
-
### Targeted Audits
|
|
116
|
-
|
|
117
|
-
```bash
|
|
118
|
-
# Broken links only
|
|
119
|
-
site-crawler-helper.sh audit-links https://example.com
|
|
120
|
-
|
|
121
|
-
# Meta data audit (titles, descriptions)
|
|
122
|
-
site-crawler-helper.sh audit-meta https://example.com
|
|
123
|
-
|
|
124
|
-
# Redirect audit
|
|
125
|
-
site-crawler-helper.sh audit-redirects https://example.com
|
|
126
|
-
|
|
127
|
-
# Duplicate content check
|
|
128
|
-
site-crawler-helper.sh audit-duplicates https://example.com
|
|
129
|
-
|
|
130
|
-
# Structured data validation
|
|
131
|
-
site-crawler-helper.sh audit-schema https://example.com
|
|
132
|
-
```
|
|
133
|
-
|
|
134
|
-
### Crawl Configuration
|
|
135
|
-
|
|
136
|
-
```bash
|
|
137
|
-
# Limit crawl scope
|
|
138
|
-
site-crawler-helper.sh crawl https://example.com \
|
|
139
|
-
--depth 3 \
|
|
140
|
-
--max-urls 1000 \
|
|
141
|
-
--include "/blog/*" \
|
|
142
|
-
--exclude "/admin/*,/wp-json/*"
|
|
143
|
-
|
|
144
|
-
# JavaScript rendering for SPAs
|
|
145
|
-
site-crawler-helper.sh crawl https://spa-site.com --render-js
|
|
146
|
-
|
|
147
|
-
# Custom user agent
|
|
148
|
-
site-crawler-helper.sh crawl https://example.com --user-agent "Googlebot"
|
|
149
|
-
|
|
150
|
-
# Ignore robots.txt (it is respected by default)
|
|
151
|
-
site-crawler-helper.sh crawl https://example.com --ignore-robots
|
|
152
|
-
```
|
|
153
|
-
|
|
154
|
-
### Export Options
|
|
155
|
-
|
|
156
|
-
```bash
|
|
157
|
-
# CSV export (default)
|
|
158
|
-
site-crawler-helper.sh crawl https://example.com --format csv
|
|
159
|
-
|
|
160
|
-
# Excel export
|
|
161
|
-
site-crawler-helper.sh crawl https://example.com --format xlsx
|
|
162
|
-
|
|
163
|
-
# Both formats
|
|
164
|
-
site-crawler-helper.sh crawl https://example.com --format all
|
|
165
|
-
|
|
166
|
-
# Custom output location
|
|
167
|
-
site-crawler-helper.sh crawl https://example.com --output ~/SEO-Audits/
|
|
168
|
-
```
|
|
169
|
-
|
|
170
|
-
## Output Structure
|
|
171
|
-
|
|
172
|
-
All crawl outputs are organized by domain and timestamp:
|
|
173
|
-
|
|
174
|
-
```text
|
|
175
|
-
~/Downloads/
|
|
176
|
-
└── example.com/
|
|
177
|
-
├── 2025-01-15_143022/
|
|
178
|
-
│ ├── crawl-data.xlsx # Full crawl data
|
|
179
|
-
│ ├── crawl-data.csv # Full crawl data (CSV)
|
|
180
|
-
│ ├── broken-links.csv # 4XX/5XX errors
|
|
181
|
-
│ ├── redirects.csv # All redirects with chains
|
|
182
|
-
│ ├── meta-issues.csv # Title/description issues
|
|
183
|
-
│ ├── duplicate-content.csv # Duplicate pages
|
|
184
|
-
│ ├── images.csv # Image audit
|
|
185
|
-
│ ├── internal-links.csv # Link structure
|
|
186
|
-
│ ├── external-links.csv # Outbound links
|
|
187
|
-
│ ├── structured-data.json # Schema.org data
|
|
188
|
-
│ └── summary.json # Crawl statistics
|
|
189
|
-
├── 2025-01-10_091500/
|
|
190
|
-
│ └── ...
|
|
191
|
-
└── _latest -> 2025-01-15_143022 # Symlink to latest
|
|
192
|
-
```
|
|
193
|
-
|
|
194
|
-
## Spreadsheet Columns
|
|
195
|
-
|
|
196
|
-
### Main Crawl Data (crawl-data.xlsx)
|
|
197
|
-
|
|
198
|
-
| Column | Description |
|
|
199
|
-
|--------|-------------|
|
|
200
|
-
| URL | Full page URL |
|
|
201
|
-
| Status Code | HTTP response code |
|
|
202
|
-
| Status | OK, Redirect, Client Error, Server Error |
|
|
203
|
-
| Content Type | MIME type |
|
|
204
|
-
| Title | Page title |
|
|
205
|
-
| Title Length | Character count |
|
|
206
|
-
| Meta Description | Description content |
|
|
207
|
-
| Description Length | Character count |
|
|
208
|
-
| H1 | First H1 content |
|
|
209
|
-
| H1 Count | Number of H1 tags |
|
|
210
|
-
| H2 | First H2 content |
|
|
211
|
-
| H2 Count | Number of H2 tags |
|
|
212
|
-
| Canonical | Canonical URL |
|
|
213
|
-
| Meta Robots | Robots directives |
|
|
214
|
-
| Word Count | Text content word count |
|
|
215
|
-
| Response Time | Server response in ms |
|
|
216
|
-
| File Size | Page size in bytes |
|
|
217
|
-
| Crawl Depth | Clicks from homepage |
|
|
218
|
-
| Inlinks | Number of internal links to page |
|
|
219
|
-
| Outlinks | Number of links from page |
|
|
220
|
-
| External Links | Number of external links |
|
|
221
|
-
| Images | Number of images |
|
|
222
|
-
| Images Missing Alt | Images without alt text |
|
|
223
|
-
|
|
224
|
-
### Broken Links Report
|
|
225
|
-
|
|
226
|
-
| Column | Description |
|
|
227
|
-
|--------|-------------|
|
|
228
|
-
| Broken URL | The 4XX/5XX URL |
|
|
229
|
-
| Status Code | Error code |
|
|
230
|
-
| Source URL | Page containing the link |
|
|
231
|
-
| Anchor Text | Link text |
|
|
232
|
-
| Link Type | Internal/External |
|
|
233
|
-
|
|
234
|
-
### Redirect Report
|
|
235
|
-
|
|
236
|
-
| Column | Description |
|
|
237
|
-
|--------|-------------|
|
|
238
|
-
| Original URL | Starting URL |
|
|
239
|
-
| Status Code | 301/302/307/308 |
|
|
240
|
-
| Redirect URL | Target URL |
|
|
241
|
-
| Final URL | End of chain |
|
|
242
|
-
| Chain Length | Number of hops |
|
|
243
|
-
| Chain | Full redirect path |
|
|
244
|
-
|
|
245
|
-
## Integration with Other Agents
|
|
246
|
-
|
|
247
|
-
### With E-E-A-T Score Agent
|
|
248
|
-
|
|
249
|
-
```bash
|
|
250
|
-
# Crawl site first
|
|
251
|
-
site-crawler-helper.sh crawl https://example.com --format json
|
|
252
|
-
|
|
253
|
-
# Then run E-E-A-T analysis on crawled pages
|
|
254
|
-
eeat-score-helper.sh analyze ~/Downloads/example.com/_latest/crawl-data.json
|
|
255
|
-
```
|
|
256
|
-
|
|
257
|
-
### With PageSpeed Agent
|
|
258
|
-
|
|
259
|
-
```bash
|
|
260
|
-
# Crawl and get performance data
|
|
261
|
-
site-crawler-helper.sh crawl https://example.com --include-pagespeed
|
|
262
|
-
```
|
|
263
|
-
|
|
264
|
-
### With Crawl4AI
|
|
265
|
-
|
|
266
|
-
The site crawler uses Crawl4AI for:
|
|
267
|
-
- JavaScript rendering
|
|
268
|
-
- Structured data extraction
|
|
269
|
-
- LLM-powered content analysis
|
|
270
|
-
- CAPTCHA handling (with CapSolver)
|
|
271
|
-
|
|
272
|
-
See `tools/browser/crawl4ai.md` for advanced configuration.
|
|
273
|
-
|
|
274
|
-
## Browser Automation
|
|
275
|
-
|
|
276
|
-
For sites requiring authentication or complex interactions:
|
|
277
|
-
|
|
278
|
-
```bash
|
|
279
|
-
# Use Playwriter for authenticated crawls
|
|
280
|
-
site-crawler-helper.sh crawl https://example.com \
|
|
281
|
-
--auth-type form \
|
|
282
|
-
--login-url https://example.com/login \
|
|
283
|
-
--username user@example.com \
|
|
284
|
-
--password-env SITE_PASSWORD
|
|
285
|
-
```
|
|
286
|
-
|
|
287
|
-
See `tools/browser/playwriter.md` for browser automation details.
|
|
288
|
-
|
|
289
|
-
## XML Sitemap Generation
|
|
290
|
-
|
|
291
|
-
```bash
|
|
292
|
-
# Generate sitemap from crawl
|
|
293
|
-
site-crawler-helper.sh generate-sitemap https://example.com
|
|
294
|
-
|
|
295
|
-
# Output: ~/Downloads/example.com/_latest/sitemap.xml
|
|
296
|
-
|
|
297
|
-
# With configuration
|
|
298
|
-
site-crawler-helper.sh generate-sitemap https://example.com \
|
|
299
|
-
--changefreq weekly \
|
|
300
|
-
--priority-rules "/blog/*:0.8,/*:0.5" \
|
|
301
|
-
--exclude "/admin/*,/private/*"
|
|
302
|
-
```
|
|
303
|
-
|
|
304
|
-
## Crawl Comparison
|
|
305
|
-
|
|
306
|
-
Compare two crawls to track changes:
|
|
307
|
-
|
|
308
|
-
```bash
|
|
309
|
-
# Compare latest with previous
|
|
310
|
-
site-crawler-helper.sh compare https://example.com
|
|
311
|
-
|
|
312
|
-
# Compare specific crawls
|
|
313
|
-
site-crawler-helper.sh compare \
|
|
314
|
-
~/Downloads/example.com/2025-01-10_091500 \
|
|
315
|
-
~/Downloads/example.com/2025-01-15_143022
|
|
316
|
-
|
|
317
|
-
# Output: changes-report.xlsx with:
|
|
318
|
-
# - New URLs
|
|
319
|
-
# - Removed URLs
|
|
320
|
-
# - Changed titles/descriptions
|
|
321
|
-
# - New/fixed broken links
|
|
322
|
-
# - Redirect changes
|
|
323
|
-
```
|
|
324
|
-
|
|
325
|
-
## Configuration File
|
|
326
|
-
|
|
327
|
-
Create `~/.config/aidevops/site-crawler.json` for defaults:
|
|
328
|
-
|
|
329
|
-
```json
|
|
330
|
-
{
|
|
331
|
-
"default_depth": 10,
|
|
332
|
-
"max_urls": 10000,
|
|
333
|
-
"respect_robots": true,
|
|
334
|
-
"render_js": false,
|
|
335
|
-
"user_agent": "AIDevOps-Crawler/1.0",
|
|
336
|
-
"request_delay": 100,
|
|
337
|
-
"concurrent_requests": 5,
|
|
338
|
-
"timeout": 30,
|
|
339
|
-
"output_format": "xlsx",
|
|
340
|
-
"output_directory": "~/Downloads",
|
|
341
|
-
"exclude_patterns": [
|
|
342
|
-
"/wp-admin/*",
|
|
343
|
-
"/wp-json/*",
|
|
344
|
-
"*.pdf",
|
|
345
|
-
"*.zip"
|
|
346
|
-
]
|
|
347
|
-
}
|
|
348
|
-
```
|
|
349
|
-
|
|
350
|
-
## Rate Limiting & Politeness
|
|
351
|
-
|
|
352
|
-
The crawler respects website resources:
|
|
353
|
-
|
|
354
|
-
- **Robots.txt**: Honored by default (override with `--ignore-robots`)
|
|
355
|
-
- **Crawl-delay**: Respected from robots.txt
|
|
356
|
-
- **Request delay**: Configurable delay between requests
|
|
357
|
-
- **Concurrent requests**: Limited to avoid overwhelming servers
|
|
358
|
-
|
|
359
|
-
## Troubleshooting
|
|
360
|
-
|
|
361
|
-
### Common Issues
|
|
362
|
-
|
|
363
|
-
| Issue | Solution |
|
|
364
|
-
|-------|----------|
|
|
365
|
-
| Crawl blocked | Check robots.txt, try different user-agent |
|
|
366
|
-
| JavaScript not rendering | Use `--render-js` flag |
|
|
367
|
-
| Missing pages | Increase `--depth` or check internal linking |
|
|
368
|
-
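| Slow crawl | Increase `--concurrent-requests` or lower `--request-delay`; if the server is throttling or timing out, reduce `--concurrent-requests` or increase `--request-delay` instead |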
|
|
369
|
-
| Memory issues | Reduce `--max-urls` or use disk storage mode |
|
|
370
|
-
|
|
371
|
-
### Debug Mode
|
|
372
|
-
|
|
373
|
-
```bash
|
|
374
|
-
# Verbose output
|
|
375
|
-
site-crawler-helper.sh crawl https://example.com --verbose
|
|
376
|
-
|
|
377
|
-
# Save raw HTML for inspection
|
|
378
|
-
site-crawler-helper.sh crawl https://example.com --save-html
|
|
379
|
-
```
|
|
380
|
-
|
|
381
|
-
## Related Agents
|
|
382
|
-
|
|
383
|
-
- `seo/eeat-score.md` - E-E-A-T content quality scoring
|
|
384
|
-
- `tools/browser/crawl4ai.md` - AI-powered web crawling
|
|
385
|
-
- `tools/browser/playwriter.md` - Browser automation
|
|
386
|
-
- `tools/browser/pagespeed.md` - Performance auditing
|
|
387
|
-
- `seo/google-search-console.md` - Search performance data
|