@agenticmail/enterprise 0.5.327 → 0.5.329
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/dist/agent-tools-F3CYENMK.js +13949 -0
- package/dist/browser-tool-P57PLVW2.js +4002 -0
- package/dist/chunk-3RI3AIJN.js +1519 -0
- package/dist/chunk-AD4DFKHR.js +4928 -0
- package/dist/chunk-UQXPVWXG.js +5101 -0
- package/dist/cli-agent-K6UFZRXC.js +2473 -0
- package/dist/cli-serve-4MT7RDEL.js +260 -0
- package/dist/cli.js +3 -3
- package/dist/dashboard/app.js +1 -1
- package/dist/dashboard/components/transport-encryption.js +0 -62
- package/dist/dashboard/pages/agent-detail/index.js +5 -2
- package/dist/dashboard/pages/agent-detail/manager.js +1 -1
- package/dist/dashboard/pages/agent-detail/overview.js +4 -2
- package/dist/dashboard/pages/agent-detail/tool-security.js +1 -1
- package/dist/dashboard/pages/domain-status.js +3 -6
- package/dist/dashboard/pages/memory-transfer.js +1 -1
- package/dist/dashboard/pages/messages.js +0 -1
- package/dist/dashboard/pages/roles.js +0 -2
- package/dist/dashboard/pages/workforce.js +0 -1
- package/dist/index.js +3 -3
- package/dist/runtime-L5ADJORP.js +45 -0
- package/dist/server-KSN56EZQ.js +28 -0
- package/dist/setup-UUNBBOQH.js +20 -0
- package/logs/cloudflared-error.log +42 -0
- package/logs/enterprise-out.log +6 -0
- package/package.json +1 -1
- package/src/admin/page-registry.ts +0 -290
- package/src/admin/routes.ts +0 -2968
- package/src/agent-tools/common.ts +0 -260
- package/src/agent-tools/index.ts +0 -542
- package/src/agent-tools/merge.ts +0 -62
- package/src/agent-tools/middleware.ts +0 -436
- package/src/agent-tools/schema/typebox.ts +0 -25
- package/src/agent-tools/security.ts +0 -352
- package/src/agent-tools/tool-resolver.ts +0 -1018
- package/src/agent-tools/tools/agenticmail.ts +0 -1017
- package/src/agent-tools/tools/bash.ts +0 -179
- package/src/agent-tools/tools/browser-tool.schema.ts +0 -112
- package/src/agent-tools/tools/browser-tool.ts +0 -388
- package/src/agent-tools/tools/browser.ts +0 -764
- package/src/agent-tools/tools/edit.ts +0 -100
- package/src/agent-tools/tools/enterprise-code-sandbox.ts +0 -395
- package/src/agent-tools/tools/enterprise-database.ts +0 -377
- package/src/agent-tools/tools/enterprise-diff.ts +0 -580
- package/src/agent-tools/tools/enterprise-documents.ts +0 -896
- package/src/agent-tools/tools/enterprise-http.ts +0 -485
- package/src/agent-tools/tools/enterprise-security-scan.ts +0 -528
- package/src/agent-tools/tools/enterprise-spreadsheet.ts +0 -825
- package/src/agent-tools/tools/glob.ts +0 -129
- package/src/agent-tools/tools/google/calendar.ts +0 -230
- package/src/agent-tools/tools/google/chat.ts +0 -725
- package/src/agent-tools/tools/google/contacts.ts +0 -209
- package/src/agent-tools/tools/google/docs.ts +0 -162
- package/src/agent-tools/tools/google/drive.ts +0 -392
- package/src/agent-tools/tools/google/forms.ts +0 -367
- package/src/agent-tools/tools/google/gmail.ts +0 -897
- package/src/agent-tools/tools/google/index.ts +0 -86
- package/src/agent-tools/tools/google/maps.ts +0 -543
- package/src/agent-tools/tools/google/meeting-voice.ts +0 -885
- package/src/agent-tools/tools/google/meetings.ts +0 -1094
- package/src/agent-tools/tools/google/sheets.ts +0 -215
- package/src/agent-tools/tools/google/slides.ts +0 -559
- package/src/agent-tools/tools/google/tasks.ts +0 -200
- package/src/agent-tools/tools/grep.ts +0 -178
- package/src/agent-tools/tools/integrations/_factory.ts +0 -102
- package/src/agent-tools/tools/integrations/activecampaign.ts +0 -14
- package/src/agent-tools/tools/integrations/adobe-sign.ts +0 -14
- package/src/agent-tools/tools/integrations/adp.ts +0 -14
- package/src/agent-tools/tools/integrations/airtable.ts +0 -14
- package/src/agent-tools/tools/integrations/apollo.ts +0 -14
- package/src/agent-tools/tools/integrations/asana.ts +0 -14
- package/src/agent-tools/tools/integrations/auth0.ts +0 -14
- package/src/agent-tools/tools/integrations/aws.ts +0 -14
- package/src/agent-tools/tools/integrations/azure-devops.ts +0 -14
- package/src/agent-tools/tools/integrations/bamboohr.ts +0 -14
- package/src/agent-tools/tools/integrations/basecamp.ts +0 -14
- package/src/agent-tools/tools/integrations/bigcommerce.ts +0 -14
- package/src/agent-tools/tools/integrations/bitbucket.ts +0 -14
- package/src/agent-tools/tools/integrations/box.ts +0 -14
- package/src/agent-tools/tools/integrations/brex.ts +0 -14
- package/src/agent-tools/tools/integrations/buffer.ts +0 -14
- package/src/agent-tools/tools/integrations/calendly.ts +0 -14
- package/src/agent-tools/tools/integrations/canva.ts +0 -14
- package/src/agent-tools/tools/integrations/chargebee.ts +0 -14
- package/src/agent-tools/tools/integrations/circleci.ts +0 -14
- package/src/agent-tools/tools/integrations/clickup.ts +0 -14
- package/src/agent-tools/tools/integrations/close.ts +0 -14
- package/src/agent-tools/tools/integrations/cloudflare.ts +0 -14
- package/src/agent-tools/tools/integrations/confluence.ts +0 -14
- package/src/agent-tools/tools/integrations/contentful.ts +0 -14
- package/src/agent-tools/tools/integrations/copper.ts +0 -14
- package/src/agent-tools/tools/integrations/crisp.ts +0 -14
- package/src/agent-tools/tools/integrations/crowdstrike.ts +0 -14
- package/src/agent-tools/tools/integrations/datadog.ts +0 -14
- package/src/agent-tools/tools/integrations/digitalocean.ts +0 -14
- package/src/agent-tools/tools/integrations/discord.ts +0 -14
- package/src/agent-tools/tools/integrations/docker.ts +0 -14
- package/src/agent-tools/tools/integrations/docusign.ts +0 -14
- package/src/agent-tools/tools/integrations/drift.ts +0 -14
- package/src/agent-tools/tools/integrations/dropbox.ts +0 -14
- package/src/agent-tools/tools/integrations/figma.ts +0 -14
- package/src/agent-tools/tools/integrations/firebase.ts +0 -14
- package/src/agent-tools/tools/integrations/flyio.ts +0 -14
- package/src/agent-tools/tools/integrations/freshbooks.ts +0 -14
- package/src/agent-tools/tools/integrations/freshdesk.ts +0 -14
- package/src/agent-tools/tools/integrations/freshsales.ts +0 -14
- package/src/agent-tools/tools/integrations/freshservice.ts +0 -14
- package/src/agent-tools/tools/integrations/front.ts +0 -14
- package/src/agent-tools/tools/integrations/github-actions.ts +0 -14
- package/src/agent-tools/tools/integrations/github.ts +0 -14
- package/src/agent-tools/tools/integrations/gitlab.ts +0 -14
- package/src/agent-tools/tools/integrations/gong.ts +0 -14
- package/src/agent-tools/tools/integrations/google-ads.ts +0 -14
- package/src/agent-tools/tools/integrations/google-analytics.ts +0 -14
- package/src/agent-tools/tools/integrations/google-cloud.ts +0 -14
- package/src/agent-tools/tools/integrations/gotomeeting.ts +0 -14
- package/src/agent-tools/tools/integrations/grafana.ts +0 -14
- package/src/agent-tools/tools/integrations/greenhouse.ts +0 -14
- package/src/agent-tools/tools/integrations/gusto.ts +0 -14
- package/src/agent-tools/tools/integrations/hashicorp-vault.ts +0 -14
- package/src/agent-tools/tools/integrations/heroku.ts +0 -14
- package/src/agent-tools/tools/integrations/hibob.ts +0 -14
- package/src/agent-tools/tools/integrations/hootsuite.ts +0 -14
- package/src/agent-tools/tools/integrations/hubspot.ts +0 -14
- package/src/agent-tools/tools/integrations/huggingface.ts +0 -14
- package/src/agent-tools/tools/integrations/index.ts +0 -474
- package/src/agent-tools/tools/integrations/intercom.ts +0 -14
- package/src/agent-tools/tools/integrations/jira.ts +0 -14
- package/src/agent-tools/tools/integrations/klaviyo.ts +0 -14
- package/src/agent-tools/tools/integrations/kubernetes.ts +0 -14
- package/src/agent-tools/tools/integrations/lattice.ts +0 -14
- package/src/agent-tools/tools/integrations/launchdarkly.ts +0 -14
- package/src/agent-tools/tools/integrations/lever.ts +0 -14
- package/src/agent-tools/tools/integrations/linear.ts +0 -14
- package/src/agent-tools/tools/integrations/linkedin.ts +0 -14
- package/src/agent-tools/tools/integrations/livechat.ts +0 -14
- package/src/agent-tools/tools/integrations/loom.ts +0 -14
- package/src/agent-tools/tools/integrations/mailchimp.ts +0 -14
- package/src/agent-tools/tools/integrations/mailgun.ts +0 -14
- package/src/agent-tools/tools/integrations/miro.ts +0 -14
- package/src/agent-tools/tools/integrations/mixpanel.ts +0 -14
- package/src/agent-tools/tools/integrations/monday.ts +0 -14
- package/src/agent-tools/tools/integrations/mongodb-atlas.ts +0 -14
- package/src/agent-tools/tools/integrations/neon.ts +0 -14
- package/src/agent-tools/tools/integrations/netlify.ts +0 -14
- package/src/agent-tools/tools/integrations/netsuite.ts +0 -14
- package/src/agent-tools/tools/integrations/newrelic.ts +0 -14
- package/src/agent-tools/tools/integrations/notion.ts +0 -14
- package/src/agent-tools/tools/integrations/okta.ts +0 -14
- package/src/agent-tools/tools/integrations/openai.ts +0 -14
- package/src/agent-tools/tools/integrations/opsgenie.ts +0 -14
- package/src/agent-tools/tools/integrations/outreach.ts +0 -14
- package/src/agent-tools/tools/integrations/paddle.ts +0 -14
- package/src/agent-tools/tools/integrations/pagerduty.ts +0 -14
- package/src/agent-tools/tools/integrations/pandadoc.ts +0 -14
- package/src/agent-tools/tools/integrations/paypal.ts +0 -14
- package/src/agent-tools/tools/integrations/personio.ts +0 -14
- package/src/agent-tools/tools/integrations/pinecone.ts +0 -14
- package/src/agent-tools/tools/integrations/pipedrive.ts +0 -14
- package/src/agent-tools/tools/integrations/plaid.ts +0 -14
- package/src/agent-tools/tools/integrations/postmark.ts +0 -14
- package/src/agent-tools/tools/integrations/power-automate.ts +0 -14
- package/src/agent-tools/tools/integrations/quickbooks.ts +0 -14
- package/src/agent-tools/tools/integrations/recurly.ts +0 -14
- package/src/agent-tools/tools/integrations/reddit.ts +0 -14
- package/src/agent-tools/tools/integrations/render.ts +0 -14
- package/src/agent-tools/tools/integrations/ringcentral.ts +0 -14
- package/src/agent-tools/tools/integrations/rippling.ts +0 -14
- package/src/agent-tools/tools/integrations/salesforce.ts +0 -14
- package/src/agent-tools/tools/integrations/salesloft.ts +0 -14
- package/src/agent-tools/tools/integrations/sanity.ts +0 -14
- package/src/agent-tools/tools/integrations/sap.ts +0 -14
- package/src/agent-tools/tools/integrations/segment.ts +0 -14
- package/src/agent-tools/tools/integrations/sendgrid.ts +0 -14
- package/src/agent-tools/tools/integrations/sentry.ts +0 -14
- package/src/agent-tools/tools/integrations/servicenow.ts +0 -14
- package/src/agent-tools/tools/integrations/shopify.ts +0 -14
- package/src/agent-tools/tools/integrations/shortcut.ts +0 -14
- package/src/agent-tools/tools/integrations/slack.ts +0 -14
- package/src/agent-tools/tools/integrations/smartsheet.ts +0 -14
- package/src/agent-tools/tools/integrations/snowflake.ts +0 -14
- package/src/agent-tools/tools/integrations/snyk.ts +0 -14
- package/src/agent-tools/tools/integrations/splunk.ts +0 -14
- package/src/agent-tools/tools/integrations/square.ts +0 -14
- package/src/agent-tools/tools/integrations/statuspage.ts +0 -14
- package/src/agent-tools/tools/integrations/stripe.ts +0 -14
- package/src/agent-tools/tools/integrations/supabase.ts +0 -14
- package/src/agent-tools/tools/integrations/teamwork.ts +0 -14
- package/src/agent-tools/tools/integrations/telegram.ts +0 -14
- package/src/agent-tools/tools/integrations/terraform.ts +0 -14
- package/src/agent-tools/tools/integrations/todoist.ts +0 -14
- package/src/agent-tools/tools/integrations/trello.ts +0 -14
- package/src/agent-tools/tools/integrations/twilio.ts +0 -14
- package/src/agent-tools/tools/integrations/twitter.ts +0 -14
- package/src/agent-tools/tools/integrations/vercel.ts +0 -14
- package/src/agent-tools/tools/integrations/weaviate.ts +0 -14
- package/src/agent-tools/tools/integrations/webex.ts +0 -14
- package/src/agent-tools/tools/integrations/webflow.ts +0 -14
- package/src/agent-tools/tools/integrations/whatsapp.ts +0 -14
- package/src/agent-tools/tools/integrations/whereby.ts +0 -14
- package/src/agent-tools/tools/integrations/woocommerce.ts +0 -14
- package/src/agent-tools/tools/integrations/wordpress.ts +0 -14
- package/src/agent-tools/tools/integrations/workday.ts +0 -14
- package/src/agent-tools/tools/integrations/wrike.ts +0 -14
- package/src/agent-tools/tools/integrations/xero.ts +0 -14
- package/src/agent-tools/tools/integrations/youtube.ts +0 -14
- package/src/agent-tools/tools/integrations/zendesk.ts +0 -14
- package/src/agent-tools/tools/integrations/zoho-crm.ts +0 -14
- package/src/agent-tools/tools/integrations/zoom.ts +0 -14
- package/src/agent-tools/tools/integrations/zuora.ts +0 -14
- package/src/agent-tools/tools/knowledge-search.ts +0 -318
- package/src/agent-tools/tools/local/coding.ts +0 -626
- package/src/agent-tools/tools/local/dependency-manager.ts +0 -647
- package/src/agent-tools/tools/local/file-edit.ts +0 -31
- package/src/agent-tools/tools/local/file-list.ts +0 -39
- package/src/agent-tools/tools/local/file-ops.ts +0 -48
- package/src/agent-tools/tools/local/file-read.ts +0 -39
- package/src/agent-tools/tools/local/file-search.ts +0 -46
- package/src/agent-tools/tools/local/file-write.ts +0 -28
- package/src/agent-tools/tools/local/filesystem.ts +0 -5
- package/src/agent-tools/tools/local/index.ts +0 -55
- package/src/agent-tools/tools/local/resolve-path.ts +0 -18
- package/src/agent-tools/tools/local/shell.ts +0 -277
- package/src/agent-tools/tools/local/system-info.ts +0 -29
- package/src/agent-tools/tools/management.ts +0 -425
- package/src/agent-tools/tools/mcp-bridge.ts +0 -142
- package/src/agent-tools/tools/mcp-server-tools.ts +0 -91
- package/src/agent-tools/tools/meeting-lifecycle.ts +0 -438
- package/src/agent-tools/tools/memory.ts +0 -509
- package/src/agent-tools/tools/messaging/index.ts +0 -6
- package/src/agent-tools/tools/messaging/telegram.ts +0 -167
- package/src/agent-tools/tools/messaging/whatsapp.ts +0 -651
- package/src/agent-tools/tools/microsoft/contacts.ts +0 -176
- package/src/agent-tools/tools/microsoft/excel-vba.ts +0 -331
- package/src/agent-tools/tools/microsoft/excel.ts +0 -261
- package/src/agent-tools/tools/microsoft/graph-api.ts +0 -161
- package/src/agent-tools/tools/microsoft/index.ts +0 -95
- package/src/agent-tools/tools/microsoft/onedrive.ts +0 -429
- package/src/agent-tools/tools/microsoft/onenote.ts +0 -186
- package/src/agent-tools/tools/microsoft/outlook-calendar.ts +0 -286
- package/src/agent-tools/tools/microsoft/outlook-mail.ts +0 -723
- package/src/agent-tools/tools/microsoft/planner.ts +0 -200
- package/src/agent-tools/tools/microsoft/powerbi.ts +0 -266
- package/src/agent-tools/tools/microsoft/powerpoint.ts +0 -186
- package/src/agent-tools/tools/microsoft/sharepoint.ts +0 -328
- package/src/agent-tools/tools/microsoft/teams.ts +0 -463
- package/src/agent-tools/tools/microsoft/todo.ts +0 -181
- package/src/agent-tools/tools/oauth-token-provider.ts +0 -101
- package/src/agent-tools/tools/read.ts +0 -160
- package/src/agent-tools/tools/visual-memory/capture.ts +0 -217
- package/src/agent-tools/tools/visual-memory/diff.ts +0 -283
- package/src/agent-tools/tools/visual-memory/index.ts +0 -698
- package/src/agent-tools/tools/visual-memory/phash.ts +0 -120
- package/src/agent-tools/tools/visual-memory/similarity.ts +0 -354
- package/src/agent-tools/tools/visual-memory/storage.ts +0 -534
- package/src/agent-tools/tools/visual-memory/types.ts +0 -100
- package/src/agent-tools/tools/web-fetch-utils.ts +0 -202
- package/src/agent-tools/tools/web-fetch.ts +0 -464
- package/src/agent-tools/tools/web-search.ts +0 -480
- package/src/agent-tools/tools/web-shared.ts +0 -232
- package/src/agent-tools/tools/write.ts +0 -68
- package/src/agent-tools/types.ts +0 -214
- package/src/agenticmail/index.ts +0 -34
- package/src/agenticmail/manager.ts +0 -253
- package/src/agenticmail/providers/google.ts +0 -391
- package/src/agenticmail/providers/imap.ts +0 -454
- package/src/agenticmail/providers/index.ts +0 -28
- package/src/agenticmail/providers/microsoft.ts +0 -260
- package/src/agenticmail/types.ts +0 -173
- package/src/auth/routes.ts +0 -1589
- package/src/browser/bridge-auth-registry.ts +0 -34
- package/src/browser/bridge-server.ts +0 -93
- package/src/browser/cdp.helpers.ts +0 -180
- package/src/browser/cdp.ts +0 -466
- package/src/browser/chrome.executables.ts +0 -625
- package/src/browser/chrome.profile-decoration.ts +0 -198
- package/src/browser/chrome.ts +0 -349
- package/src/browser/client-actions-core.ts +0 -259
- package/src/browser/client-actions-observe.ts +0 -184
- package/src/browser/client-actions-state.ts +0 -284
- package/src/browser/client-actions-types.ts +0 -16
- package/src/browser/client-actions-url.ts +0 -11
- package/src/browser/client-actions.ts +0 -4
- package/src/browser/client-fetch.ts +0 -253
- package/src/browser/client.ts +0 -337
- package/src/browser/config.ts +0 -301
- package/src/browser/constants.ts +0 -8
- package/src/browser/control-auth.ts +0 -94
- package/src/browser/control-service.ts +0 -81
- package/src/browser/csrf.ts +0 -87
- package/src/browser/enterprise-compat.ts +0 -562
- package/src/browser/extension-relay.ts +0 -834
- package/src/browser/http-auth.ts +0 -63
- package/src/browser/navigation-guard.ts +0 -50
- package/src/browser/paths.ts +0 -49
- package/src/browser/playwright.d.ts +0 -12
- package/src/browser/profiles-service.ts +0 -187
- package/src/browser/profiles.ts +0 -114
- package/src/browser/proxy-files.ts +0 -41
- package/src/browser/pw-ai-module.ts +0 -52
- package/src/browser/pw-ai-state.ts +0 -9
- package/src/browser/pw-ai.ts +0 -65
- package/src/browser/pw-role-snapshot.ts +0 -434
- package/src/browser/pw-session.ts +0 -810
- package/src/browser/pw-tools-core.activity.ts +0 -68
- package/src/browser/pw-tools-core.downloads.ts +0 -281
- package/src/browser/pw-tools-core.interactions.ts +0 -646
- package/src/browser/pw-tools-core.responses.ts +0 -124
- package/src/browser/pw-tools-core.shared.ts +0 -70
- package/src/browser/pw-tools-core.snapshot.ts +0 -213
- package/src/browser/pw-tools-core.state.ts +0 -209
- package/src/browser/pw-tools-core.storage.ts +0 -128
- package/src/browser/pw-tools-core.trace.ts +0 -37
- package/src/browser/pw-tools-core.ts +0 -8
- package/src/browser/resolved-config-refresh.ts +0 -59
- package/src/browser/routes/agent.act.shared.ts +0 -52
- package/src/browser/routes/agent.act.ts +0 -575
- package/src/browser/routes/agent.debug.ts +0 -149
- package/src/browser/routes/agent.shared.ts +0 -143
- package/src/browser/routes/agent.snapshot.ts +0 -333
- package/src/browser/routes/agent.storage.ts +0 -451
- package/src/browser/routes/agent.ts +0 -13
- package/src/browser/routes/basic.ts +0 -202
- package/src/browser/routes/dispatcher.ts +0 -126
- package/src/browser/routes/index.ts +0 -11
- package/src/browser/routes/path-output.ts +0 -1
- package/src/browser/routes/tabs.ts +0 -217
- package/src/browser/routes/types.ts +0 -26
- package/src/browser/routes/utils.ts +0 -73
- package/src/browser/screenshot.ts +0 -54
- package/src/browser/server-context.ts +0 -688
- package/src/browser/server-context.types.ts +0 -65
- package/src/browser/server-lifecycle.ts +0 -48
- package/src/browser/server-middleware.ts +0 -37
- package/src/browser/server.ts +0 -110
- package/src/browser/target-id.ts +0 -30
- package/src/browser/trash.ts +0 -21
- package/src/cli-agent.ts +0 -2452
- package/src/cli-reset-password.ts +0 -138
- package/src/cli-serve.ts +0 -314
- package/src/cli.ts +0 -103
- package/src/dashboard/app.js +0 -579
- package/src/dashboard/assets/brand-logos.js +0 -350
- package/src/dashboard/assets/icons/emoji-icons.js +0 -893
- package/src/dashboard/assets/logo.png +0 -0
- package/src/dashboard/assets/provider-logos.js +0 -139
- package/src/dashboard/components/error-boundary.js +0 -21
- package/src/dashboard/components/help-button.js +0 -65
- package/src/dashboard/components/icons.js +0 -64
- package/src/dashboard/components/knowledge-link.js +0 -79
- package/src/dashboard/components/modal.js +0 -125
- package/src/dashboard/components/org-switcher.js +0 -156
- package/src/dashboard/components/persona-fields.js +0 -460
- package/src/dashboard/components/settings-help.js +0 -193
- package/src/dashboard/components/tag-input.js +0 -96
- package/src/dashboard/components/timezones.js +0 -352
- package/src/dashboard/components/transport-encryption.js +0 -288
- package/src/dashboard/components/utils.js +0 -205
- package/src/dashboard/data/countries.js +0 -255
- package/src/dashboard/docs/activity.html +0 -253
- package/src/dashboard/docs/agent-activity.html +0 -199
- package/src/dashboard/docs/agent-autonomy.html +0 -161
- package/src/dashboard/docs/agent-budget.html +0 -190
- package/src/dashboard/docs/agent-channels.html +0 -189
- package/src/dashboard/docs/agent-communication.html +0 -171
- package/src/dashboard/docs/agent-configuration.html +0 -194
- package/src/dashboard/docs/agent-deployment.html +0 -323
- package/src/dashboard/docs/agent-email.html +0 -184
- package/src/dashboard/docs/agent-guardrails.html +0 -206
- package/src/dashboard/docs/agent-manager.html +0 -226
- package/src/dashboard/docs/agent-memory.html +0 -215
- package/src/dashboard/docs/agent-overview.html +0 -226
- package/src/dashboard/docs/agent-permissions.html +0 -305
- package/src/dashboard/docs/agent-personal.html +0 -155
- package/src/dashboard/docs/agent-security.html +0 -188
- package/src/dashboard/docs/agent-skills.html +0 -224
- package/src/dashboard/docs/agent-tool-security.html +0 -205
- package/src/dashboard/docs/agent-tools.html +0 -238
- package/src/dashboard/docs/agent-whatsapp.html +0 -210
- package/src/dashboard/docs/agent-workforce.html +0 -199
- package/src/dashboard/docs/agents.html +0 -258
- package/src/dashboard/docs/approvals.html +0 -200
- package/src/dashboard/docs/audit.html +0 -206
- package/src/dashboard/docs/browser-providers.html +0 -313
- package/src/dashboard/docs/cluster.html +0 -285
- package/src/dashboard/docs/community-skills.html +0 -253
- package/src/dashboard/docs/compliance.html +0 -221
- package/src/dashboard/docs/dashboard.html +0 -84
- package/src/dashboard/docs/database-access.html +0 -322
- package/src/dashboard/docs/dlp.html +0 -268
- package/src/dashboard/docs/docs-style.css +0 -26
- package/src/dashboard/docs/domain-status.html +0 -294
- package/src/dashboard/docs/guardrails.html +0 -265
- package/src/dashboard/docs/journal.html +0 -197
- package/src/dashboard/docs/knowledge-contributions.html +0 -286
- package/src/dashboard/docs/knowledge.html +0 -268
- package/src/dashboard/docs/memory-transfer.html +0 -311
- package/src/dashboard/docs/messages.html +0 -217
- package/src/dashboard/docs/multi-tenant.html +0 -311
- package/src/dashboard/docs/org-chart.html +0 -239
- package/src/dashboard/docs/organizations.html +0 -182
- package/src/dashboard/docs/roles.html +0 -195
- package/src/dashboard/docs/settings-network.html +0 -321
- package/src/dashboard/docs/settings-security.html +0 -347
- package/src/dashboard/docs/settings-tool-security.html +0 -176
- package/src/dashboard/docs/settings.html +0 -280
- package/src/dashboard/docs/skill-connections.html +0 -270
- package/src/dashboard/docs/skills.html +0 -206
- package/src/dashboard/docs/task-pipeline.html +0 -261
- package/src/dashboard/docs/transport-encryption.html +0 -359
- package/src/dashboard/docs/users.html +0 -225
- package/src/dashboard/docs/vault.html +0 -260
- package/src/dashboard/docs/workforce.html +0 -245
- package/src/dashboard/index.html +0 -444
- package/src/dashboard/pages/activity.js +0 -379
- package/src/dashboard/pages/agent-detail/activity.js +0 -277
- package/src/dashboard/pages/agent-detail/autonomy.js +0 -244
- package/src/dashboard/pages/agent-detail/budget.js +0 -269
- package/src/dashboard/pages/agent-detail/channels.js +0 -494
- package/src/dashboard/pages/agent-detail/communication.js +0 -296
- package/src/dashboard/pages/agent-detail/configuration.js +0 -882
- package/src/dashboard/pages/agent-detail/deployment.js +0 -958
- package/src/dashboard/pages/agent-detail/email.js +0 -674
- package/src/dashboard/pages/agent-detail/guardrails.js +0 -521
- package/src/dashboard/pages/agent-detail/index.js +0 -261
- package/src/dashboard/pages/agent-detail/manager.js +0 -357
- package/src/dashboard/pages/agent-detail/meeting-browser.js +0 -933
- package/src/dashboard/pages/agent-detail/memory.js +0 -368
- package/src/dashboard/pages/agent-detail/overview.js +0 -844
- package/src/dashboard/pages/agent-detail/permissions.js +0 -1163
- package/src/dashboard/pages/agent-detail/personal-details.js +0 -404
- package/src/dashboard/pages/agent-detail/security.js +0 -409
- package/src/dashboard/pages/agent-detail/shared.js +0 -85
- package/src/dashboard/pages/agent-detail/skills-section.js +0 -183
- package/src/dashboard/pages/agent-detail/tool-security.js +0 -380
- package/src/dashboard/pages/agent-detail/tools.js +0 -322
- package/src/dashboard/pages/agent-detail/whatsapp.js +0 -824
- package/src/dashboard/pages/agent-detail/workforce.js +0 -683
- package/src/dashboard/pages/agents.js +0 -1242
- package/src/dashboard/pages/approvals.js +0 -100
- package/src/dashboard/pages/audit.js +0 -198
- package/src/dashboard/pages/cluster.js +0 -512
- package/src/dashboard/pages/community-skills.js +0 -1219
- package/src/dashboard/pages/compliance.js +0 -475
- package/src/dashboard/pages/dashboard.js +0 -180
- package/src/dashboard/pages/database-access.js +0 -812
- package/src/dashboard/pages/dlp.js +0 -293
- package/src/dashboard/pages/domain-status.js +0 -951
- package/src/dashboard/pages/guardrails.js +0 -1035
- package/src/dashboard/pages/journal.js +0 -172
- package/src/dashboard/pages/knowledge-contributions.js +0 -1682
- package/src/dashboard/pages/knowledge-import.js +0 -455
- package/src/dashboard/pages/knowledge.js +0 -582
- package/src/dashboard/pages/login.js +0 -1056
- package/src/dashboard/pages/memory-transfer.js +0 -631
- package/src/dashboard/pages/messages.js +0 -303
- package/src/dashboard/pages/org-chart.js +0 -349
- package/src/dashboard/pages/organizations.js +0 -1081
- package/src/dashboard/pages/roles.js +0 -780
- package/src/dashboard/pages/settings.js +0 -3790
- package/src/dashboard/pages/skill-connections.js +0 -982
- package/src/dashboard/pages/skills.js +0 -879
- package/src/dashboard/pages/task-pipeline.js +0 -684
- package/src/dashboard/pages/users.js +0 -867
- package/src/dashboard/pages/vault.js +0 -791
- package/src/dashboard/pages/workforce.js +0 -851
- package/src/dashboard/vendor/react-dom.development.js +0 -29924
- package/src/dashboard/vendor/react-dom.production.min.js +0 -267
- package/src/dashboard/vendor/react.development.js +0 -3343
- package/src/dashboard/vendor/react.production.min.js +0 -31
- package/src/database-access/agent-tools.ts +0 -193
- package/src/database-access/connection-manager.ts +0 -1341
- package/src/database-access/index.ts +0 -21
- package/src/database-access/query-sanitizer.ts +0 -220
- package/src/database-access/routes.ts +0 -226
- package/src/database-access/types.ts +0 -226
- package/src/db/adapter.ts +0 -510
- package/src/db/dynamodb.ts +0 -454
- package/src/db/factory.ts +0 -129
- package/src/db/mongodb.ts +0 -360
- package/src/db/mysql.ts +0 -531
- package/src/db/postgres.ts +0 -863
- package/src/db/proxy.ts +0 -39
- package/src/db/resolve-driver.ts +0 -29
- package/src/db/sql-schema.ts +0 -124
- package/src/db/sqlite.ts +0 -493
- package/src/db/turso.ts +0 -470
- package/src/deploy/fly.ts +0 -368
- package/src/deploy/managed.ts +0 -235
- package/src/domain-lock/cli-recover.ts +0 -591
- package/src/domain-lock/cli-verify.ts +0 -190
- package/src/domain-lock/index.ts +0 -220
- package/src/engine/activity-routes.ts +0 -154
- package/src/engine/activity.ts +0 -568
- package/src/engine/agent-autonomy.ts +0 -974
- package/src/engine/agent-config.ts +0 -646
- package/src/engine/agent-heartbeat.ts +0 -720
- package/src/engine/agent-hierarchy.ts +0 -1064
- package/src/engine/agent-memory.ts +0 -806
- package/src/engine/agent-notify.ts +0 -50
- package/src/engine/agent-routes.ts +0 -2583
- package/src/engine/agent-status.ts +0 -311
- package/src/engine/ambient-memory.ts +0 -401
- package/src/engine/approvals.ts +0 -615
- package/src/engine/assets/thinking-hum.mp3 +0 -0
- package/src/engine/catalog-routes.ts +0 -232
- package/src/engine/chat-poller.ts +0 -913
- package/src/engine/chat-webhook-routes.ts +0 -304
- package/src/engine/cli-build-skill.ts +0 -285
- package/src/engine/cli-submit-skill.ts +0 -200
- package/src/engine/cli-validate.ts +0 -188
- package/src/engine/cluster.ts +0 -278
- package/src/engine/communication-routes.ts +0 -139
- package/src/engine/communication.ts +0 -765
- package/src/engine/community-registry.ts +0 -1529
- package/src/engine/community-routes.ts +0 -260
- package/src/engine/compliance-routes.ts +0 -133
- package/src/engine/compliance.ts +0 -1679
- package/src/engine/config-bus.ts +0 -103
- package/src/engine/db-adapter.ts +0 -1156
- package/src/engine/db-schema.ts +0 -1945
- package/src/engine/deploy-schema-routes.ts +0 -176
- package/src/engine/deployer.ts +0 -957
- package/src/engine/dlp-routes.ts +0 -101
- package/src/engine/dlp.ts +0 -410
- package/src/engine/email-poller.ts +0 -855
- package/src/engine/emoji.ts +0 -106
- package/src/engine/guardrail-routes.ts +0 -125
- package/src/engine/guardrails.ts +0 -465
- package/src/engine/index.ts +0 -255
- package/src/engine/journal-routes.ts +0 -56
- package/src/engine/journal.ts +0 -249
- package/src/engine/knowledge-contribution-routes.ts +0 -633
- package/src/engine/knowledge-contribution.ts +0 -1386
- package/src/engine/knowledge-import/chunker.ts +0 -241
- package/src/engine/knowledge-import/import-manager.ts +0 -416
- package/src/engine/knowledge-import/index.ts +0 -27
- package/src/engine/knowledge-import/processors/clean.ts +0 -149
- package/src/engine/knowledge-import/processors/extract-gdrive.ts +0 -102
- package/src/engine/knowledge-import/processors/extract-github.ts +0 -74
- package/src/engine/knowledge-import/processors/extract-sharepoint.ts +0 -69
- package/src/engine/knowledge-import/processors/extract-web.ts +0 -275
- package/src/engine/knowledge-import/processors/index.ts +0 -18
- package/src/engine/knowledge-import/processors/pipeline.ts +0 -171
- package/src/engine/knowledge-import/processors/types.ts +0 -78
- package/src/engine/knowledge-import/processors/validate.ts +0 -150
- package/src/engine/knowledge-import/provider-file-upload.ts +0 -95
- package/src/engine/knowledge-import/provider-github.ts +0 -144
- package/src/engine/knowledge-import/provider-google-sites.ts +0 -323
- package/src/engine/knowledge-import/provider-sharepoint.ts +0 -276
- package/src/engine/knowledge-import/provider-url.ts +0 -218
- package/src/engine/knowledge-import/routes.ts +0 -94
- package/src/engine/knowledge-import/types.ts +0 -92
- package/src/engine/knowledge-routes.ts +0 -231
- package/src/engine/knowledge.ts +0 -587
- package/src/engine/lifecycle.ts +0 -1420
- package/src/engine/mcp-process-manager.ts +0 -573
- package/src/engine/meeting-monitor.ts +0 -483
- package/src/engine/meeting-voice-intelligence.ts +0 -340
- package/src/engine/memory-routes.ts +0 -142
- package/src/engine/memory-transfer-routes.ts +0 -339
- package/src/engine/messaging-history.ts +0 -177
- package/src/engine/messaging-poller.ts +0 -786
- package/src/engine/model-fallback.ts +0 -141
- package/src/engine/oauth-connect-routes.ts +0 -603
- package/src/engine/oauth-connect.ts +0 -304
- package/src/engine/onboarding-routes.ts +0 -148
- package/src/engine/onboarding.ts +0 -574
- package/src/engine/org-approval-routes.ts +0 -146
- package/src/engine/org-integration-routes.ts +0 -399
- package/src/engine/org-integrations.ts +0 -608
- package/src/engine/org-policies.ts +0 -502
- package/src/engine/policy-import-routes.ts +0 -125
- package/src/engine/policy-import.ts +0 -1186
- package/src/engine/policy-routes.ts +0 -163
- package/src/engine/routes.ts +0 -1236
- package/src/engine/screen-unlock.ts +0 -136
- package/src/engine/session-router.ts +0 -212
- package/src/engine/skill-updater-routes.ts +0 -132
- package/src/engine/skill-updater.ts +0 -480
- package/src/engine/skill-validator.ts +0 -331
- package/src/engine/skills/agent-management.ts +0 -119
- package/src/engine/skills/agent-memory.ts +0 -19
- package/src/engine/skills/agenticmail.ts +0 -116
- package/src/engine/skills/core-tools.ts +0 -25
- package/src/engine/skills/database-access.ts +0 -78
- package/src/engine/skills/enterprise-code-sandbox.ts +0 -113
- package/src/engine/skills/enterprise-database.ts +0 -123
- package/src/engine/skills/enterprise-diff.ts +0 -95
- package/src/engine/skills/enterprise-documents.ts +0 -162
- package/src/engine/skills/enterprise-http.ts +0 -99
- package/src/engine/skills/enterprise-security-scan.ts +0 -125
- package/src/engine/skills/enterprise-spreadsheet.ts +0 -171
- package/src/engine/skills/gws-admin.ts +0 -18
- package/src/engine/skills/gws-calendar.ts +0 -21
- package/src/engine/skills/gws-chat.ts +0 -29
- package/src/engine/skills/gws-contacts.ts +0 -20
- package/src/engine/skills/gws-docs.ts +0 -18
- package/src/engine/skills/gws-drive.ts +0 -23
- package/src/engine/skills/gws-forms.ts +0 -23
- package/src/engine/skills/gws-gmail.ts +0 -30
- package/src/engine/skills/gws-groups.ts +0 -17
- package/src/engine/skills/gws-keep.ts +0 -17
- package/src/engine/skills/gws-maps.ts +0 -25
- package/src/engine/skills/gws-meet.ts +0 -23
- package/src/engine/skills/gws-sheets.ts +0 -22
- package/src/engine/skills/gws-sites.ts +0 -16
- package/src/engine/skills/gws-slides.ts +0 -27
- package/src/engine/skills/gws-tasks.ts +0 -22
- package/src/engine/skills/gws-vault.ts +0 -17
- package/src/engine/skills/index.ts +0 -159
- package/src/engine/skills/knowledge-search.ts +0 -18
- package/src/engine/skills/local-system.ts +0 -61
- package/src/engine/skills/m365-admin.ts +0 -18
- package/src/engine/skills/m365-bookings.ts +0 -17
- package/src/engine/skills/m365-copilot.ts +0 -17
- package/src/engine/skills/m365-excel.ts +0 -60
- package/src/engine/skills/m365-forms.ts +0 -17
- package/src/engine/skills/m365-onedrive.ts +0 -60
- package/src/engine/skills/m365-onenote.ts +0 -17
- package/src/engine/skills/m365-outlook.ts +0 -27
- package/src/engine/skills/m365-planner.ts +0 -18
- package/src/engine/skills/m365-power-automate.ts +0 -18
- package/src/engine/skills/m365-power-bi.ts +0 -19
- package/src/engine/skills/m365-powerpoint.ts +0 -33
- package/src/engine/skills/m365-sharepoint.ts +0 -20
- package/src/engine/skills/m365-teams.ts +0 -21
- package/src/engine/skills/m365-todo.ts +0 -17
- package/src/engine/skills/m365-whiteboard.ts +0 -16
- package/src/engine/skills/m365-word.ts +0 -42
- package/src/engine/skills/mcp-bridge.ts +0 -45
- package/src/engine/skills/meeting-lifecycle.ts +0 -20
- package/src/engine/skills/messaging.ts +0 -46
- package/src/engine/skills/visual-memory.ts +0 -25
- package/src/engine/skills.ts +0 -688
- package/src/engine/soul-library.ts +0 -142
- package/src/engine/soul-templates.json +0 -1525
- package/src/engine/storage-manager.ts +0 -252
- package/src/engine/storage-routes.ts +0 -113
- package/src/engine/storage.ts +0 -528
- package/src/engine/task-poller.ts +0 -394
- package/src/engine/task-queue-after-spawn.ts +0 -66
- package/src/engine/task-queue-before-spawn.ts +0 -113
- package/src/engine/task-queue-routes.ts +0 -161
- package/src/engine/task-queue.ts +0 -664
- package/src/engine/tenant.ts +0 -409
- package/src/engine/tool-catalog.ts +0 -354
- package/src/engine/vault-routes.ts +0 -134
- package/src/engine/vault.ts +0 -601
- package/src/engine/workforce-routes.ts +0 -331
- package/src/engine/workforce.ts +0 -1161
- package/src/index.ts +0 -77
- package/src/lib/cidr.ts +0 -122
- package/src/lib/config-store.ts +0 -86
- package/src/lib/resilience.ts +0 -326
- package/src/lib/text-search.ts +0 -358
- package/src/mcp/adapters/activecampaign.adapter.ts +0 -391
- package/src/mcp/adapters/adobe-sign.adapter.ts +0 -469
- package/src/mcp/adapters/adp.adapter.ts +0 -358
- package/src/mcp/adapters/airtable.adapter.ts +0 -273
- package/src/mcp/adapters/apollo.adapter.ts +0 -420
- package/src/mcp/adapters/asana.adapter.ts +0 -315
- package/src/mcp/adapters/auth0.adapter.ts +0 -386
- package/src/mcp/adapters/aws.adapter.ts +0 -345
- package/src/mcp/adapters/azure-devops.adapter.ts +0 -389
- package/src/mcp/adapters/bamboohr.adapter.ts +0 -376
- package/src/mcp/adapters/basecamp.adapter.ts +0 -366
- package/src/mcp/adapters/bigcommerce.adapter.ts +0 -429
- package/src/mcp/adapters/bitbucket.adapter.ts +0 -260
- package/src/mcp/adapters/box.adapter.ts +0 -350
- package/src/mcp/adapters/brex.adapter.ts +0 -367
- package/src/mcp/adapters/buffer.adapter.ts +0 -303
- package/src/mcp/adapters/calendly.adapter.ts +0 -262
- package/src/mcp/adapters/canva.adapter.ts +0 -256
- package/src/mcp/adapters/chargebee.adapter.ts +0 -448
- package/src/mcp/adapters/circleci.adapter.ts +0 -216
- package/src/mcp/adapters/clickup.adapter.ts +0 -335
- package/src/mcp/adapters/close.adapter.ts +0 -390
- package/src/mcp/adapters/cloudflare.adapter.ts +0 -378
- package/src/mcp/adapters/confluence.adapter.ts +0 -301
- package/src/mcp/adapters/contentful.adapter.ts +0 -355
- package/src/mcp/adapters/copper.adapter.ts +0 -468
- package/src/mcp/adapters/crisp.adapter.ts +0 -415
- package/src/mcp/adapters/crowdstrike.adapter.ts +0 -413
- package/src/mcp/adapters/datadog.adapter.ts +0 -373
- package/src/mcp/adapters/digitalocean.adapter.ts +0 -336
- package/src/mcp/adapters/discord.adapter.ts +0 -248
- package/src/mcp/adapters/docker.adapter.ts +0 -238
- package/src/mcp/adapters/docusign.adapter.ts +0 -431
- package/src/mcp/adapters/drift.adapter.ts +0 -386
- package/src/mcp/adapters/dropbox.adapter.ts +0 -315
- package/src/mcp/adapters/figma.adapter.ts +0 -302
- package/src/mcp/adapters/firebase.adapter.ts +0 -446
- package/src/mcp/adapters/flyio.adapter.ts +0 -302
- package/src/mcp/adapters/freshbooks.adapter.ts +0 -474
- package/src/mcp/adapters/freshdesk.adapter.ts +0 -441
- package/src/mcp/adapters/freshsales.adapter.ts +0 -457
- package/src/mcp/adapters/freshservice.adapter.ts +0 -481
- package/src/mcp/adapters/front.adapter.ts +0 -357
- package/src/mcp/adapters/github-actions.adapter.ts +0 -329
- package/src/mcp/adapters/github.adapter.ts +0 -387
- package/src/mcp/adapters/gitlab.adapter.ts +0 -368
- package/src/mcp/adapters/gong.adapter.ts +0 -386
- package/src/mcp/adapters/google-ads.adapter.ts +0 -363
- package/src/mcp/adapters/google-analytics.adapter.ts +0 -316
- package/src/mcp/adapters/google-cloud.adapter.ts +0 -312
- package/src/mcp/adapters/gotomeeting.adapter.ts +0 -255
- package/src/mcp/adapters/grafana.adapter.ts +0 -361
- package/src/mcp/adapters/greenhouse.adapter.ts +0 -354
- package/src/mcp/adapters/gusto.adapter.ts +0 -329
- package/src/mcp/adapters/hashicorp-vault.adapter.ts +0 -355
- package/src/mcp/adapters/heroku.adapter.ts +0 -291
- package/src/mcp/adapters/hibob.adapter.ts +0 -334
- package/src/mcp/adapters/hootsuite.adapter.ts +0 -322
- package/src/mcp/adapters/hubspot.adapter.ts +0 -400
- package/src/mcp/adapters/huggingface.adapter.ts +0 -349
- package/src/mcp/adapters/index.ts +0 -524
- package/src/mcp/adapters/intercom.adapter.ts +0 -269
- package/src/mcp/adapters/jira.adapter.ts +0 -482
- package/src/mcp/adapters/klaviyo.adapter.ts +0 -353
- package/src/mcp/adapters/kubernetes.adapter.ts +0 -431
- package/src/mcp/adapters/lattice.adapter.ts +0 -339
- package/src/mcp/adapters/launchdarkly.adapter.ts +0 -368
- package/src/mcp/adapters/lever.adapter.ts +0 -347
- package/src/mcp/adapters/linear.adapter.ts +0 -300
- package/src/mcp/adapters/linkedin.adapter.ts +0 -331
- package/src/mcp/adapters/livechat.adapter.ts +0 -259
- package/src/mcp/adapters/loom.adapter.ts +0 -230
- package/src/mcp/adapters/mailchimp.adapter.ts +0 -394
- package/src/mcp/adapters/mailgun.adapter.ts +0 -425
- package/src/mcp/adapters/miro.adapter.ts +0 -274
- package/src/mcp/adapters/mixpanel.adapter.ts +0 -324
- package/src/mcp/adapters/monday.adapter.ts +0 -308
- package/src/mcp/adapters/mongodb-atlas.adapter.ts +0 -345
- package/src/mcp/adapters/neon.adapter.ts +0 -312
- package/src/mcp/adapters/netlify.adapter.ts +0 -324
- package/src/mcp/adapters/netsuite.adapter.ts +0 -411
- package/src/mcp/adapters/newrelic.adapter.ts +0 -339
- package/src/mcp/adapters/notion.adapter.ts +0 -338
- package/src/mcp/adapters/okta.adapter.ts +0 -394
- package/src/mcp/adapters/openai.adapter.ts +0 -315
- package/src/mcp/adapters/opsgenie.adapter.ts +0 -375
- package/src/mcp/adapters/outreach.adapter.ts +0 -372
- package/src/mcp/adapters/paddle.adapter.ts +0 -467
- package/src/mcp/adapters/pagerduty.adapter.ts +0 -412
- package/src/mcp/adapters/pandadoc.adapter.ts +0 -389
- package/src/mcp/adapters/paypal.adapter.ts +0 -465
- package/src/mcp/adapters/personio.adapter.ts +0 -401
- package/src/mcp/adapters/pinecone.adapter.ts +0 -340
- package/src/mcp/adapters/pipedrive.adapter.ts +0 -324
- package/src/mcp/adapters/plaid.adapter.ts +0 -444
- package/src/mcp/adapters/postmark.adapter.ts +0 -387
- package/src/mcp/adapters/power-automate.adapter.ts +0 -388
- package/src/mcp/adapters/quickbooks.adapter.ts +0 -431
- package/src/mcp/adapters/recurly.adapter.ts +0 -433
- package/src/mcp/adapters/reddit.adapter.ts +0 -371
- package/src/mcp/adapters/render.adapter.ts +0 -332
- package/src/mcp/adapters/ringcentral.adapter.ts +0 -281
- package/src/mcp/adapters/rippling.adapter.ts +0 -287
- package/src/mcp/adapters/salesforce.adapter.ts +0 -321
- package/src/mcp/adapters/salesloft.adapter.ts +0 -413
- package/src/mcp/adapters/sanity.adapter.ts +0 -363
- package/src/mcp/adapters/sap.adapter.ts +0 -483
- package/src/mcp/adapters/segment.adapter.ts +0 -260
- package/src/mcp/adapters/sendgrid.adapter.ts +0 -265
- package/src/mcp/adapters/sentry.adapter.ts +0 -331
- package/src/mcp/adapters/servicenow.adapter.ts +0 -468
- package/src/mcp/adapters/shopify.adapter.ts +0 -451
- package/src/mcp/adapters/shortcut.adapter.ts +0 -290
- package/src/mcp/adapters/slack.adapter.ts +0 -380
- package/src/mcp/adapters/smartsheet.adapter.ts +0 -326
- package/src/mcp/adapters/snowflake.adapter.ts +0 -347
- package/src/mcp/adapters/snyk.adapter.ts +0 -394
- package/src/mcp/adapters/splunk.adapter.ts +0 -403
- package/src/mcp/adapters/square.adapter.ts +0 -467
- package/src/mcp/adapters/statuspage.adapter.ts +0 -401
- package/src/mcp/adapters/stripe.adapter.ts +0 -380
- package/src/mcp/adapters/supabase.adapter.ts +0 -334
- package/src/mcp/adapters/teamwork.adapter.ts +0 -404
- package/src/mcp/adapters/telegram.adapter.ts +0 -299
- package/src/mcp/adapters/terraform.adapter.ts +0 -300
- package/src/mcp/adapters/todoist.adapter.ts +0 -239
- package/src/mcp/adapters/trello.adapter.ts +0 -316
- package/src/mcp/adapters/twilio.adapter.ts +0 -233
- package/src/mcp/adapters/twitter.adapter.ts +0 -348
- package/src/mcp/adapters/vercel.adapter.ts +0 -219
- package/src/mcp/adapters/weaviate.adapter.ts +0 -371
- package/src/mcp/adapters/webex.adapter.ts +0 -237
- package/src/mcp/adapters/webflow.adapter.ts +0 -287
- package/src/mcp/adapters/whatsapp.adapter.ts +0 -273
- package/src/mcp/adapters/whereby.adapter.ts +0 -240
- package/src/mcp/adapters/woocommerce.adapter.ts +0 -454
- package/src/mcp/adapters/wordpress.adapter.ts +0 -455
- package/src/mcp/adapters/workday.adapter.ts +0 -354
- package/src/mcp/adapters/wrike.adapter.ts +0 -349
- package/src/mcp/adapters/xero.adapter.ts +0 -472
- package/src/mcp/adapters/youtube.adapter.ts +0 -401
- package/src/mcp/adapters/zendesk.adapter.ts +0 -399
- package/src/mcp/adapters/zoho-crm.adapter.ts +0 -410
- package/src/mcp/adapters/zoom.adapter.ts +0 -241
- package/src/mcp/adapters/zuora.adapter.ts +0 -476
- package/src/mcp/framework/api-executor.ts +0 -192
- package/src/mcp/framework/aws-sigv4.ts +0 -216
- package/src/mcp/framework/credential-resolver.ts +0 -128
- package/src/mcp/framework/oauth-token-manager.ts +0 -22
- package/src/mcp/framework/skill-mcp-framework.ts +0 -226
- package/src/mcp/framework/types.ts +0 -130
- package/src/mcp/index.ts +0 -124
- package/src/mcp/integration-catalog.ts +0 -178
- package/src/middleware/dns-rebinding.ts +0 -44
- package/src/middleware/egress-filter.ts +0 -104
- package/src/middleware/firewall.ts +0 -192
- package/src/middleware/geo-ip.ts +0 -156
- package/src/middleware/index.ts +0 -390
- package/src/middleware/network-config.ts +0 -90
- package/src/middleware/proxy-config.ts +0 -71
- package/src/middleware/request-limits.ts +0 -59
- package/src/middleware/transport-encryption.ts +0 -398
- package/src/registry/cli.ts +0 -63
- package/src/registry/server.ts +0 -504
- package/src/runtime/agent-loop.ts +0 -779
- package/src/runtime/compaction.ts +0 -638
- package/src/runtime/email-channel.ts +0 -120
- package/src/runtime/environment.ts +0 -300
- package/src/runtime/followup.ts +0 -211
- package/src/runtime/gateway.ts +0 -260
- package/src/runtime/hooks.ts +0 -564
- package/src/runtime/index.ts +0 -1110
- package/src/runtime/llm-client.ts +0 -1056
- package/src/runtime/model-router.ts +0 -97
- package/src/runtime/providers.ts +0 -228
- package/src/runtime/session-manager.ts +0 -345
- package/src/runtime/subagent.ts +0 -153
- package/src/runtime/tool-executor.ts +0 -208
- package/src/runtime/types.ts +0 -255
- package/src/security/brute-force.ts +0 -423
- package/src/security/config.ts +0 -159
- package/src/security/csp.ts +0 -407
- package/src/security/external-content.ts +0 -299
- package/src/security/index.ts +0 -557
- package/src/security/input-sanitizer.ts +0 -452
- package/src/security/output-filter.ts +0 -575
- package/src/security/port-scanner.ts +0 -342
- package/src/security/prompt-guard.ts +0 -387
- package/src/security/sql-guard.ts +0 -338
- package/src/security/threat-logger.ts +0 -484
- package/src/server.ts +0 -828
- package/src/setup/company.ts +0 -183
- package/src/setup/database.ts +0 -153
- package/src/setup/deployment.ts +0 -561
- package/src/setup/domain.ts +0 -112
- package/src/setup/index.ts +0 -171
- package/src/setup/provision.ts +0 -532
- package/src/setup/registration.ts +0 -302
- package/src/system-prompts/catchup.ts +0 -48
- package/src/system-prompts/google/calendar.ts +0 -37
- package/src/system-prompts/google/chat.ts +0 -92
- package/src/system-prompts/google/contacts.ts +0 -25
- package/src/system-prompts/google/docs.ts +0 -29
- package/src/system-prompts/google/drive.ts +0 -34
- package/src/system-prompts/google/forms.ts +0 -25
- package/src/system-prompts/google/gmail.ts +0 -50
- package/src/system-prompts/google/index.ts +0 -23
- package/src/system-prompts/google/maps.ts +0 -20
- package/src/system-prompts/google/meet.ts +0 -130
- package/src/system-prompts/google/sheets.ts +0 -32
- package/src/system-prompts/google/slides.ts +0 -26
- package/src/system-prompts/google/tasks.ts +0 -27
- package/src/system-prompts/index.ts +0 -88
- package/src/system-prompts/microsoft/contacts.ts +0 -34
- package/src/system-prompts/microsoft/excel.ts +0 -52
- package/src/system-prompts/microsoft/index.ts +0 -31
- package/src/system-prompts/microsoft/onedrive.ts +0 -41
- package/src/system-prompts/microsoft/onenote.ts +0 -36
- package/src/system-prompts/microsoft/outlook-calendar.ts +0 -37
- package/src/system-prompts/microsoft/outlook-mail.ts +0 -46
- package/src/system-prompts/microsoft/planner.ts +0 -37
- package/src/system-prompts/microsoft/powerbi.ts +0 -38
- package/src/system-prompts/microsoft/powerpoint.ts +0 -35
- package/src/system-prompts/microsoft/sharepoint.ts +0 -44
- package/src/system-prompts/microsoft/teams.ts +0 -49
- package/src/system-prompts/microsoft/todo.ts +0 -37
- package/src/system-prompts/shared-blocks.ts +0 -87
- package/src/system-prompts/task.ts +0 -21
- package/src/system-prompts/triage.ts +0 -34
- package/src/types/hono-env.ts +0 -18
- package/src/types/optional-deps.d.ts +0 -10
- /package/{src → dist}/dashboard/HELP-TOOLTIPS-GUIDE.md +0 -0
|
@@ -1,149 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Layer 2: CLEAN — Deep Content Cleaning & Normalization
|
|
3
|
-
*
|
|
4
|
-
* Source-agnostic. Takes extracted text and applies multiple cleaning passes:
|
|
5
|
-
* Pass 1: Structural — Remove boilerplate patterns, navigation, UI artifacts
|
|
6
|
-
* Pass 2: Content — Normalize formatting, fix encoding, deduplicate content
|
|
7
|
-
* Pass 3: Quality — Remove low-value content, trim noise, normalize whitespace
|
|
8
|
-
*
|
|
9
|
-
* Every pass reports what it removed for auditability.
|
|
10
|
-
*/
|
|
11
|
-
|
|
12
|
-
import type { LayerReport } from './types.js';
|
|
13
|
-
|
|
14
|
-
/**
 * Value returned by {@link cleanContent}: the cleaned text together with the
 * audit report describing what the CLEAN layer did to it.
 */
export interface CleanResult {
  /** Text that remains after all cleaning passes have run. */
  content: string;
  /** Per-layer audit record (sizes, operations performed, duration). */
  report: LayerReport;
}
|
|
18
|
-
|
|
19
|
-
/**
 * Repairs for text that was encoded as UTF-8 but decoded as Windows-1252.
 *
 * The patterns are written as Unicode escapes on purpose: spelling the garbled
 * sequences literally makes them depend on the encoding of this source file,
 * and a single re-encoding silently turns them into no-ops.
 * Must run before quote/dash normalization, because the garbled dash sequences
 * themselves contain U+201C / U+201D.
 */
const MOJIBAKE_REPAIRS: ReadonlyArray<readonly [RegExp, string]> = [
  [/\u00E2\u20AC\u2122/g, "'"], // garbled U+2019 (right single quote)
  [/\u00E2\u20AC\u0153/g, '"'], // garbled U+201C (left double quote)
  [/\u00E2\u20AC\u009D/g, '"'], // garbled U+201D (right double quote)
  [/\u00E2\u20AC\u201D/g, '\u2014'], // garbled U+2014 (em dash)
  [/\u00E2\u20AC\u201C/g, '\u2013'], // garbled U+2013 (en dash)
  [/\u00C2\u00A0/g, ' '], // garbled U+00A0 (no-break space)
  [/\u00C3\u00A9/g, '\u00E9'], // garbled e-acute
  [/\u00C3\u00A8/g, '\u00E8'], // garbled e-grave
  [/\u00C3\u00BC/g, '\u00FC'], // garbled u-umlaut
  [/\u00C3\u00B6/g, '\u00F6'], // garbled o-umlaut
];

/** Pass 1 — strips structural boilerplate: anchors, empty links, breadcrumbs, TOCs, separators, page numbers. */
function applyStructuralPass(text: string): string {
  return text
    // Anchor references such as "(#section-id)"
    .replace(/\(#[a-zA-Z0-9_-]+\)/g, '')
    // Markdown links with an empty target keep only their label
    .replace(/\[([^\]]*)\]\(\s*\)/g, '$1')
    // Markdown links with an empty label are dropped entirely
    .replace(/\[\s*\]\([^)]*\)/g, '')
    // "Skip to main content" / "Skip to navigation" lines
    .replace(/^.*skip\s+to\s+(?:main\s+)?(?:content|navigation|search).*$/gim, '')
    // Breadcrumb trails (Home > Section > Page)
    .replace(/^(?:Home|Main)\s*(?:>|›|»|→)\s*(?:\w[\w\s]*(?:>|›|»|→)\s*)+\w[\w\s]*$/gm, '')
    // Breadcrumbs in the < "Page" < "Section" style
    .replace(/(?:<\s*"[^"]*"\s*)+/g, '')
    // "Table of contents" headings together with their list of links
    .replace(/#{1,3}\s*(?:Table of Contents|Contents|In this (?:article|page|guide))\s*\n(?:\s*[-*]\s*\[.*?\].*\n?)*/gi, '')
    .replace(/^(?:Table of [Cc]ontents|On this page|In this article)\s*$/gm, '')
    // Standalone "- - - -" style separators
    .replace(/^[\s\-–—*=]{4,}$/gm, '')
    // Page numbers ("3", "Page 3", "3 of 10")
    .replace(/^(?:Page\s+)?\d+\s*(?:of\s+\d+)?\s*$/gm, '');
}

/**
 * Pass 2 — normalizes encoding and formatting, then drops repeated paragraphs.
 * Returns the normalized text and how many duplicate paragraphs were removed.
 */
function applyNormalizationPass(text: string): { text: string; dedupedBlocks: number } {
  let out = text;

  for (const [pattern, replacement] of MOJIBAKE_REPAIRS) {
    out = out.replace(pattern, replacement);
  }

  out = out
    // Typographic quotes, dashes and ellipsis become their ASCII forms
    .replace(/[\u2018\u2019\u201A\u201B]/g, "'")
    .replace(/[\u201C\u201D\u201E\u201F]/g, '"')
    .replace(/[\u2013\u2014]/g, '-')
    .replace(/\u2026/g, '...')
    // Any bullet glyph becomes a markdown "- " item
    .replace(/^[\s]*[•●○◦▪▸►▹‣⁃]\s*/gm, '- ')
    // Zero-width characters, BOM and soft hyphen
    .replace(/[\u200B\u200C\u200D\uFEFF\u00AD]/g, '')
    // Excessive emphasis (****text****) collapses to bold
    .replace(/\*{3,}([^*]+)\*{3,}/g, '**$1**')
    // Ensure a space after the heading marker
    .replace(/^(#{1,6})([^ #\n])/gm, '$1 $2')
    // Same heading twice in a row. The trailing `$` keeps the backreference from
    // matching a mere prefix ("# Intro" followed by "# Introduction").
    .replace(/(^#{1,6}\s+.+$)\n+\1$/gm, '$1');

  // Paragraph-level dedupe; compared case- and whitespace-insensitively.
  // Blocks shorter than 10 normalized chars are always kept and never recorded.
  const paragraphs = out.split(/\n{2,}/);
  const seen = new Set<string>();
  const kept: string[] = [];
  for (const paragraph of paragraphs) {
    const key = paragraph.trim().toLowerCase().replace(/\s+/g, ' ');
    if (key.length >= 10) {
      if (seen.has(key)) continue;
      seen.add(key);
    }
    kept.push(paragraph);
  }

  return { text: kept.join('\n\n'), dedupedBlocks: paragraphs.length - kept.length };
}

/**
 * Pass 3 — removes low-value boilerplate (bylines, feedback/share/subscribe
 * prompts, cookie and copyright notices, navigation prompts) and normalizes
 * whitespace.
 *
 * The "rest of the prompt" wildcards are bounded to the current line; letting
 * them cross newlines would delete the real paragraphs that follow a prompt.
 */
function applyQualityPass(text: string): string {
  const stripped = text
    // "Written by ..." bylines
    .replace(/(?:written|authored|published|posted)[ \t]+by[ \t]+[\w \t.]+(?:updated|modified|edited)?[ \t]*[\w \t]*(?:ago)?/gi, '')
    // "Did this answer your question?" style feedback prompts; the `u` flag keeps
    // the emoji class from matching half of a surrogate pair
    .replace(/(?:did\s+this\s+(?:answer\s+your\s+question|help)|was\s+this\s+(?:article\s+)?helpful|rate\s+this\s+article|thumbs\s+up|thumbs\s+down|yes\s+no)[^.\n]*[.?]?[😞😐😃🙁😊👍👎☹️🙂😀 \t]*/giu, '')
    // "Share this article" / social sharing prompts
    .replace(/(?:share\s+(?:this\s+)?(?:article|page|post)|tweet\s+this|share\s+on\s+(?:facebook|twitter|linkedin|x))[^.\n]*[.?]?/gi, '')
    // "Subscribe to newsletter" prompts
    .replace(/(?:subscribe\s+to\s+(?:our|the)?\s*(?:newsletter|updates|blog)|sign\s+up\s+for\s+(?:updates|our))[^.\n]*[.?]?/gi, '')
    // Cookie / privacy notices
    .replace(/(?:we\s+use\s+cookies|cookie\s+(?:policy|preferences|settings)|accept\s+(?:all\s+)?cookies|by\s+continuing\s+to\s+(?:use|browse))[^.\n]*\.?/gi, '')
    // "Copyright © 2024 ..." lines
    .replace(/^.*(?:copyright|©|\(c\))\s*\d{4}.*$/gim, '')
    // "All rights reserved"
    .replace(/all\s+rights?\s+reserved\.?/gi, '')
    // "Last updated/modified on ..."
    .replace(/(?:last\s+)?(?:updated|modified|edited|reviewed)\s+(?:on\s+)?(?:\d{1,2}[-/]\d{1,2}[-/]\d{2,4}|\w+\s+\d{1,2},?\s+\d{4}|\d+\s+\w+\s+ago)/gi, '')
    // "Print this page" / "Download PDF"
    .replace(/(?:print\s+this\s+(?:page|article)|download\s+(?:as\s+)?pdf|export\s+to\s+pdf)/gi, '')
    // URLs alone on a line
    .replace(/^\s*https?:\/\/[^\s]+\s*$/gm, '')
    // Emoji-only lines
    .replace(/^[\s]*(?:[\u{1F600}-\u{1F64F}\u{1F300}-\u{1F5FF}\u{1F680}-\u{1F6FF}\u{1F1E0}-\u{1F1FF}\u{2600}-\u{26FF}\u{2700}-\u{27BF}]+[\s]*)+$/gmu, '')
    // Navigation prompts ("Back to top", "Next article", "Previous page")
    .replace(/^.*(?:back\s+to\s+top|next\s+(?:article|page|step)|previous\s+(?:article|page|step)|go\s+(?:back|to\s+top)).*$/gim, '');

  // Final whitespace normalization: no trailing spaces per line, at most two
  // consecutive blank lines, nothing blank at either end.
  return stripped
    .split('\n')
    .map(line => line.trimEnd())
    .join('\n')
    .replace(/\n{4,}/g, '\n\n\n')
    .trim();
}

/**
 * Layer 2 (CLEAN) entry point: runs the structural, normalization and quality
 * passes over already-extracted text and reports what each pass removed.
 *
 * @param input Extracted text (plain text or markdown).
 * @returns The cleaned text plus a report. Each pass adds an entry to
 *   `report.operations` only when it made the text shorter. Sizes are string
 *   lengths (UTF-16 code units), and `removedBytes` can be negative when
 *   normalization lengthens the text (e.g. an ellipsis character becoming "...").
 */
export function cleanContent(input: string): CleanResult {
  const start = Date.now();
  const operations: string[] = [];
  const inputSize = input.length;

  const afterStructural = applyStructuralPass(input);
  if (afterStructural.length < inputSize) {
    operations.push(`pass1:structural removed ${inputSize - afterStructural.length} chars`);
  }

  const normalized = applyNormalizationPass(afterStructural);
  if (normalized.text.length < afterStructural.length) {
    operations.push(`pass2:normalize removed ${afterStructural.length - normalized.text.length} chars, deduped ${normalized.dedupedBlocks} blocks`);
  }

  const text = applyQualityPass(normalized.text);
  if (text.length < normalized.text.length) {
    operations.push(`pass3:quality removed ${normalized.text.length - text.length} chars`);
  }

  return {
    content: text,
    report: {
      name: 'clean',
      inputSize,
      outputSize: text.length,
      removedBytes: inputSize - text.length,
      operations,
      durationMs: Date.now() - start,
    },
  };
}
|
|
@@ -1,102 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Layer 1: EXTRACT — Google Drive / Google Sites Content Extractor
|
|
3
|
-
*
|
|
4
|
-
* Handles: Google Docs (HTML export), Google Sites pages, Google Slides (text export).
|
|
5
|
-
* Strips: Google-specific wrapper divs, suggested edits, comment markers,
|
|
6
|
-
* revision metadata, Google Sites navigation/chrome.
|
|
7
|
-
*/
|
|
8
|
-
|
|
9
|
-
import type { ContentExtractor, ExtractResult } from './types.js';
|
|
10
|
-
|
|
11
|
-
/**
 * Extractor for content that originates from Google Drive: Google Sites pages,
 * Google Docs HTML exports, and generic text/markdown files.
 *
 * All HTML handling here is regex-based and best-effort; it does not parse the
 * document, so deeply nested or unusual markup may be cut imperfectly.
 */
export class GoogleDriveContentExtractor implements ContentExtractor {
  /**
   * Named/numeric entities decoded by {@link decodeEntities}. Keyed by the text
   * between "&" and ";" so that this source never contains a literal entity,
   * which a re-encoding step could silently turn into a no-op.
   */
  private static readonly ENTITY_TEXT: Readonly<Record<string, string>> = {
    amp: '&',
    lt: '<',
    gt: '>',
    quot: '"',
    '#39': "'",
    nbsp: ' ',
  };

  /**
   * Detects the kind of Google content, strips source-specific chrome, and
   * converts whatever HTML remains to plain text.
   *
   * @param raw Raw file/page content.
   * @param sourceUrl Optional origin URL; a `sites.google.com` URL selects the Google Sites path.
   * @returns Title (or `'Untitled'`), trimmed text content, and `contentType: 'text'`.
   */
  extract(raw: string, sourceUrl?: string): ExtractResult {
    const isGoogleSites = sourceUrl?.includes('sites.google.com') || raw.includes('tyJCtd');
    const isGoogleDoc = raw.includes('docs-internal-guid') || raw.includes('kix-');

    let content = raw;
    let title = 'Untitled';

    if (isGoogleSites) {
      ({ content, title } = this.extractGoogleSites(raw));
    } else if (isGoogleDoc) {
      ({ content, title } = this.extractGoogleDoc(raw));
    } else {
      // Generic: might be a plain text/markdown file from Drive
      title = this.extractTitle(raw);
    }

    // Heuristic: any text containing both "<" and ">" is treated as HTML.
    if (content.includes('<') && content.includes('>')) {
      content = this.htmlToText(content);
    }

    return { title, content: content.trim(), contentType: 'text' };
  }

  /** Strips Google Sites navigation/chrome and narrows to the main content container when one is found. */
  private extractGoogleSites(html: string): { content: string; title: string } {
    const title = this.cleanTitle(this.matchTitleTag(html) || 'Untitled')
      .replace(/\s*-\s*Google Sites\s*$/i, '')
      .trim();

    let content = html
      // Navigation, header and footer containers
      .replace(/<[^>]*class="[^"]*(?:navigation|yp5lHe|MnRGSb|VsJjTc|QxVDse|dR43Bb)[^"]*"[^>]*>[\s\S]*?<\/[^>]+>/gi, '')
      // Edit and share buttons
      .replace(/<[^>]*class="[^"]*(?:edit-button|share-button|fab-container)[^"]*"[^>]*>[\s\S]*?<\/[^>]+>/gi, '');

    const mainContent = this.extractByClass(content, 'tyJCtd') || this.extractByClass(content, 'IFjolb');
    if (mainContent) content = mainContent;

    return { content, title };
  }

  /** Strips Google Docs export artifacts: internal GUIDs, kix markers, suggestions, comments, font links. */
  private extractGoogleDoc(html: string): { content: string; title: string } {
    const title = this.cleanTitle(this.matchTitleTag(html) || 'Untitled');

    const content = html
      // Google Docs internal GUIDs
      .replace(/\s*id="docs-internal-guid-[^"]*"/gi, '')
      // kix-* marker tags (opening tag only)
      .replace(/<[^>]*class="[^"]*kix-[^"]*"[^>]*>/gi, '')
      // Suggested edits
      .replace(/<[^>]*class="[^"]*(?:docos-suggestion|docos-rewrite)[^"]*"[^>]*>[\s\S]*?<\/[^>]+>/gi, '')
      // Comment anchors
      .replace(/<[^>]*class="[^"]*docos-comment[^"]*"[^>]*>[\s\S]*?<\/[^>]+>/gi, '')
      // Google font imports
      .replace(/<link[^>]*fonts\.googleapis[^>]*>/gi, '')
      // Unwrap spans that only restate default styling
      .replace(/<span\s+style="[^"]*(?:font-weight:\s*400|font-style:\s*normal)[^"]*">([\s\S]*?)<\/span>/gi, '$1');

    return { content, title };
  }

  /** Title for generic files: first markdown H1, else the HTML `<title>`, else `'Untitled'`. */
  private extractTitle(raw: string): string {
    const h1 = raw.match(/^#\s+(.+)/m);
    if (h1) return h1[1].trim();
    const titleTag = this.matchTitleTag(raw);
    if (titleTag !== undefined) return this.cleanTitle(titleTag);
    return 'Untitled';
  }

  /** Inner markup of the first `<title>` element, or `undefined` when there is none. */
  private matchTitleTag(html: string): string | undefined {
    return html.match(/<title[^>]*>([\s\S]*?)<\/title>/i)?.[1];
  }

  /** Removes tags from a title fragment, decodes its entities and trims it. */
  private cleanTitle(fragment: string): string {
    return this.decodeEntities(fragment.replace(/<[^>]+>/g, '')).trim();
  }

  /**
   * Inner HTML of the first element whose class attribute contains `className`.
   * The match is lazy, so it ends at the first closing tag of the same element
   * name; nested same-name elements truncate the result. `className` is placed
   * into the pattern verbatim, so callers must pass regex-safe literals.
   */
  private extractByClass(html: string, className: string): string | null {
    const regex = new RegExp(`<([a-z][a-z0-9]*)\\s[^>]*class="[^"]*${className}[^"]*"[^>]*>([\\s\\S]*?)<\\/\\1>`, 'i');
    const match = regex.exec(html);
    return match ? match[2] : null;
  }

  /**
   * Decodes the handful of entities in {@link ENTITY_TEXT} in a single pass.
   * A single pass matters: decoding the ampersand entity in a separate earlier
   * step would double-decode text such as an escaped "less-than" entity.
   */
  private decodeEntities(text: string): string {
    return text.replace(
      /&(amp|lt|gt|quot|#39|nbsp);/g,
      (whole: string, name: string) => GoogleDriveContentExtractor.ENTITY_TEXT[name] ?? whole,
    );
  }

  /** Converts HTML to markdown-flavoured plain text (headings, paragraphs, line breaks, list items). */
  private htmlToText(html: string): string {
    const withoutTags = html
      .replace(/<(script|style|noscript)[^>]*>[\s\S]*?<\/\1>/gi, '')
      .replace(
        /<h([1-6])[^>]*>([\s\S]*?)<\/h\1>/gi,
        (_match: string, level: string, inner: string) =>
          '\n\n' + '#'.repeat(Number(level)) + ' ' + inner.replace(/<[^>]+>/g, '').trim() + '\n\n',
      )
      .replace(/<\/p>/gi, '\n\n')
      .replace(/<p[^>]*>/gi, '')
      .replace(/<br\s*\/?>/gi, '\n')
      .replace(/<li[^>]*>/gi, '- ')
      .replace(/<\/li>/gi, '\n')
      .replace(/<[^>]+>/g, '');

    // Entities are decoded only after tag stripping so a decoded "<" is never
    // mistaken for markup.
    return this.decodeEntities(withoutTags)
      .replace(/\n{3,}/g, '\n\n')
      .trim();
  }
}
|
|
@@ -1,74 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Layer 1: EXTRACT — GitHub Content Extractor
|
|
3
|
-
*
|
|
4
|
-
* Handles: README.md, docs/, wiki, markdown files, RST, AsciiDoc.
|
|
5
|
-
* Strips GitHub-specific artifacts: badges, CI status, contribution guides,
|
|
6
|
-
* auto-generated TOCs, sponsor sections, PR templates.
|
|
7
|
-
*/
|
|
8
|
-
|
|
9
|
-
import type { ContentExtractor, ExtractResult } from './types.js';
|
|
10
|
-
|
|
11
|
-
/**
 * Extractor for markdown that originates from GitHub (READMEs, docs, wikis).
 * Strips GitHub-specific noise — badges, generated TOCs, HTML comments,
 * sponsor/contributing/license boilerplate — and reports the title and the
 * level 1–3 headings that remain.
 */
export class GitHubContentExtractor implements ContentExtractor {
  /**
   * @param raw Raw markdown content.
   * @param sourceUrl Optional origin URL or path; used only to derive a title
   *   when the content has no level-1 heading.
   * @returns Title, trimmed markdown, `contentType: 'markdown'`, and the list of
   *   heading texts (levels 1–3) found in the cleaned content.
   */
  extract(raw: string, sourceUrl?: string): ExtractResult {
    const content = raw
      // Linked badge images at the start of a line
      .replace(/^\s*(\[!\[[^\]]*\]\([^)]*\)\]\([^)]*\)\s*)+/gm, '')
      // Inline badge images
      .replace(/!\[(?:build|ci|test|coverage|license|npm|version|downloads|stars|forks|issues|badge)[^\]]*\]\([^)]*\)/gi, '')
      // doctoc-generated TOC blocks, markers included. This must run before the
      // marker-only removals below; otherwise the START/END comments are gone
      // and the generated list between them is left behind. The END marker may
      // carry trailing text, so match lazily up to its closing "-->".
      .replace(/<!--\s*START doctoc[\s\S]*?<!--\s*END doctoc[\s\S]*?-->/gi, '')
      // Stand-alone TOC markers
      .replace(/<!--\s*(?:TOC|toc|table-of-contents)\s*-->/gi, '')
      .replace(/<!--\s*(?:START|END)\s+(?:TOC|toc|doctoc)[^-]*-->/gi, '')
      // Any remaining HTML comments
      .replace(/<!--[\s\S]*?-->/g, '')
      // Sponsor / funding sections, up to the next level 1–3 heading or end of input
      .replace(/#{1,3}\s*(?:Sponsors?|Funding|Support(?:ers)?|Backers?|Donate|Patron)\s*\n[\s\S]*?(?=\n#{1,3}\s|\n*$)/gi, '')
      // Contributing section when it is only a pointer to CONTRIBUTING
      .replace(/#{1,3}\s*Contributing\s*\n+(?:(?:Please\s+)?(?:see|read|check)\s+.*CONTRIBUTING.*\n?)+/gi, '')
      // Short license section
      .replace(/#{1,3}\s*License\s*\n+(?:(?:MIT|Apache|BSD|ISC|GPL)[^\n]*\n?){1,3}/gi, '')
      // "Table of Contents" sections consisting only of anchor links
      .replace(/#{1,3}\s*(?:Table of Contents|Contents|TOC)\s*\n(?:\s*[-*]\s*\[.*?\]\(#.*?\)\s*\n?)+/gi, '')
      // GitHub alert markers ("> [!NOTE]") on their own line
      .replace(/^\s*> \[!(?:NOTE|TIP|IMPORTANT|WARNING|CAUTION)\]\s*$/gm, '')
      // Collapse runs of blank lines
      .replace(/\n{4,}/g, '\n\n\n');

    // Title: first level-1 heading, otherwise derived from the source path.
    const titleMatch = content.match(/^#\s+(.+)/m);
    const title = titleMatch ? titleMatch[1].trim() : this.titleFromPath(sourceUrl || '');

    return {
      title,
      content: content.trim(),
      contentType: 'markdown',
      sections: this.extractSections(content),
    };
  }

  /** Last path segment without its extension, with "-" and "_" turned into spaces. */
  private titleFromPath(path: string): string {
    const filename = path.split('/').pop() || path;
    return filename.replace(/\.[^.]+$/, '').replace(/[-_]/g, ' ');
  }

  /** Trimmed text of every level 1–3 markdown heading, in document order. */
  private extractSections(content: string): string[] {
    return Array.from(content.matchAll(/^#{1,3}\s+(.+)/gm), match => match[1].trim());
  }
}
|
|
@@ -1,69 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Layer 1: EXTRACT — SharePoint/OneDrive Content Extractor
|
|
3
|
-
*
|
|
4
|
-
* Handles: SharePoint pages, Word docs (HTML export), OneDrive files.
|
|
5
|
-
* Strips: SharePoint chrome, metadata panels, version history, ribbon UI,
|
|
6
|
-
* Microsoft-specific markup (mso-*, o:p, v:shape).
|
|
7
|
-
*/
|
|
8
|
-
|
|
9
|
-
import type { ContentExtractor, ExtractResult } from './types.js';
|
|
10
|
-
|
|
11
|
-
/**
 * Extracts readable text from SharePoint pages and Word HTML exports.
 *
 * HTML input is first stripped of Office/SharePoint-specific markup, then
 * converted to markdown-like plain text. Non-HTML input only goes through the
 * text conversion step.
 */
export class SharePointContentExtractor implements ContentExtractor {
  /** Named entities decoded by {@link decodeEntities}; `nbsp` becomes a plain space. */
  private static readonly NAMED_ENTITIES: ReadonlyMap<string, string> = new Map([
    ['amp', '&'],
    ['lt', '<'],
    ['gt', '>'],
    ['quot', '"'],
    ['apos', "'"],
    ['nbsp', ' '],
  ]);

  /**
   * @param raw - HTML (SharePoint page / Word export) or plain text.
   * @param _sourceUrl - Unused; present to satisfy the extractor interface.
   * @returns Title (from `<title>` or the first `# ` heading, else
   *   `'Untitled'`) and the cleaned text content.
   */
  extract(raw: string, _sourceUrl?: string): ExtractResult {
    let content = raw;

    // Only run the SharePoint/Word clean-up when the input looks like HTML.
    if (content.includes('<html') || content.includes('<div') || content.includes('mso-')) {
      content = this.cleanSharePointHtml(content);
    }

    // The title must be read before htmlToText drops the <title> element.
    const titleMatch = content.match(/<title[^>]*>([\s\S]*?)<\/title>/i)
      || content.match(/^#\s+(.+)/m);
    const title = titleMatch
      ? this.decodeEntities(
          titleMatch[1].replace(/<[^>]+>/g, '').replace(/\s*[-–|]\s*SharePoint.*$/i, ''),
        ).trim()
      : 'Untitled';

    content = this.htmlToText(content);

    return { title, content: content.trim(), contentType: 'text' };
  }

  /** Removes Office markup, mso-* styles and SharePoint chrome from an HTML string. */
  private cleanSharePointHtml(html: string): string {
    return html
      // Microsoft Office namespaced elements (o:p, v:*, w:*).
      .replace(/<o:p>[\s\S]*?<\/o:p>/gi, '')
      .replace(/<v:[^>]*>[\s\S]*?<\/v:[^>]+>/gi, '')
      .replace(/<w:[^>]*>[\s\S]*?<\/w:[^>]+>/gi, '')
      // mso-* style declarations, then style attributes left empty by that.
      .replace(/\s*mso-[^;:"']+:[^;:"']+;?/gi, '')
      .replace(/\s*style="[\s;]*"/gi, '')
      // SharePoint UI elements. MsoNormal and ExternalClass are deliberately
      // NOT listed: Word puts class="MsoNormal" on ordinary body paragraphs and
      // SharePoint wraps rich-text field content in ExternalClass, so removing
      // those elements deletes the document text itself.
      .replace(/<[^>]*(?:class|id)="[^"]*(?:ms-rte|ms-webpart|ms-core|ms-srch|ms-nav|ms-menu)[^"]*"[^>]*>[\s\S]*?<\/[^>]+>/gi, '')
      // Empty spans left behind by Word export.
      .replace(/<span[^>]*>\s*<\/span>/gi, '')
      // IE conditional comments.
      .replace(/<!--\[if[\s\S]*?<!\[endif\]-->/gi, '')
      // Metadata / version tables.
      .replace(/<table[^>]*(?:class|id)="[^"]*(?:propertysheet|metadata|versionTable)[^"]*"[^>]*>[\s\S]*?<\/table>/gi, '')
      // Ribbon / command bar.
      .replace(/<[^>]*(?:class|id)="[^"]*(?:ribbon|commandBar|suiteBar|globalNav)[^"]*"[^>]*>[\s\S]*?<\/[^>]+>/gi, '');
  }

  /**
   * Converts HTML to markdown-like text: headings become `#` lines, list items
   * become `- ` lines, bold/italic become `**`/`*`, all other tags are dropped
   * and entities are decoded.
   */
  private htmlToText(html: string): string {
    const text = html
      // Non-content elements; <title> is included so it does not leak into the body.
      .replace(/<(script|style|noscript|title)\b[^>]*>[\s\S]*?<\/\1>/gi, '')
      .replace(/<h([1-6])[^>]*>([\s\S]*?)<\/h\1>/gi, (_m: string, level: string, inner: string) =>
        '\n\n' + '#'.repeat(Number(level)) + ' ' + inner.replace(/<[^>]+>/g, '').trim() + '\n\n')
      // \b keeps <p> from matching <pre>, <li> from <link>, <b> from <body>,
      // and <i> from <img>.
      .replace(/<\/p>/gi, '\n\n').replace(/<p\b[^>]*>/gi, '')
      .replace(/<br\s*\/?>/gi, '\n')
      .replace(/<li\b[^>]*>/gi, '- ').replace(/<\/li>/gi, '\n')
      .replace(/<(strong|b)\b[^>]*>([\s\S]*?)<\/\1>/gi, '**$2**')
      .replace(/<(em|i)\b[^>]*>([\s\S]*?)<\/\1>/gi, '*$2*')
      .replace(/<[^>]+>/g, '');

    // Decode only after tag stripping so that a decoded "<" is kept as text.
    return this.decodeEntities(text)
      .replace(/\n{3,}/g, '\n\n')
      .trim();
  }

  /**
   * Decodes the basic named entities plus decimal/hex numeric references in a
   * single pass, so `&amp;lt;` yields the literal text `&lt;` instead of being
   * decoded twice. Unknown entities are left untouched.
   */
  private decodeEntities(text: string): string {
    return text.replace(/&(#x[0-9a-f]+|#\d+|[a-z][a-z0-9]*);/gi, (entity: string, body: string) => {
      if (body.startsWith('#')) {
        const isHex = body[1] === 'x' || body[1] === 'X';
        const code = parseInt(body.slice(isHex ? 2 : 1), isHex ? 16 : 10);
        // String.fromCodePoint throws a RangeError above U+10FFFF.
        return code <= 0x10ffff ? String.fromCodePoint(code) : entity;
      }
      return SharePointContentExtractor.NAMED_ENTITIES.get(body) ?? entity;
    });
  }
}
|
|
@@ -1,275 +0,0 @@
|
|
|
1
|
-
/**
|
|
2
|
-
* Layer 1: EXTRACT — Web/URL Content Extractor
|
|
3
|
-
*
|
|
4
|
-
* Handles: Intercom, Zendesk, Freshdesk, GitBook, ReadTheDocs, Docusaurus,
|
|
5
|
-
* MkDocs, generic help centers, blogs, docs sites.
|
|
6
|
-
*
|
|
7
|
-
* Strategy: Detect the platform → use platform-specific selectors → fallback to generic.
|
|
8
|
-
*/
|
|
9
|
-
|
|
10
|
-
import type { ContentExtractor, ExtractResult } from './types.js';
|
|
11
|
-
|
|
12
|
-
/** Describes how to recognise one documentation/help-center platform and where its content lives. */
interface PlatformRule {
  /** Short platform identifier, e.g. `'zendesk'`. */
  name: string;

  /** Returns true when the page HTML (and optionally its URL) belongs to this platform. */
  detect: (html: string, url?: string) => boolean;

  /** Selectors used to locate the main content; tried in the order listed. */
  contentSelectors: string[];

  /** Selectors for elements that are removed before the content is extracted. */
  removeSelectors: string[];

  /** Optional selector for the element that holds the page title. */
  titleSelector?: string;
}
|
|
22
|
-
|
|
23
|
-
/**
 * Builds a detector that fires when the URL contains any of `urlNeedles` or
 * the HTML contains any of `htmlNeedles` (plain, case-sensitive substring tests).
 */
const platformDetector = (urlNeedles: readonly string[], htmlNeedles: readonly string[]) =>
  (html: string, url?: string): boolean =>
    urlNeedles.some(needle => !!url?.includes(needle))
    || htmlNeedles.some(needle => html.includes(needle));

/**
 * Known platforms, checked in array order — the first rule whose `detect`
 * returns true is the one a `find` over this list yields.
 */
const PLATFORM_RULES: PlatformRule[] = [
  {
    name: 'intercom',
    detect: platformDetector(['intercom.help'], ['intercom-container', 'intercom']),
    contentSelectors: ['article__body', 'article-body', 'c__2GA', 'article__content'],
    removeSelectors: ['intercom-reaction', 'article__actions', 'article-footer', 'article__footer', 'related-articles', 'feedback'],
    titleSelector: 'article__title',
  },
  {
    name: 'zendesk',
    detect: platformDetector(['zendesk.com'], ['zd-', 'zendesk']),
    contentSelectors: ['article-body', 'article_body', 'zd-article-body'],
    removeSelectors: ['article-votes', 'article-footer', 'article-sidebar', 'share-', 'follow-article'],
  },
  {
    name: 'freshdesk',
    detect: platformDetector(['freshdesk.com'], ['freshdesk']),
    contentSelectors: ['article-body', 'solution-article-body', 'fr-element-'],
    removeSelectors: ['article-feedback', 'article-footer', 'article-tools'],
  },
  {
    name: 'gitbook',
    detect: platformDetector(['gitbook.io'], ['gitbook', 'BookBody']),
    contentSelectors: ['page-inner', 'page-body', 'markdown-section', 'page-content-wrapper'],
    removeSelectors: ['page-footer', 'navigation', 'header', 'search-'],
  },
  {
    name: 'docusaurus',
    detect: platformDetector([], ['docusaurus', 'docs-doc-id']),
    contentSelectors: ['markdown', 'docMainContainer', 'docs-doc-page'],
    removeSelectors: ['pagination-nav', 'table-of-contents', 'theme-doc-sidebar', 'navbar', 'footer'],
  },
  {
    name: 'readthedocs',
    detect: platformDetector(['readthedocs'], ['rst-content', 'wy-']),
    contentSelectors: ['rst-content', 'document', 'body-content'],
    removeSelectors: ['wy-nav-side', 'wy-nav-top', 'rst-footer', 'footer'],
  },
  {
    name: 'mkdocs',
    detect: platformDetector([], ['mkdocs', 'md-content']),
    contentSelectors: ['md-content', 'md-main', 'content'],
    removeSelectors: ['md-sidebar', 'md-header', 'md-footer', 'md-tabs'],
  },
  {
    name: 'notion',
    detect: platformDetector(['notion.so', 'notion.site'], ['notion-']),
    contentSelectors: ['notion-page-content', 'layout-content', 'notion-frame'],
    removeSelectors: ['notion-topbar', 'notion-sidebar', 'notion-overlay-container'],
  },
  {
    name: 'confluence',
    detect: platformDetector(['atlassian.net/wiki'], ['confluence', 'wiki-content']),
    contentSelectors: ['wiki-content', 'confluence-information-macro', 'page-content-body'],
    removeSelectors: ['page-metadata', 'likes-section', 'content-navigation', 'page-restrictions'],
  },
  {
    name: 'medium',
    detect: platformDetector(['medium.com'], ['Medium', 'graf--']),
    contentSelectors: ['postArticle-content', 'section-content', 'story-body'],
    removeSelectors: ['metabar', 'postActions', 'js-postShareWidget', 'response'],
  },
];
|
|
86
|
-
|
|
87
|
-
/**
 * Extracts title, author and readable text from an HTML page.
 *
 * The page is matched against PLATFORM_RULES; a matching rule supplies the
 * selectors used to cut out the main content, otherwise generic heuristics
 * are used. The selected HTML is then converted to markdown-like text.
 */
export class WebContentExtractor implements ContentExtractor {
  /** Named entities decoded by {@link decodeEntities}; `nbsp` becomes a plain space. */
  private static readonly NAMED_ENTITIES: ReadonlyMap<string, string> = new Map([
    ['amp', '&'],
    ['lt', '<'],
    ['gt', '>'],
    ['quot', '"'],
    ['apos', "'"],
    ['nbsp', ' '],
  ]);

  /**
   * @param raw - Full HTML of the page.
   * @param sourceUrl - Optional page URL, passed to the platform detectors.
   * @returns Title, cleaned text content and, when found, the author.
   */
  extract(raw: string, sourceUrl?: string): ExtractResult {
    // First rule that recognises the page wins.
    const platform = PLATFORM_RULES.find(r => r.detect(raw, sourceUrl));

    const title = this.extractTitle(raw, platform);

    let content = platform
      ? this.extractWithPlatformRules(raw, platform)
      : this.extractGeneric(raw);

    content = this.htmlToCleanText(content);

    const author = this.extractAuthor(raw);

    return { title, content, contentType: 'text', author };
  }

  /**
   * Resolves the page title, trying in order: the platform's title selector,
   * `og:title`, the first `<h1>`, then `<title>` with a trailing site-name
   * suffix removed. Falls back to `'Untitled'`.
   */
  private extractTitle(html: string, platform?: PlatformRule): string {
    if (platform?.titleSelector) {
      const match = this.extractByClassOrId(html, platform.titleSelector);
      if (match) return this.decodeEntities(this.stripTags(match)).trim();
    }

    const ogTitle = html.match(/<meta\s+property="og:title"\s+content="([^"]*?)"/i);
    if (ogTitle) return this.decodeEntities(ogTitle[1]);

    const h1 = html.match(/<h1[^>]*>([\s\S]*?)<\/h1>/i);
    if (h1) return this.decodeEntities(this.stripTags(h1[1])).trim();

    const title = html.match(/<title[^>]*>([\s\S]*?)<\/title>/i);
    if (title) {
      return this.decodeEntities(title[1])
        // Drop " | Site" / " - Site" suffixes. Dashes only count as a separator
        // when surrounded by whitespace, so "Self-hosting guide" stays intact.
        .replace(/\s*(?:\||\s[–—-]\s)\s*.+$/, '')
        .trim();
    }

    return 'Untitled';
  }

  /**
   * Removes the platform's unwanted elements, then returns the first content
   * selector hit longer than 100 characters; otherwise falls back to the
   * generic extraction on the already-cleaned HTML.
   */
  private extractWithPlatformRules(html: string, platform: PlatformRule): string {
    let cleaned = html;
    for (const sel of platform.removeSelectors) {
      // Element whose class or id contains the selector, up to the first closing tag.
      const regex = new RegExp(`<[^>]*(?:class|id)="[^"]*${this.escRegex(sel)}[^"]*"[^>]*>[\\s\\S]*?<\\/[^>]+>`, 'gi');
      cleaned = cleaned.replace(regex, '');
    }

    for (const sel of platform.contentSelectors) {
      const extracted = this.extractByClassOrId(cleaned, sel);
      if (extracted && extracted.length > 100) return extracted;
    }

    return this.extractGeneric(cleaned);
  }

  /**
   * Platform-independent extraction: strips non-content elements, then returns
   * the inner HTML of `<main>`/`<article>`/`role="main"`, else of a common
   * content container (> 200 chars), else of `<body>`, else everything left.
   */
  private extractGeneric(html: string): string {
    let content = html;

    const removePatterns = [
      /<(script|style|noscript|iframe|svg|object|embed|applet|video|audio|canvas|map|form)[^>]*>[\s\S]*?<\/\1>/gi,
      /<(nav|header|footer|aside)[^>]*>[\s\S]*?<\/\1>/gi,
      /<[^>]*(?:class|id)="[^"]*(?:nav|menu|sidebar|footer|header|cookie|banner|modal|popup|overlay|breadcrumb|pagination|social|share|comment|ad-|ads-|advert|promo|signup|newsletter|subscribe)[^"]*"[^>]*>[\s\S]*?<\/[^>]+>/gi,
      /<[^>]*role="(?:navigation|banner|complementary|contentinfo|search)"[^>]*>[\s\S]*?<\/[^>]+>/gi,
      /<[^>]*aria-hidden="true"[^>]*>[\s\S]*?<\/[^>]+>/gi,
    ];

    for (const pattern of removePatterns) {
      content = content.replace(pattern, '');
    }

    const mainMatch = content.match(/<(?:main|article)[^>]*>([\s\S]*?)<\/(?:main|article)>/i)
      || content.match(/<[^>]*role="main"[^>]*>([\s\S]*?)<\/[^>]+>/i);

    if (mainMatch) return mainMatch[1];

    for (const cls of ['content', 'post-content', 'entry-content', 'article-content', 'page-content', 'main-content', 'doc-content', 'body-content']) {
      const extracted = this.extractByClassOrId(content, cls);
      if (extracted && extracted.length > 200) return extracted;
    }

    const bodyMatch = content.match(/<body[^>]*>([\s\S]*?)<\/body>/i);
    return bodyMatch ? bodyMatch[1] : content;
  }

  /**
   * Converts HTML to markdown-like text. Tag names are matched with a word
   * boundary so that short names do not swallow longer ones (`<p>` vs `<pre>`,
   * `<b>` vs `<body>`, `<i>` vs `<img>`, `<th>` vs `<thead>`, `<a>` vs
   * `<article>`); without it `<pre>` is stripped before the code-block rule
   * runs and fenced code blocks are never produced.
   */
  private htmlToCleanText(html: string): string {
    const text = html
      // Headings → markdown
      .replace(/<h([1-6])[^>]*>([\s\S]*?)<\/h\1>/gi, (_m: string, level: string, inner: string) =>
        '\n\n' + '#'.repeat(Number(level)) + ' ' + this.stripTags(inner).trim() + '\n\n')
      // Paragraphs
      .replace(/<\/p>/gi, '\n\n').replace(/<p\b[^>]*>/gi, '')
      // Line breaks
      .replace(/<br\s*\/?>/gi, '\n')
      // Lists
      .replace(/<\/li>/gi, '\n').replace(/<li\b[^>]*>/gi, '- ')
      .replace(/<\/?[ou]l\b[^>]*>/gi, '\n')
      // Blockquotes
      .replace(/<blockquote\b[^>]*>([\s\S]*?)<\/blockquote>/gi, (_m: string, inner: string) =>
        '\n> ' + this.stripTags(inner).trim().replace(/\n/g, '\n> ') + '\n')
      // Code: fenced blocks first, then inline
      .replace(/<pre\b[^>]*><code\b[^>]*>([\s\S]*?)<\/code><\/pre>/gi, '\n```\n$1\n```\n')
      .replace(/<code\b[^>]*>([\s\S]*?)<\/code>/gi, '`$1`')
      // Bold/italic
      .replace(/<(strong|b)\b[^>]*>([\s\S]*?)<\/\1>/gi, '**$2**')
      .replace(/<(em|i)\b[^>]*>([\s\S]*?)<\/\1>/gi, '*$2*')
      // Tables → simple text
      .replace(/<tr\b[^>]*>/gi, '\n').replace(/<td\b[^>]*>/gi, ' | ').replace(/<th\b[^>]*>/gi, ' | ')
      .replace(/<\/?table\b[^>]*>/gi, '\n').replace(/<\/?t(?:head|body|foot|r|d|h)\b[^>]*>/gi, '')
      // Images → alt text
      .replace(/<img\b[^>]*alt="([^"]*)"[^>]*>/gi, '[$1]')
      .replace(/<img\b[^>]*>/gi, '')
      // Anchors → text only (drop href)
      .replace(/<a\b[^>]*>([\s\S]*?)<\/a>/gi, '$1')
      // Strip all remaining tags
      .replace(/<[^>]+>/g, '');

    // Decode after tag stripping so a decoded "<" survives as text; entities
    // this class does not know are replaced by a space.
    return this.decodeEntities(text, ' ').trim();
  }

  /**
   * Returns the inner HTML of the first element whose `class` or `id`
   * attribute (double-quoted) contains `selector`, or null when there is no
   * such element or its closing tag cannot be found. Nested elements of the
   * same tag name are balanced by counting open/close tags.
   */
  private extractByClassOrId(html: string, selector: string): string | null {
    const regex = new RegExp(`<([a-z][a-z0-9]*)\\s[^>]*(?:class|id)="[^"]*${this.escRegex(selector)}[^"]*"[^>]*>`, 'i');
    const match = regex.exec(html);
    if (!match) return null;

    const tag = match[1];
    const startIdx = match.index + match[0].length;
    let depth = 1;
    let idx = startIdx;
    const openTag = new RegExp(`<${tag}[\\s>]`, 'gi');
    const closeTag = new RegExp(`</${tag}>`, 'gi');

    while (depth > 0 && idx < html.length) {
      // Both scans restart from the current position on every iteration.
      openTag.lastIndex = idx;
      closeTag.lastIndex = idx;
      const nextOpen = openTag.exec(html);
      const nextClose = closeTag.exec(html);

      // Unbalanced markup: give up rather than return a truncated slice.
      if (!nextClose) break;

      if (nextOpen && nextOpen.index < nextClose.index) {
        depth++;
        idx = nextOpen.index + nextOpen[0].length;
      } else {
        depth--;
        if (depth === 0) return html.slice(startIdx, nextClose.index);
        idx = nextClose.index + nextClose[0].length;
      }
    }
    return null;
  }

  /**
   * Finds the author from a `<meta name="author">` / `article:author` tag, or
   * failing that from a "by"/"author" byline followed by two capitalised words.
   */
  private extractAuthor(html: string): string | undefined {
    const meta = html.match(/<meta\s+(?:name="author"|property="article:author")\s+content="([^"]*?)"/i);
    if (meta) return meta[1];

    // The keyword is matched case-insensitively, but the name itself must be
    // "Capitalised Capitalised"; putting both in one /i regex would accept any
    // two lowercase words (e.g. "nearby some thing" → "some thing").
    for (const byline of html.matchAll(/\b(?:by|author)\s*[:\s]*([a-z]+\s+[a-z]+)/gi)) {
      if (/^[A-Z][a-z]+\s+[A-Z][a-z]+$/.test(byline[1])) return byline[1];
    }
    return undefined;
  }

  /** Removes every `<...>` tag, keeping the text between tags. */
  private stripTags(html: string): string {
    return html.replace(/<[^>]+>/g, '');
  }

  /**
   * Decodes the basic named entities plus decimal/hex numeric references in a
   * single pass, so `&amp;lt;` yields the literal text `&lt;` instead of being
   * decoded twice.
   *
   * @param text - Text that may contain HTML entities.
   * @param unknownAs - Replacement for named entities this class does not
   *   know; when omitted such entities are left untouched.
   */
  private decodeEntities(text: string, unknownAs?: string): string {
    return text.replace(/&(#x[0-9a-f]+|#\d+|[a-z][a-z0-9]*);/gi, (entity: string, body: string) => {
      if (body.startsWith('#')) {
        const isHex = body[1] === 'x' || body[1] === 'X';
        const code = parseInt(body.slice(isHex ? 2 : 1), isHex ? 16 : 10);
        // fromCodePoint handles code points above U+FFFF but throws above U+10FFFF.
        return code <= 0x10ffff ? String.fromCodePoint(code) : entity;
      }
      return WebContentExtractor.NAMED_ENTITIES.get(body) ?? unknownAs ?? entity;
    });
  }

  /** Escapes regex metacharacters so `str` can be embedded in a RegExp source. */
  private escRegex(str: string): string {
    return str.replace(/[.*+?^${}()|[\]\\]/g, '\\$&');
  }
}
|