@hongmaple0820/med-scale-research-os 0.43.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.scale/mcp-servers.yaml +144 -0
- package/.scale/skills.json +830 -0
- package/.scale/verification.json +52 -0
- package/LICENSE +15 -0
- package/README.en.md +156 -0
- package/README.md +156 -0
- package/dist/adapters/AiderAdapter.d.ts +22 -0
- package/dist/adapters/AiderAdapter.js +262 -0
- package/dist/adapters/AiderAdapter.js.map +1 -0
- package/dist/adapters/AntigravityAdapter.d.ts +4 -0
- package/dist/adapters/AntigravityAdapter.js +21 -0
- package/dist/adapters/AntigravityAdapter.js.map +1 -0
- package/dist/adapters/ClaudeCodeAdapter.d.ts +54 -0
- package/dist/adapters/ClaudeCodeAdapter.js +185 -0
- package/dist/adapters/ClaudeCodeAdapter.js.map +1 -0
- package/dist/adapters/ClineAdapter.d.ts +4 -0
- package/dist/adapters/ClineAdapter.js +20 -0
- package/dist/adapters/ClineAdapter.js.map +1 -0
- package/dist/adapters/CodexAdapter.d.ts +15 -0
- package/dist/adapters/CodexAdapter.js +160 -0
- package/dist/adapters/CodexAdapter.js.map +1 -0
- package/dist/adapters/CursorAdapter.d.ts +14 -0
- package/dist/adapters/CursorAdapter.js +171 -0
- package/dist/adapters/CursorAdapter.js.map +1 -0
- package/dist/adapters/DeepSeekTuiAdapter.d.ts +19 -0
- package/dist/adapters/DeepSeekTuiAdapter.js +263 -0
- package/dist/adapters/DeepSeekTuiAdapter.js.map +1 -0
- package/dist/adapters/DoubaoAdapter.d.ts +14 -0
- package/dist/adapters/DoubaoAdapter.js +184 -0
- package/dist/adapters/DoubaoAdapter.js.map +1 -0
- package/dist/adapters/GeminiAdapter.d.ts +14 -0
- package/dist/adapters/GeminiAdapter.js +163 -0
- package/dist/adapters/GeminiAdapter.js.map +1 -0
- package/dist/adapters/GenericProjectAgentAdapter.d.ts +29 -0
- package/dist/adapters/GenericProjectAgentAdapter.js +204 -0
- package/dist/adapters/GenericProjectAgentAdapter.js.map +1 -0
- package/dist/adapters/HermesAdapter.d.ts +14 -0
- package/dist/adapters/HermesAdapter.js +163 -0
- package/dist/adapters/HermesAdapter.js.map +1 -0
- package/dist/adapters/JCodeAdapter.d.ts +4 -0
- package/dist/adapters/JCodeAdapter.js +19 -0
- package/dist/adapters/JCodeAdapter.js.map +1 -0
- package/dist/adapters/KiloCodeAdapter.d.ts +4 -0
- package/dist/adapters/KiloCodeAdapter.js +20 -0
- package/dist/adapters/KiloCodeAdapter.js.map +1 -0
- package/dist/adapters/KimiAdapter.d.ts +14 -0
- package/dist/adapters/KimiAdapter.js +183 -0
- package/dist/adapters/KimiAdapter.js.map +1 -0
- package/dist/adapters/KiroAdapter.d.ts +14 -0
- package/dist/adapters/KiroAdapter.js +180 -0
- package/dist/adapters/KiroAdapter.js.map +1 -0
- package/dist/adapters/OpenClawAdapter.d.ts +14 -0
- package/dist/adapters/OpenClawAdapter.js +163 -0
- package/dist/adapters/OpenClawAdapter.js.map +1 -0
- package/dist/adapters/OpenCodeAdapter.d.ts +14 -0
- package/dist/adapters/OpenCodeAdapter.js +172 -0
- package/dist/adapters/OpenCodeAdapter.js.map +1 -0
- package/dist/adapters/QCoderAdapter.d.ts +14 -0
- package/dist/adapters/QCoderAdapter.js +159 -0
- package/dist/adapters/QCoderAdapter.js.map +1 -0
- package/dist/adapters/QoderAdapter.d.ts +4 -0
- package/dist/adapters/QoderAdapter.js +21 -0
- package/dist/adapters/QoderAdapter.js.map +1 -0
- package/dist/adapters/TraeAdapter.d.ts +14 -0
- package/dist/adapters/TraeAdapter.js +159 -0
- package/dist/adapters/TraeAdapter.js.map +1 -0
- package/dist/adapters/VSCAdapter.d.ts +14 -0
- package/dist/adapters/VSCAdapter.js +159 -0
- package/dist/adapters/VSCAdapter.js.map +1 -0
- package/dist/adapters/WindsurfAdapter.d.ts +14 -0
- package/dist/adapters/WindsurfAdapter.js +185 -0
- package/dist/adapters/WindsurfAdapter.js.map +1 -0
- package/dist/adapters/WorkBuddyAdapter.d.ts +14 -0
- package/dist/adapters/WorkBuddyAdapter.js +159 -0
- package/dist/adapters/WorkBuddyAdapter.js.map +1 -0
- package/dist/adapters/index.d.ts +32 -0
- package/dist/adapters/index.js +87 -0
- package/dist/adapters/index.js.map +1 -0
- package/dist/agents/AgentChannel.d.ts +43 -0
- package/dist/agents/AgentChannel.js +136 -0
- package/dist/agents/AgentChannel.js.map +1 -0
- package/dist/agents/AgentCoordinator.d.ts +29 -0
- package/dist/agents/AgentCoordinator.js +136 -0
- package/dist/agents/AgentCoordinator.js.map +1 -0
- package/dist/agents/AgentDispatcher.d.ts +24 -0
- package/dist/agents/AgentDispatcher.js +112 -0
- package/dist/agents/AgentDispatcher.js.map +1 -0
- package/dist/agents/AgentManager.d.ts +14 -0
- package/dist/agents/AgentManager.js +85 -0
- package/dist/agents/AgentManager.js.map +1 -0
- package/dist/agents/AgentPool.d.ts +59 -0
- package/dist/agents/AgentPool.js +192 -0
- package/dist/agents/AgentPool.js.map +1 -0
- package/dist/agents/AgentRegistry.d.ts +20 -0
- package/dist/agents/AgentRegistry.js +36 -0
- package/dist/agents/AgentRegistry.js.map +1 -0
- package/dist/agents/AgentSourceLoader.d.ts +73 -0
- package/dist/agents/AgentSourceLoader.js +103 -0
- package/dist/agents/AgentSourceLoader.js.map +1 -0
- package/dist/agents/IAgent.d.ts +53 -0
- package/dist/agents/IAgent.js +4 -0
- package/dist/agents/IAgent.js.map +1 -0
- package/dist/agents/LeadershipPresets.d.ts +16 -0
- package/dist/agents/LeadershipPresets.js +152 -0
- package/dist/agents/LeadershipPresets.js.map +1 -0
- package/dist/agents/definitions/debugger.d.ts +2 -0
- package/dist/agents/definitions/debugger.js +6 -0
- package/dist/agents/definitions/debugger.js.map +1 -0
- package/dist/agents/definitions/doc-writer.d.ts +2 -0
- package/dist/agents/definitions/doc-writer.js +6 -0
- package/dist/agents/definitions/doc-writer.js.map +1 -0
- package/dist/agents/definitions/implementer.d.ts +2 -0
- package/dist/agents/definitions/implementer.js +6 -0
- package/dist/agents/definitions/implementer.js.map +1 -0
- package/dist/agents/definitions/planner.d.ts +2 -0
- package/dist/agents/definitions/planner.js +6 -0
- package/dist/agents/definitions/planner.js.map +1 -0
- package/dist/agents/definitions/researcher.d.ts +2 -0
- package/dist/agents/definitions/researcher.js +6 -0
- package/dist/agents/definitions/researcher.js.map +1 -0
- package/dist/agents/definitions/reviewer.d.ts +2 -0
- package/dist/agents/definitions/reviewer.js +6 -0
- package/dist/agents/definitions/reviewer.js.map +1 -0
- package/dist/agents/definitions/security.d.ts +2 -0
- package/dist/agents/definitions/security.js +6 -0
- package/dist/agents/definitions/security.js.map +1 -0
- package/dist/agents/definitions/tester.d.ts +2 -0
- package/dist/agents/definitions/tester.js +6 -0
- package/dist/agents/definitions/tester.js.map +1 -0
- package/dist/agents/index.d.ts +23 -0
- package/dist/agents/index.js +44 -0
- package/dist/agents/index.js.map +1 -0
- package/dist/agents/profiles.d.ts +26 -0
- package/dist/agents/profiles.js +197 -0
- package/dist/agents/profiles.js.map +1 -0
- package/dist/agents/types.d.ts +262 -0
- package/dist/agents/types.js +4 -0
- package/dist/agents/types.js.map +1 -0
- package/dist/api/cli.d.ts +2 -0
- package/dist/api/cli.js +6678 -0
- package/dist/api/cli.js.map +1 -0
- package/dist/api/doctor.d.ts +83 -0
- package/dist/api/doctor.js +982 -0
- package/dist/api/doctor.js.map +1 -0
- package/dist/api/mcp.d.ts +32 -0
- package/dist/api/mcp.js +223 -0
- package/dist/api/mcp.js.map +1 -0
- package/dist/api/medscale.d.ts +2 -0
- package/dist/api/medscale.js +20 -0
- package/dist/api/medscale.js.map +1 -0
- package/dist/api/quickstart.d.ts +86 -0
- package/dist/api/quickstart.js +291 -0
- package/dist/api/quickstart.js.map +1 -0
- package/dist/artifact/fsm.d.ts +41 -0
- package/dist/artifact/fsm.js +221 -0
- package/dist/artifact/fsm.js.map +1 -0
- package/dist/artifact/fsmDefinitions.d.ts +18 -0
- package/dist/artifact/fsmDefinitions.js +296 -0
- package/dist/artifact/fsmDefinitions.js.map +1 -0
- package/dist/artifact/sqliteStore.d.ts +61 -0
- package/dist/artifact/sqliteStore.js +381 -0
- package/dist/artifact/sqliteStore.js.map +1 -0
- package/dist/artifact/store.d.ts +49 -0
- package/dist/artifact/store.js +116 -0
- package/dist/artifact/store.js.map +1 -0
- package/dist/artifact/types.d.ts +535 -0
- package/dist/artifact/types.js +74 -0
- package/dist/artifact/types.js.map +1 -0
- package/dist/bootstrap/DependencyBootstrap.d.ts +112 -0
- package/dist/bootstrap/DependencyBootstrap.js +1046 -0
- package/dist/bootstrap/DependencyBootstrap.js.map +1 -0
- package/dist/bootstrap/DependencyBootstrapRenderer.d.ts +3 -0
- package/dist/bootstrap/DependencyBootstrapRenderer.js +138 -0
- package/dist/bootstrap/DependencyBootstrapRenderer.js.map +1 -0
- package/dist/bridge/PythonBridge.d.ts +80 -0
- package/dist/bridge/PythonBridge.js +437 -0
- package/dist/bridge/PythonBridge.js.map +1 -0
- package/dist/bridge/index.d.ts +2 -0
- package/dist/bridge/index.js +7 -0
- package/dist/bridge/index.js.map +1 -0
- package/dist/bridge/medicalWorkflows.d.ts +29 -0
- package/dist/bridge/medicalWorkflows.js +156 -0
- package/dist/bridge/medicalWorkflows.js.map +1 -0
- package/dist/bridge/types.d.ts +381 -0
- package/dist/bridge/types.js +113 -0
- package/dist/bridge/types.js.map +1 -0
- package/dist/cache/ScanCache.d.ts +41 -0
- package/dist/cache/ScanCache.js +120 -0
- package/dist/cache/ScanCache.js.map +1 -0
- package/dist/capabilities/BrowserCapability.d.ts +30 -0
- package/dist/capabilities/BrowserCapability.js +73 -0
- package/dist/capabilities/BrowserCapability.js.map +1 -0
- package/dist/capabilities/BrowserQACapability.d.ts +165 -0
- package/dist/capabilities/BrowserQACapability.js +438 -0
- package/dist/capabilities/BrowserQACapability.js.map +1 -0
- package/dist/capabilities/CapabilityRegistry.d.ts +17 -0
- package/dist/capabilities/CapabilityRegistry.js +65 -0
- package/dist/capabilities/CapabilityRegistry.js.map +1 -0
- package/dist/capabilities/ComputerCapability.d.ts +28 -0
- package/dist/capabilities/ComputerCapability.js +40 -0
- package/dist/capabilities/ComputerCapability.js.map +1 -0
- package/dist/capabilities/InstalledSkillsIntegration.d.ts +69 -0
- package/dist/capabilities/InstalledSkillsIntegration.js +240 -0
- package/dist/capabilities/InstalledSkillsIntegration.js.map +1 -0
- package/dist/capabilities/SearchCapability.d.ts +46 -0
- package/dist/capabilities/SearchCapability.js +88 -0
- package/dist/capabilities/SearchCapability.js.map +1 -0
- package/dist/capabilities/index.d.ts +6 -0
- package/dist/capabilities/index.js +9 -0
- package/dist/capabilities/index.js.map +1 -0
- package/dist/capabilities/types.d.ts +92 -0
- package/dist/capabilities/types.js +7 -0
- package/dist/capabilities/types.js.map +1 -0
- package/dist/cli/autofixCommands.d.ts +22 -0
- package/dist/cli/autofixCommands.js +32 -0
- package/dist/cli/autofixCommands.js.map +1 -0
- package/dist/cli/cortexCommands.d.ts +71 -0
- package/dist/cli/cortexCommands.js +335 -0
- package/dist/cli/cortexCommands.js.map +1 -0
- package/dist/cli/costCommands.d.ts +13 -0
- package/dist/cli/costCommands.js +48 -0
- package/dist/cli/costCommands.js.map +1 -0
- package/dist/cli/evolutionCommands.d.ts +112 -0
- package/dist/cli/evolutionCommands.js +246 -0
- package/dist/cli/evolutionCommands.js.map +1 -0
- package/dist/cli/gateStatusCommands.d.ts +1 -0
- package/dist/cli/gateStatusCommands.js +52 -0
- package/dist/cli/gateStatusCommands.js.map +1 -0
- package/dist/cli/liteCommands.d.ts +81 -0
- package/dist/cli/liteCommands.js +148 -0
- package/dist/cli/liteCommands.js.map +1 -0
- package/dist/cli/orchCommands.d.ts +43 -0
- package/dist/cli/orchCommands.js +135 -0
- package/dist/cli/orchCommands.js.map +1 -0
- package/dist/cli/phaseCommands.d.ts +248 -0
- package/dist/cli/phaseCommands.js +1878 -0
- package/dist/cli/phaseCommands.js.map +1 -0
- package/dist/cli/promptCommands.d.ts +1 -0
- package/dist/cli/promptCommands.js +57 -0
- package/dist/cli/promptCommands.js.map +1 -0
- package/dist/cli/qaCommands.d.ts +22 -0
- package/dist/cli/qaCommands.js +84 -0
- package/dist/cli/qaCommands.js.map +1 -0
- package/dist/cli/quickstartCommands.d.ts +17 -0
- package/dist/cli/quickstartCommands.js +47 -0
- package/dist/cli/quickstartCommands.js.map +1 -0
- package/dist/cli/runCommand.d.ts +39 -0
- package/dist/cli/runCommand.js +113 -0
- package/dist/cli/runCommand.js.map +1 -0
- package/dist/cli/scoreCommands.d.ts +1 -0
- package/dist/cli/scoreCommands.js +112 -0
- package/dist/cli/scoreCommands.js.map +1 -0
- package/dist/cli/shieldCommands.d.ts +30 -0
- package/dist/cli/shieldCommands.js +212 -0
- package/dist/cli/shieldCommands.js.map +1 -0
- package/dist/cli/targetCommands.d.ts +552 -0
- package/dist/cli/targetCommands.js +3173 -0
- package/dist/cli/targetCommands.js.map +1 -0
- package/dist/cli/tuiCommands.d.ts +7 -0
- package/dist/cli/tuiCommands.js +33 -0
- package/dist/cli/tuiCommands.js.map +1 -0
- package/dist/cli/vibeCommands.d.ts +64 -0
- package/dist/cli/vibeCommands.js +221 -0
- package/dist/cli/vibeCommands.js.map +1 -0
- package/dist/codegraph/CodeIntelligence.d.ts +147 -0
- package/dist/codegraph/CodeIntelligence.js +681 -0
- package/dist/codegraph/CodeIntelligence.js.map +1 -0
- package/dist/config/profiles.d.ts +64 -0
- package/dist/config/profiles.js +223 -0
- package/dist/config/profiles.js.map +1 -0
- package/dist/context/AntiPatternRegistry.d.ts +38 -0
- package/dist/context/AntiPatternRegistry.js +203 -0
- package/dist/context/AntiPatternRegistry.js.map +1 -0
- package/dist/context/CavemanCompressor.d.ts +20 -0
- package/dist/context/CavemanCompressor.js +14 -0
- package/dist/context/CavemanCompressor.js.map +1 -0
- package/dist/context/ContextBudget.d.ts +128 -0
- package/dist/context/ContextBudget.js +423 -0
- package/dist/context/ContextBudget.js.map +1 -0
- package/dist/context/ContextBuilder.d.ts +71 -0
- package/dist/context/ContextBuilder.js +372 -0
- package/dist/context/ContextBuilder.js.map +1 -0
- package/dist/context/ContextCompiler.d.ts +34 -0
- package/dist/context/ContextCompiler.js +120 -0
- package/dist/context/ContextCompiler.js.map +1 -0
- package/dist/context/ProjectAnatomy.d.ts +18 -0
- package/dist/context/ProjectAnatomy.js +287 -0
- package/dist/context/ProjectAnatomy.js.map +1 -0
- package/dist/context/SessionStartSequence.d.ts +54 -0
- package/dist/context/SessionStartSequence.js +162 -0
- package/dist/context/SessionStartSequence.js.map +1 -0
- package/dist/core/ExternalCommand.d.ts +9 -0
- package/dist/core/ExternalCommand.js +70 -0
- package/dist/core/ExternalCommand.js.map +1 -0
- package/dist/core/GbrainRuntime.d.ts +25 -0
- package/dist/core/GbrainRuntime.js +270 -0
- package/dist/core/GbrainRuntime.js.map +1 -0
- package/dist/core/container.d.ts +14 -0
- package/dist/core/container.js +35 -0
- package/dist/core/container.js.map +1 -0
- package/dist/core/eventBus.d.ts +60 -0
- package/dist/core/eventBus.js +157 -0
- package/dist/core/eventBus.js.map +1 -0
- package/dist/core/logger.d.ts +5 -0
- package/dist/core/logger.js +51 -0
- package/dist/core/logger.js.map +1 -0
- package/dist/cortex/GovernanceMetrics.d.ts +66 -0
- package/dist/cortex/GovernanceMetrics.js +230 -0
- package/dist/cortex/GovernanceMetrics.js.map +1 -0
- package/dist/cortex/InstinctExtractor.d.ts +61 -0
- package/dist/cortex/InstinctExtractor.js +184 -0
- package/dist/cortex/InstinctExtractor.js.map +1 -0
- package/dist/cortex/InstinctStore.d.ts +54 -0
- package/dist/cortex/InstinctStore.js +266 -0
- package/dist/cortex/InstinctStore.js.map +1 -0
- package/dist/cortex/ReflexionEngine.d.ts +34 -0
- package/dist/cortex/ReflexionEngine.js +157 -0
- package/dist/cortex/ReflexionEngine.js.map +1 -0
- package/dist/cortex/SessionInjector.d.ts +44 -0
- package/dist/cortex/SessionInjector.js +127 -0
- package/dist/cortex/SessionInjector.js.map +1 -0
- package/dist/cortex/adapters/ClaudeAdapter.d.ts +17 -0
- package/dist/cortex/adapters/ClaudeAdapter.js +61 -0
- package/dist/cortex/adapters/ClaudeAdapter.js.map +1 -0
- package/dist/cortex/adapters/CodexAdapter.d.ts +10 -0
- package/dist/cortex/adapters/CodexAdapter.js +52 -0
- package/dist/cortex/adapters/CodexAdapter.js.map +1 -0
- package/dist/cortex/adapters/CursorAdapter.d.ts +10 -0
- package/dist/cortex/adapters/CursorAdapter.js +46 -0
- package/dist/cortex/adapters/CursorAdapter.js.map +1 -0
- package/dist/cortex/adapters/GeminiAdapter.d.ts +11 -0
- package/dist/cortex/adapters/GeminiAdapter.js +48 -0
- package/dist/cortex/adapters/GeminiAdapter.js.map +1 -0
- package/dist/dashboard/DashboardServer.d.ts +86 -0
- package/dist/dashboard/DashboardServer.js +380 -0
- package/dist/dashboard/DashboardServer.js.map +1 -0
- package/dist/dashboard/MedicalWorkflowData.d.ts +155 -0
- package/dist/dashboard/MedicalWorkflowData.js +664 -0
- package/dist/dashboard/MedicalWorkflowData.js.map +1 -0
- package/dist/dashboard/MetricsAggregator.d.ts +38 -0
- package/dist/dashboard/MetricsAggregator.js +99 -0
- package/dist/dashboard/MetricsAggregator.js.map +1 -0
- package/dist/dashboard/index.d.ts +4 -0
- package/dist/dashboard/index.js +3 -0
- package/dist/dashboard/index.js.map +1 -0
- package/dist/dashboard/server.d.ts +52 -0
- package/dist/dashboard/server.js +84 -0
- package/dist/dashboard/server.js.map +1 -0
- package/dist/env/EnvironmentDoctor.d.ts +66 -0
- package/dist/env/EnvironmentDoctor.js +581 -0
- package/dist/env/EnvironmentDoctor.js.map +1 -0
- package/dist/eval/BenchmarkPublisher.d.ts +25 -0
- package/dist/eval/BenchmarkPublisher.js +27 -0
- package/dist/eval/BenchmarkPublisher.js.map +1 -0
- package/dist/eval/WorkflowEval.d.ts +161 -0
- package/dist/eval/WorkflowEval.js +377 -0
- package/dist/eval/WorkflowEval.js.map +1 -0
- package/dist/evolution/AutoDefectCreator.d.ts +43 -0
- package/dist/evolution/AutoDefectCreator.js +157 -0
- package/dist/evolution/AutoDefectCreator.js.map +1 -0
- package/dist/evolution/BehaviorTracker.d.ts +46 -0
- package/dist/evolution/BehaviorTracker.js +67 -0
- package/dist/evolution/BehaviorTracker.js.map +1 -0
- package/dist/evolution/EvolutionEngine.d.ts +102 -0
- package/dist/evolution/EvolutionEngine.js +326 -0
- package/dist/evolution/EvolutionEngine.js.map +1 -0
- package/dist/evolution/EvolutionEvaluator.d.ts +61 -0
- package/dist/evolution/EvolutionEvaluator.js +118 -0
- package/dist/evolution/EvolutionEvaluator.js.map +1 -0
- package/dist/evolution/LessonValidator.d.ts +36 -0
- package/dist/evolution/LessonValidator.js +132 -0
- package/dist/evolution/LessonValidator.js.map +1 -0
- package/dist/evolution/PatternExtractor.d.ts +40 -0
- package/dist/evolution/PatternExtractor.js +83 -0
- package/dist/evolution/PatternExtractor.js.map +1 -0
- package/dist/evolution/RuleMaturity.d.ts +39 -0
- package/dist/evolution/RuleMaturity.js +70 -0
- package/dist/evolution/RuleMaturity.js.map +1 -0
- package/dist/evolution/SessionLearnings.d.ts +70 -0
- package/dist/evolution/SessionLearnings.js +217 -0
- package/dist/evolution/SessionLearnings.js.map +1 -0
- package/dist/evolution/SkillCreator.d.ts +75 -0
- package/dist/evolution/SkillCreator.js +219 -0
- package/dist/evolution/SkillCreator.js.map +1 -0
- package/dist/fsm/FSMAgentBridge.d.ts +59 -0
- package/dist/fsm/FSMAgentBridge.js +193 -0
- package/dist/fsm/FSMAgentBridge.js.map +1 -0
- package/dist/fsm/index.d.ts +2 -0
- package/dist/fsm/index.js +3 -0
- package/dist/fsm/index.js.map +1 -0
- package/dist/governance/GovernanceRoi.d.ts +30 -0
- package/dist/governance/GovernanceRoi.js +102 -0
- package/dist/governance/GovernanceRoi.js.map +1 -0
- package/dist/governance/ProgressiveGovernance.d.ts +22 -0
- package/dist/governance/ProgressiveGovernance.js +159 -0
- package/dist/governance/ProgressiveGovernance.js.map +1 -0
- package/dist/guardrails/ActiveRedTeam.d.ts +46 -0
- package/dist/guardrails/ActiveRedTeam.js +203 -0
- package/dist/guardrails/ActiveRedTeam.js.map +1 -0
- package/dist/guardrails/DependencyAuditor.d.ts +68 -0
- package/dist/guardrails/DependencyAuditor.js +378 -0
- package/dist/guardrails/DependencyAuditor.js.map +1 -0
- package/dist/guardrails/DetectorEnhanced.d.ts +111 -0
- package/dist/guardrails/DetectorEnhanced.js +202 -0
- package/dist/guardrails/DetectorEnhanced.js.map +1 -0
- package/dist/guardrails/GateEvaluator.d.ts +18 -0
- package/dist/guardrails/GateEvaluator.js +129 -0
- package/dist/guardrails/GateEvaluator.js.map +1 -0
- package/dist/guardrails/Gateway.d.ts +26 -0
- package/dist/guardrails/Gateway.js +56 -0
- package/dist/guardrails/Gateway.js.map +1 -0
- package/dist/guardrails/OWASPDetector.d.ts +58 -0
- package/dist/guardrails/OWASPDetector.js +508 -0
- package/dist/guardrails/OWASPDetector.js.map +1 -0
- package/dist/guardrails/ReviewEnforcer.d.ts +52 -0
- package/dist/guardrails/ReviewEnforcer.js +117 -0
- package/dist/guardrails/ReviewEnforcer.js.map +1 -0
- package/dist/guardrails/advancedDetectors.d.ts +38 -0
- package/dist/guardrails/advancedDetectors.js +188 -0
- package/dist/guardrails/advancedDetectors.js.map +1 -0
- package/dist/guardrails/detectors.d.ts +34 -0
- package/dist/guardrails/detectors.js +332 -0
- package/dist/guardrails/detectors.js.map +1 -0
- package/dist/guardrails/roles.d.ts +4 -0
- package/dist/guardrails/roles.js +54 -0
- package/dist/guardrails/roles.js.map +1 -0
- package/dist/hooks/BugPatternDetector.d.ts +36 -0
- package/dist/hooks/BugPatternDetector.js +207 -0
- package/dist/hooks/BugPatternDetector.js.map +1 -0
- package/dist/hooks/HookDeployer.d.ts +44 -0
- package/dist/hooks/HookDeployer.js +144 -0
- package/dist/hooks/HookDeployer.js.map +1 -0
- package/dist/hooks/HookGeneratorEnhanced.d.ts +67 -0
- package/dist/hooks/HookGeneratorEnhanced.js +641 -0
- package/dist/hooks/HookGeneratorEnhanced.js.map +1 -0
- package/dist/hooks/WorkflowHooksManager.d.ts +30 -0
- package/dist/hooks/WorkflowHooksManager.js +160 -0
- package/dist/hooks/WorkflowHooksManager.js.map +1 -0
- package/dist/hooks/index.d.ts +6 -0
- package/dist/hooks/index.js +5 -0
- package/dist/hooks/index.js.map +1 -0
- package/dist/i18n/Language.d.ts +9 -0
- package/dist/i18n/Language.js +38 -0
- package/dist/i18n/Language.js.map +1 -0
- package/dist/index.d.ts +101 -0
- package/dist/index.js +104 -0
- package/dist/index.js.map +1 -0
- package/dist/knowledge/CerebrumManager.d.ts +25 -0
- package/dist/knowledge/CerebrumManager.js +127 -0
- package/dist/knowledge/CerebrumManager.js.map +1 -0
- package/dist/knowledge/GraphifyKnowledgeBase.d.ts +38 -0
- package/dist/knowledge/GraphifyKnowledgeBase.js +409 -0
- package/dist/knowledge/GraphifyKnowledgeBase.js.map +1 -0
- package/dist/knowledge/KnowledgeBase.d.ts +51 -0
- package/dist/knowledge/KnowledgeBase.js +182 -0
- package/dist/knowledge/KnowledgeBase.js.map +1 -0
- package/dist/knowledge/SQLiteKnowledgeBase.d.ts +29 -0
- package/dist/knowledge/SQLiteKnowledgeBase.js +203 -0
- package/dist/knowledge/SQLiteKnowledgeBase.js.map +1 -0
- package/dist/knowledge/TfidfIndex.d.ts +50 -0
- package/dist/knowledge/TfidfIndex.js +177 -0
- package/dist/knowledge/TfidfIndex.js.map +1 -0
- package/dist/knowledge/UbiquitousLanguageManager.d.ts +49 -0
- package/dist/knowledge/UbiquitousLanguageManager.js +133 -0
- package/dist/knowledge/UbiquitousLanguageManager.js.map +1 -0
- package/dist/memory/MemoryBrain.d.ts +146 -0
- package/dist/memory/MemoryBrain.js +679 -0
- package/dist/memory/MemoryBrain.js.map +1 -0
- package/dist/memory/MemoryFabric.d.ts +130 -0
- package/dist/memory/MemoryFabric.js +317 -0
- package/dist/memory/MemoryFabric.js.map +1 -0
- package/dist/memory/MemoryIntelligence.d.ts +42 -0
- package/dist/memory/MemoryIntelligence.js +215 -0
- package/dist/memory/MemoryIntelligence.js.map +1 -0
- package/dist/memory/MemoryLearning.d.ts +62 -0
- package/dist/memory/MemoryLearning.js +209 -0
- package/dist/memory/MemoryLearning.js.map +1 -0
- package/dist/memory/MemoryProviders.d.ts +165 -0
- package/dist/memory/MemoryProviders.js +940 -0
- package/dist/memory/MemoryProviders.js.map +1 -0
- package/dist/memory/MemoryReview.d.ts +65 -0
- package/dist/memory/MemoryReview.js +260 -0
- package/dist/memory/MemoryReview.js.map +1 -0
- package/dist/memory/index.d.ts +6 -0
- package/dist/memory/index.js +7 -0
- package/dist/memory/index.js.map +1 -0
- package/dist/orchestration/EffectsWiring.d.ts +8 -0
- package/dist/orchestration/EffectsWiring.js +87 -0
- package/dist/orchestration/EffectsWiring.js.map +1 -0
- package/dist/orchestrator/OrchestratorDaemon.d.ts +44 -0
- package/dist/orchestrator/OrchestratorDaemon.js +150 -0
- package/dist/orchestrator/OrchestratorDaemon.js.map +1 -0
- package/dist/orchestrator/PolicyLoader.d.ts +80 -0
- package/dist/orchestrator/PolicyLoader.js +229 -0
- package/dist/orchestrator/PolicyLoader.js.map +1 -0
- package/dist/orchestrator/ReconciliationLoop.d.ts +71 -0
- package/dist/orchestrator/ReconciliationLoop.js +266 -0
- package/dist/orchestrator/ReconciliationLoop.js.map +1 -0
- package/dist/orchestrator/TrackerAdapter.d.ts +60 -0
- package/dist/orchestrator/TrackerAdapter.js +147 -0
- package/dist/orchestrator/TrackerAdapter.js.map +1 -0
- package/dist/orchestrator/WorkspaceManager.d.ts +66 -0
- package/dist/orchestrator/WorkspaceManager.js +257 -0
- package/dist/orchestrator/WorkspaceManager.js.map +1 -0
- package/dist/output/BrandThemeLoader.d.ts +54 -0
- package/dist/output/BrandThemeLoader.js +340 -0
- package/dist/output/BrandThemeLoader.js.map +1 -0
- package/dist/output/GovernanceDashboard.d.ts +59 -0
- package/dist/output/GovernanceDashboard.js +281 -0
- package/dist/output/GovernanceDashboard.js.map +1 -0
- package/dist/output/HTMLArtifactLayer.d.ts +97 -0
- package/dist/output/HTMLArtifactLayer.js +576 -0
- package/dist/output/HTMLArtifactLayer.js.map +1 -0
- package/dist/output/HTMLDocumentRenderer.d.ts +83 -0
- package/dist/output/HTMLDocumentRenderer.js +718 -0
- package/dist/output/HTMLDocumentRenderer.js.map +1 -0
- package/dist/output/UIPrototypeRenderer.d.ts +61 -0
- package/dist/output/UIPrototypeRenderer.js +500 -0
- package/dist/output/UIPrototypeRenderer.js.map +1 -0
- package/dist/output/index.d.ts +10 -0
- package/dist/output/index.js +8 -0
- package/dist/output/index.js.map +1 -0
- package/dist/prompts/PhasePromptRegistry.d.ts +53 -0
- package/dist/prompts/PhasePromptRegistry.js +517 -0
- package/dist/prompts/PhasePromptRegistry.js.map +1 -0
- package/dist/prompts/PromptOptimizer.d.ts +42 -0
- package/dist/prompts/PromptOptimizer.js +309 -0
- package/dist/prompts/PromptOptimizer.js.map +1 -0
- package/dist/prompts/VibeTemplateGallery.d.ts +25 -0
- package/dist/prompts/VibeTemplateGallery.js +295 -0
- package/dist/prompts/VibeTemplateGallery.js.map +1 -0
- package/dist/qa/BrowserDaemon.d.ts +23 -0
- package/dist/qa/BrowserDaemon.js +79 -0
- package/dist/qa/BrowserDaemon.js.map +1 -0
- package/dist/qa/E2ETestOrchestrator.d.ts +14 -0
- package/dist/qa/E2ETestOrchestrator.js +19 -0
- package/dist/qa/E2ETestOrchestrator.js.map +1 -0
- package/dist/review/CrossModelReviewer.d.ts +35 -0
- package/dist/review/CrossModelReviewer.js +75 -0
- package/dist/review/CrossModelReviewer.js.map +1 -0
- package/dist/review/ReviewAggregator.d.ts +13 -0
- package/dist/review/ReviewAggregator.js +28 -0
- package/dist/review/ReviewAggregator.js.map +1 -0
- package/dist/review/reviewCommands.d.ts +15 -0
- package/dist/review/reviewCommands.js +24 -0
- package/dist/review/reviewCommands.js.map +1 -0
- package/dist/routing/LocalModelProvider.d.ts +11 -0
- package/dist/routing/LocalModelProvider.js +21 -0
- package/dist/routing/LocalModelProvider.js.map +1 -0
- package/dist/routing/ModelRouter.d.ts +42 -0
- package/dist/routing/ModelRouter.js +94 -0
- package/dist/routing/ModelRouter.js.map +1 -0
- package/dist/routing/PromptCachePolicy.d.ts +37 -0
- package/dist/routing/PromptCachePolicy.js +97 -0
- package/dist/routing/PromptCachePolicy.js.map +1 -0
- package/dist/runtime/AiOsRuntime.d.ts +485 -0
- package/dist/runtime/AiOsRuntime.js +1846 -0
- package/dist/runtime/AiOsRuntime.js.map +1 -0
- package/dist/runtime/CostAnalyzer.d.ts +53 -0
- package/dist/runtime/CostAnalyzer.js +160 -0
- package/dist/runtime/CostAnalyzer.js.map +1 -0
- package/dist/runtime/CostOptimizer.d.ts +11 -0
- package/dist/runtime/CostOptimizer.js +21 -0
- package/dist/runtime/CostOptimizer.js.map +1 -0
- package/dist/runtime/ExecutionLedger.d.ts +46 -0
- package/dist/runtime/ExecutionLedger.js +71 -0
- package/dist/runtime/ExecutionLedger.js.map +1 -0
- package/dist/runtime/FinalReportGuard.d.ts +16 -0
- package/dist/runtime/FinalReportGuard.js +14 -0
- package/dist/runtime/FinalReportGuard.js.map +1 -0
- package/dist/runtime/ModelUsageLedger.d.ts +101 -0
- package/dist/runtime/ModelUsageLedger.js +296 -0
- package/dist/runtime/ModelUsageLedger.js.map +1 -0
- package/dist/runtime/RuntimeDoctor.d.ts +23 -0
- package/dist/runtime/RuntimeDoctor.js +151 -0
- package/dist/runtime/RuntimeDoctor.js.map +1 -0
- package/dist/runtime/RuntimeEvidenceLedger.d.ts +50 -0
- package/dist/runtime/RuntimeEvidenceLedger.js +89 -0
- package/dist/runtime/RuntimeEvidenceLedger.js.map +1 -0
- package/dist/runtime/SessionLedger.d.ts +53 -0
- package/dist/runtime/SessionLedger.js +104 -0
- package/dist/runtime/SessionLedger.js.map +1 -0
- package/dist/runtime/index.d.ts +7 -0
- package/dist/runtime/index.js +8 -0
- package/dist/runtime/index.js.map +1 -0
- package/dist/setup/SetupVerification.d.ts +42 -0
- package/dist/setup/SetupVerification.js +180 -0
- package/dist/setup/SetupVerification.js.map +1 -0
- package/dist/setup/SetupWizard.d.ts +45 -0
- package/dist/setup/SetupWizard.js +216 -0
- package/dist/setup/SetupWizard.js.map +1 -0
- package/dist/shield/PolicyCompiler.d.ts +70 -0
- package/dist/shield/PolicyCompiler.js +540 -0
- package/dist/shield/PolicyCompiler.js.map +1 -0
- package/dist/shield/ProtectedPaths.d.ts +39 -0
- package/dist/shield/ProtectedPaths.js +179 -0
- package/dist/shield/ProtectedPaths.js.map +1 -0
- package/dist/shield/ShieldProtocol.d.ts +50 -0
- package/dist/shield/ShieldProtocol.js +103 -0
- package/dist/shield/ShieldProtocol.js.map +1 -0
- package/dist/skills/ExternalSkills.d.ts +3 -0
- package/dist/skills/ExternalSkills.js +27 -0
- package/dist/skills/ExternalSkills.js.map +1 -0
- package/dist/skills/GrillingSessionSkill.d.ts +65 -0
- package/dist/skills/GrillingSessionSkill.js +113 -0
- package/dist/skills/GrillingSessionSkill.js.map +1 -0
- package/dist/skills/GrillingTemplates.d.ts +7 -0
- package/dist/skills/GrillingTemplates.js +38 -0
- package/dist/skills/GrillingTemplates.js.map +1 -0
- package/dist/skills/RoleSkills.d.ts +20 -0
- package/dist/skills/RoleSkills.js +154 -0
- package/dist/skills/RoleSkills.js.map +1 -0
- package/dist/skills/SkillCatalog.d.ts +13 -0
- package/dist/skills/SkillCatalog.js +184 -0
- package/dist/skills/SkillCatalog.js.map +1 -0
- package/dist/skills/SkillDiscovery.d.ts +84 -0
- package/dist/skills/SkillDiscovery.js +402 -0
- package/dist/skills/SkillDiscovery.js.map +1 -0
- package/dist/skills/SkillDoctor.d.ts +37 -0
- package/dist/skills/SkillDoctor.js +267 -0
- package/dist/skills/SkillDoctor.js.map +1 -0
- package/dist/skills/SkillExecutor.d.ts +38 -0
- package/dist/skills/SkillExecutor.js +237 -0
- package/dist/skills/SkillExecutor.js.map +1 -0
- package/dist/skills/SkillFrontmatter.d.ts +28 -0
- package/dist/skills/SkillFrontmatter.js +152 -0
- package/dist/skills/SkillFrontmatter.js.map +1 -0
- package/dist/skills/SkillInstaller.d.ts +40 -0
- package/dist/skills/SkillInstaller.js +117 -0
- package/dist/skills/SkillInstaller.js.map +1 -0
- package/dist/skills/SkillMdStandard.d.ts +33 -0
- package/dist/skills/SkillMdStandard.js +88 -0
- package/dist/skills/SkillMdStandard.js.map +1 -0
- package/dist/skills/SkillRadar.d.ts +83 -0
- package/dist/skills/SkillRadar.js +404 -0
- package/dist/skills/SkillRadar.js.map +1 -0
- package/dist/skills/SkillRegistry.d.ts +112 -0
- package/dist/skills/SkillRegistry.js +161 -0
- package/dist/skills/SkillRegistry.js.map +1 -0
- package/dist/skills/SkillRepository.d.ts +71 -0
- package/dist/skills/SkillRepository.js +435 -0
- package/dist/skills/SkillRepository.js.map +1 -0
- package/dist/skills/TriggerEngine.d.ts +43 -0
- package/dist/skills/TriggerEngine.js +142 -0
- package/dist/skills/TriggerEngine.js.map +1 -0
- package/dist/skills/coreSkills.d.ts +6 -0
- package/dist/skills/coreSkills.js +41 -0
- package/dist/skills/coreSkills.js.map +1 -0
- package/dist/skills/index.d.ts +10 -0
- package/dist/skills/index.js +12 -0
- package/dist/skills/index.js.map +1 -0
- package/dist/skills/interop/GStackInterop.d.ts +15 -0
- package/dist/skills/interop/GStackInterop.js +34 -0
- package/dist/skills/interop/GStackInterop.js.map +1 -0
- package/dist/skills/interop/OMCInterop.d.ts +15 -0
- package/dist/skills/interop/OMCInterop.js +34 -0
- package/dist/skills/interop/OMCInterop.js.map +1 -0
- package/dist/skills/routing/SkillGate.d.ts +12 -0
- package/dist/skills/routing/SkillGate.js +117 -0
- package/dist/skills/routing/SkillGate.js.map +1 -0
- package/dist/skills/routing/SkillPlanner.d.ts +8 -0
- package/dist/skills/routing/SkillPlanner.js +179 -0
- package/dist/skills/routing/SkillPlanner.js.map +1 -0
- package/dist/skills/routing/SkillPolicy.d.ts +6 -0
- package/dist/skills/routing/SkillPolicy.js +336 -0
- package/dist/skills/routing/SkillPolicy.js.map +1 -0
- package/dist/skills/routing/SkillRoutingTypes.d.ts +89 -0
- package/dist/skills/routing/SkillRoutingTypes.js +2 -0
- package/dist/skills/routing/SkillRoutingTypes.js.map +1 -0
- package/dist/skills/routing/TaskIntentClassifier.d.ts +6 -0
- package/dist/skills/routing/TaskIntentClassifier.js +79 -0
- package/dist/skills/routing/TaskIntentClassifier.js.map +1 -0
- package/dist/skills/routing/index.d.ts +5 -0
- package/dist/skills/routing/index.js +6 -0
- package/dist/skills/routing/index.js.map +1 -0
- package/dist/tasks/IssueTriageFSM.d.ts +26 -0
- package/dist/tasks/IssueTriageFSM.js +107 -0
- package/dist/tasks/IssueTriageFSM.js.map +1 -0
- package/dist/tasks/TaskEngine.d.ts +97 -0
- package/dist/tasks/TaskEngine.js +289 -0
- package/dist/tasks/TaskEngine.js.map +1 -0
- package/dist/testing/DiffTestSelector.d.ts +22 -0
- package/dist/testing/DiffTestSelector.js +114 -0
- package/dist/testing/DiffTestSelector.js.map +1 -0
- package/dist/testing/index.d.ts +1 -0
- package/dist/testing/index.js +3 -0
- package/dist/testing/index.js.map +1 -0
- package/dist/tools/CommandOutputCompressor.d.ts +28 -0
- package/dist/tools/CommandOutputCompressor.js +242 -0
- package/dist/tools/CommandOutputCompressor.js.map +1 -0
- package/dist/tools/CommandRunLedger.d.ts +77 -0
- package/dist/tools/CommandRunLedger.js +111 -0
- package/dist/tools/CommandRunLedger.js.map +1 -0
- package/dist/tools/RtkRuntime.d.ts +9 -0
- package/dist/tools/RtkRuntime.js +43 -0
- package/dist/tools/RtkRuntime.js.map +1 -0
- package/dist/tools/SafeCommandRunner.d.ts +16 -0
- package/dist/tools/SafeCommandRunner.js +83 -0
- package/dist/tools/SafeCommandRunner.js.map +1 -0
- package/dist/tools/ToolCapabilityRegistry.d.ts +51 -0
- package/dist/tools/ToolCapabilityRegistry.js +295 -0
- package/dist/tools/ToolCapabilityRegistry.js.map +1 -0
- package/dist/tools/ToolEvidenceGate.d.ts +39 -0
- package/dist/tools/ToolEvidenceGate.js +117 -0
- package/dist/tools/ToolEvidenceGate.js.map +1 -0
- package/dist/tools/ToolEvidenceStore.d.ts +58 -0
- package/dist/tools/ToolEvidenceStore.js +129 -0
- package/dist/tools/ToolEvidenceStore.js.map +1 -0
- package/dist/tools/ToolOrchestrator.d.ts +67 -0
- package/dist/tools/ToolOrchestrator.js +252 -0
- package/dist/tools/ToolOrchestrator.js.map +1 -0
- package/dist/tools/ToolPolicy.d.ts +33 -0
- package/dist/tools/ToolPolicy.js +172 -0
- package/dist/tools/ToolPolicy.js.map +1 -0
- package/dist/tools/index.d.ts +7 -0
- package/dist/tools/index.js +8 -0
- package/dist/tools/index.js.map +1 -0
- package/dist/tui/TuiDashboard.d.ts +3 -0
- package/dist/tui/TuiDashboard.js +120 -0
- package/dist/tui/TuiDashboard.js.map +1 -0
- package/dist/version.d.ts +3 -0
- package/dist/version.js +15 -0
- package/dist/version.js.map +1 -0
- package/dist/workflow/AdaptiveWorkflowRouter.d.ts +38 -0
- package/dist/workflow/AdaptiveWorkflowRouter.js +214 -0
- package/dist/workflow/AdaptiveWorkflowRouter.js.map +1 -0
- package/dist/workflow/CommitDiscipline.d.ts +68 -0
- package/dist/workflow/CommitDiscipline.js +328 -0
- package/dist/workflow/CommitDiscipline.js.map +1 -0
- package/dist/workflow/ContextGovernance.d.ts +51 -0
- package/dist/workflow/ContextGovernance.js +233 -0
- package/dist/workflow/ContextGovernance.js.map +1 -0
- package/dist/workflow/CrossRepoOrchestrator.d.ts +92 -0
- package/dist/workflow/CrossRepoOrchestrator.js +408 -0
- package/dist/workflow/CrossRepoOrchestrator.js.map +1 -0
- package/dist/workflow/DiagnosticLoop.d.ts +40 -0
- package/dist/workflow/DiagnosticLoop.js +105 -0
- package/dist/workflow/DiagnosticLoop.js.map +1 -0
- package/dist/workflow/EngineeringStandards.d.ts +212 -0
- package/dist/workflow/EngineeringStandards.js +1113 -0
- package/dist/workflow/EngineeringStandards.js.map +1 -0
- package/dist/workflow/EvidenceStore.d.ts +20 -0
- package/dist/workflow/EvidenceStore.js +48 -0
- package/dist/workflow/EvidenceStore.js.map +1 -0
- package/dist/workflow/EvolutionShadowPromoter.d.ts +46 -0
- package/dist/workflow/EvolutionShadowPromoter.js +73 -0
- package/dist/workflow/EvolutionShadowPromoter.js.map +1 -0
- package/dist/workflow/GateCatalog.d.ts +63 -0
- package/dist/workflow/GateCatalog.js +268 -0
- package/dist/workflow/GateCatalog.js.map +1 -0
- package/dist/workflow/GovernanceLock.d.ts +35 -0
- package/dist/workflow/GovernanceLock.js +58 -0
- package/dist/workflow/GovernanceLock.js.map +1 -0
- package/dist/workflow/GovernanceRoi.d.ts +52 -0
- package/dist/workflow/GovernanceRoi.js +204 -0
- package/dist/workflow/GovernanceRoi.js.map +1 -0
- package/dist/workflow/GovernanceTemplatePacks.d.ts +24 -0
- package/dist/workflow/GovernanceTemplatePacks.js +2134 -0
- package/dist/workflow/GovernanceTemplatePacks.js.map +1 -0
- package/dist/workflow/GovernanceTemplates.d.ts +19 -0
- package/dist/workflow/GovernanceTemplates.js +1291 -0
- package/dist/workflow/GovernanceTemplates.js.map +1 -0
- package/dist/workflow/McpGovernance.d.ts +63 -0
- package/dist/workflow/McpGovernance.js +198 -0
- package/dist/workflow/McpGovernance.js.map +1 -0
- package/dist/workflow/OutOfScopeStore.d.ts +37 -0
- package/dist/workflow/OutOfScopeStore.js +164 -0
- package/dist/workflow/OutOfScopeStore.js.map +1 -0
- package/dist/workflow/PhaseMarkerTracker.d.ts +63 -0
- package/dist/workflow/PhaseMarkerTracker.js +291 -0
- package/dist/workflow/PhaseMarkerTracker.js.map +1 -0
- package/dist/workflow/ResourceGovernance.d.ts +120 -0
- package/dist/workflow/ResourceGovernance.js +531 -0
- package/dist/workflow/ResourceGovernance.js.map +1 -0
- package/dist/workflow/ReviewAnalyzer.d.ts +80 -0
- package/dist/workflow/ReviewAnalyzer.js +438 -0
- package/dist/workflow/ReviewAnalyzer.js.map +1 -0
- package/dist/workflow/ReviewStore.d.ts +36 -0
- package/dist/workflow/ReviewStore.js +42 -0
- package/dist/workflow/ReviewStore.js.map +1 -0
- package/dist/workflow/SecurityAudit.d.ts +27 -0
- package/dist/workflow/SecurityAudit.js +294 -0
- package/dist/workflow/SecurityAudit.js.map +1 -0
- package/dist/workflow/SessionCoordinator.d.ts +103 -0
- package/dist/workflow/SessionCoordinator.js +401 -0
- package/dist/workflow/SessionCoordinator.js.map +1 -0
- package/dist/workflow/SessionPreamble.d.ts +19 -0
- package/dist/workflow/SessionPreamble.js +130 -0
- package/dist/workflow/SessionPreamble.js.map +1 -0
- package/dist/workflow/SessionStateTracker.d.ts +74 -0
- package/dist/workflow/SessionStateTracker.js +270 -0
- package/dist/workflow/SessionStateTracker.js.map +1 -0
- package/dist/workflow/ShipPipeline.d.ts +30 -0
- package/dist/workflow/ShipPipeline.js +366 -0
- package/dist/workflow/ShipPipeline.js.map +1 -0
- package/dist/workflow/TaskArtifactScaffolder.d.ts +69 -0
- package/dist/workflow/TaskArtifactScaffolder.js +333 -0
- package/dist/workflow/TaskArtifactScaffolder.js.map +1 -0
- package/dist/workflow/TaskDependencyGraph.d.ts +73 -0
- package/dist/workflow/TaskDependencyGraph.js +245 -0
- package/dist/workflow/TaskDependencyGraph.js.map +1 -0
- package/dist/workflow/TaskLevelDetector.d.ts +41 -0
- package/dist/workflow/TaskLevelDetector.js +219 -0
- package/dist/workflow/TaskLevelDetector.js.map +1 -0
- package/dist/workflow/TaskMetricsStore.d.ts +49 -0
- package/dist/workflow/TaskMetricsStore.js +149 -0
- package/dist/workflow/TaskMetricsStore.js.map +1 -0
- package/dist/workflow/TaskScoreEngine.d.ts +42 -0
- package/dist/workflow/TaskScoreEngine.js +181 -0
- package/dist/workflow/TaskScoreEngine.js.map +1 -0
- package/dist/workflow/TddLoop.d.ts +49 -0
- package/dist/workflow/TddLoop.js +78 -0
- package/dist/workflow/TddLoop.js.map +1 -0
- package/dist/workflow/UpgradeManager.d.ts +178 -0
- package/dist/workflow/UpgradeManager.js +665 -0
- package/dist/workflow/UpgradeManager.js.map +1 -0
- package/dist/workflow/VerificationCommands.d.ts +36 -0
- package/dist/workflow/VerificationCommands.js +123 -0
- package/dist/workflow/VerificationCommands.js.map +1 -0
- package/dist/workflow/VerificationProfile.d.ts +67 -0
- package/dist/workflow/VerificationProfile.js +241 -0
- package/dist/workflow/VerificationProfile.js.map +1 -0
- package/dist/workflow/VerificationSchema.d.ts +46 -0
- package/dist/workflow/VerificationSchema.js +97 -0
- package/dist/workflow/VerificationSchema.js.map +1 -0
- package/dist/workflow/WorkflowArtifactWriter.d.ts +113 -0
- package/dist/workflow/WorkflowArtifactWriter.js +242 -0
- package/dist/workflow/WorkflowArtifactWriter.js.map +1 -0
- package/dist/workflow/WorkflowEngine.d.ts +83 -0
- package/dist/workflow/WorkflowEngine.js +183 -0
- package/dist/workflow/WorkflowEngine.js.map +1 -0
- package/dist/workflow/WorkflowGuidance.d.ts +30 -0
- package/dist/workflow/WorkflowGuidance.js +204 -0
- package/dist/workflow/WorkflowGuidance.js.map +1 -0
- package/dist/workflow/WorkflowOpenTasks.d.ts +16 -0
- package/dist/workflow/WorkflowOpenTasks.js +37 -0
- package/dist/workflow/WorkflowOpenTasks.js.map +1 -0
- package/dist/workflow/WorkflowOrchestrator.d.ts +59 -0
- package/dist/workflow/WorkflowOrchestrator.js +326 -0
- package/dist/workflow/WorkflowOrchestrator.js.map +1 -0
- package/dist/workflow/WorkflowTemplates.d.ts +38 -0
- package/dist/workflow/WorkflowTemplates.js +371 -0
- package/dist/workflow/WorkflowTemplates.js.map +1 -0
- package/dist/workflow/WorkspaceLifecycle.d.ts +71 -0
- package/dist/workflow/WorkspaceLifecycle.js +401 -0
- package/dist/workflow/WorkspaceLifecycle.js.map +1 -0
- package/dist/workflow/WorkspacePolicy.d.ts +46 -0
- package/dist/workflow/WorkspacePolicy.js +141 -0
- package/dist/workflow/WorkspacePolicy.js.map +1 -0
- package/dist/workflow/WorkspaceSafety.d.ts +9 -0
- package/dist/workflow/WorkspaceSafety.js +49 -0
- package/dist/workflow/WorkspaceSafety.js.map +1 -0
- package/dist/workflow/WorkspaceTopology.d.ts +58 -0
- package/dist/workflow/WorkspaceTopology.js +176 -0
- package/dist/workflow/WorkspaceTopology.js.map +1 -0
- package/dist/workflow/autofix/AutoFixEngine.d.ts +37 -0
- package/dist/workflow/autofix/AutoFixEngine.js +169 -0
- package/dist/workflow/autofix/AutoFixEngine.js.map +1 -0
- package/dist/workflow/autonomous/AutonomousDevLoop.d.ts +88 -0
- package/dist/workflow/autonomous/AutonomousDevLoop.js +381 -0
- package/dist/workflow/autonomous/AutonomousDevLoop.js.map +1 -0
- package/dist/workflow/autonomous/BackgroundHunter.d.ts +74 -0
- package/dist/workflow/autonomous/BackgroundHunter.js +220 -0
- package/dist/workflow/autonomous/BackgroundHunter.js.map +1 -0
- package/dist/workflow/autonomous/WorklogManager.d.ts +50 -0
- package/dist/workflow/autonomous/WorklogManager.js +264 -0
- package/dist/workflow/autonomous/WorklogManager.js.map +1 -0
- package/dist/workflow/autonomous/index.d.ts +3 -0
- package/dist/workflow/autonomous/index.js +5 -0
- package/dist/workflow/autonomous/index.js.map +1 -0
- package/dist/workflow/cognitive/AmbiguityScorer.d.ts +17 -0
- package/dist/workflow/cognitive/AmbiguityScorer.js +107 -0
- package/dist/workflow/cognitive/AmbiguityScorer.js.map +1 -0
- package/dist/workflow/cognitive/ConsensusPlanner.d.ts +26 -0
- package/dist/workflow/cognitive/ConsensusPlanner.js +141 -0
- package/dist/workflow/cognitive/ConsensusPlanner.js.map +1 -0
- package/dist/workflow/cognitive/SocraticQuestioner.d.ts +33 -0
- package/dist/workflow/cognitive/SocraticQuestioner.js +276 -0
- package/dist/workflow/cognitive/SocraticQuestioner.js.map +1 -0
- package/dist/workflow/evolution/LessonExtractor.d.ts +90 -0
- package/dist/workflow/evolution/LessonExtractor.js +317 -0
- package/dist/workflow/evolution/LessonExtractor.js.map +1 -0
- package/dist/workflow/evolution/SelfImproveEngine.d.ts +156 -0
- package/dist/workflow/evolution/SelfImproveEngine.js +361 -0
- package/dist/workflow/evolution/SelfImproveEngine.js.map +1 -0
- package/dist/workflow/execution/RalphEngine.d.ts +54 -0
- package/dist/workflow/execution/RalphEngine.js +145 -0
- package/dist/workflow/execution/RalphEngine.js.map +1 -0
- package/dist/workflow/execution/UltraworkEngine.d.ts +43 -0
- package/dist/workflow/execution/UltraworkEngine.js +135 -0
- package/dist/workflow/execution/UltraworkEngine.js.map +1 -0
- package/dist/workflow/gates/EnhancedGates.d.ts +74 -0
- package/dist/workflow/gates/EnhancedGates.js +653 -0
- package/dist/workflow/gates/EnhancedGates.js.map +1 -0
- package/dist/workflow/gates/GateSystem.d.ts +180 -0
- package/dist/workflow/gates/GateSystem.js +1279 -0
- package/dist/workflow/gates/GateSystem.js.map +1 -0
- package/dist/workflow/gates/MetaGovernanceGates.d.ts +70 -0
- package/dist/workflow/gates/MetaGovernanceGates.js +617 -0
- package/dist/workflow/gates/MetaGovernanceGates.js.map +1 -0
- package/dist/workflow/gates/VisualGate.d.ts +41 -0
- package/dist/workflow/gates/VisualGate.js +174 -0
- package/dist/workflow/gates/VisualGate.js.map +1 -0
- package/dist/workflow/index.d.ts +45 -0
- package/dist/workflow/index.js +47 -0
- package/dist/workflow/index.js.map +1 -0
- package/dist/workflow/qa/E2ETestRunner.d.ts +102 -0
- package/dist/workflow/qa/E2ETestRunner.js +227 -0
- package/dist/workflow/qa/E2ETestRunner.js.map +1 -0
- package/dist/workflow/quality/HonestDelivery.d.ts +19 -0
- package/dist/workflow/quality/HonestDelivery.js +77 -0
- package/dist/workflow/quality/HonestDelivery.js.map +1 -0
- package/dist/workflow/quality/KarpathyEvaluator.d.ts +18 -0
- package/dist/workflow/quality/KarpathyEvaluator.js +76 -0
- package/dist/workflow/quality/KarpathyEvaluator.js.map +1 -0
- package/dist/workflow/types.d.ts +151 -0
- package/dist/workflow/types.js +4 -0
- package/dist/workflow/types.js.map +1 -0
- package/dist/workflows/DAGBuilder.d.ts +52 -0
- package/dist/workflows/DAGBuilder.js +169 -0
- package/dist/workflows/DAGBuilder.js.map +1 -0
- package/dist/workflows/GateParser.d.ts +55 -0
- package/dist/workflows/GateParser.js +73 -0
- package/dist/workflows/GateParser.js.map +1 -0
- package/dist/workflows/WorkflowExecutor.d.ts +56 -0
- package/dist/workflows/WorkflowExecutor.js +143 -0
- package/dist/workflows/WorkflowExecutor.js.map +1 -0
- package/dist/workflows/WorkflowOrchestrator.d.ts +81 -0
- package/dist/workflows/WorkflowOrchestrator.js +337 -0
- package/dist/workflows/WorkflowOrchestrator.js.map +1 -0
- package/dist/workflows/index.d.ts +2 -0
- package/dist/workflows/index.js +5 -0
- package/dist/workflows/index.js.map +1 -0
- package/dist/workflows/presets.d.ts +34 -0
- package/dist/workflows/presets.js +224 -0
- package/dist/workflows/presets.js.map +1 -0
- package/docs/README.md +105 -0
- package/docs/guides/DEVELOPMENT_WORKFLOW.md +99 -0
- package/docs/guides/GETTING_STARTED.md +93 -0
- package/docs/guides/MEDICAL_AGENT_OPERATING_GUIDE.md +61 -0
- package/docs/guides/MEDICAL_RESEARCH_DELIVERY.md +217 -0
- package/docs/guides/MIGRATION.md +119 -0
- package/docs/reference/cli.md +2921 -0
- package/docs/start/README.md +79 -0
- package/docs/start/agent-governance-demo.md +107 -0
- package/docs/start/artifact-lifecycle.md +326 -0
- package/docs/start/quickstart.md +191 -0
- package/docs/start/workflow-upgrade.md +198 -0
- package/docs/workflow/GATES_AND_SCORE.md +89 -0
- package/docs/workflow/PROMPT_OPTIMIZATION.md +44 -0
- package/docs/workflow/README.md +123 -0
- package/docs/workflow/node-library.md +52 -0
- package/docs/workflow/templates/api-contract.md +29 -0
- package/docs/workflow/templates/architecture-review.md +23 -0
- package/docs/workflow/templates/db-change-plan.md +20 -0
- package/docs/workflow/templates/docs-impact.md +17 -0
- package/docs/workflow/templates/e2e-plan.md +20 -0
- package/docs/workflow/templates/explore.md +16 -0
- package/docs/workflow/templates/github-actions-scale-preflight.yml +32 -0
- package/docs/workflow/templates/mini-prd.md +16 -0
- package/docs/workflow/templates/plan.md +37 -0
- package/docs/workflow/templates/pre-push-scale-preflight.sh +8 -0
- package/docs/workflow/templates/product-smoke.md +61 -0
- package/docs/workflow/templates/reality-check.md +28 -0
- package/docs/workflow/templates/resource-cleanup.md +17 -0
- package/docs/workflow/templates/resource-impact.md +25 -0
- package/docs/workflow/templates/review.md +12 -0
- package/docs/workflow/templates/runtime.md +23 -0
- package/docs/workflow/templates/security-review.md +26 -0
- package/docs/workflow/templates/skill-evidence.md +33 -0
- package/docs/workflow/templates/skill-plan.md +39 -0
- package/docs/workflow/templates/spec.md +17 -0
- package/docs/workflow/templates/standards-impact.md +28 -0
- package/docs/workflow/templates/summary.md +16 -0
- package/docs/workflow/templates/tasks.md +8 -0
- package/docs/workflow/templates/ui-spec.md +29 -0
- package/docs/workflow/templates/verification.md +20 -0
- package/docs/workflow/templates/visual-review.md +20 -0
- package/docs/zh/quickstart.md +108 -0
- package/examples/demo-projects/agent-governance-demo/CONTEXT.md +14 -0
- package/examples/demo-projects/agent-governance-demo/README.md +48 -0
- package/examples/demo-projects/agent-governance-demo/docs/CONTEXT-MAP.md +14 -0
- package/examples/demo-projects/agent-governance-demo/package.json +22 -0
- package/examples/demo-projects/agent-governance-demo/src/oauth-state.ts +39 -0
- package/examples/demo-projects/agent-governance-demo/tests/oauth-state.test.ts +52 -0
- package/mcp-configs/_INDEX.md +55 -0
- package/mcp-configs/context7/config.json +9 -0
- package/mcp-configs/fetch/config.json +9 -0
- package/mcp-configs/filesystem/config.json +9 -0
- package/mcp-configs/github/config.json +11 -0
- package/mcp-configs/memory/config.json +9 -0
- package/mcp-configs/neon/config.json +11 -0
- package/mcp-configs/playwright/config.json +9 -0
- package/mcp-configs/postgres/config.json +11 -0
- package/mcp-configs/puppeteer/config.json +9 -0
- package/mcp-configs/sequential-thinking/config.json +9 -0
- package/package.json +113 -0
- package/scripts/workflow/lib/gbrain-runtime.mjs +185 -0
- package/scripts/workflow/lib/report-output.mjs +107 -0
- package/scripts/workflow/medscale-release-smoke.mjs +338 -0
- package/scripts/workflow/provider-rehearsal.mjs +597 -0
- package/scripts/workflow/setup-smoke.mjs +433 -0
- package/target-research-platform/bridge_runner.py +310 -0
- package/target-research-platform/config.yaml +148 -0
- package/target-research-platform/data/immune_infiltration/ACC.csv +201 -0
- package/target-research-platform/data/immune_infiltration/BLCA.csv +201 -0
- package/target-research-platform/data/immune_infiltration/BRCA.csv +201 -0
- package/target-research-platform/data/immune_infiltration/CESC.csv +201 -0
- package/target-research-platform/data/immune_infiltration/CHOL.csv +201 -0
- package/target-research-platform/data/immune_infiltration/COAD.csv +201 -0
- package/target-research-platform/data/immune_infiltration/DLBC.csv +201 -0
- package/target-research-platform/data/immune_infiltration/ESCA.csv +201 -0
- package/target-research-platform/data/immune_infiltration/GBM.csv +201 -0
- package/target-research-platform/data/immune_infiltration/HNSC.csv +201 -0
- package/target-research-platform/data/immune_infiltration/KICH.csv +201 -0
- package/target-research-platform/data/immune_infiltration/KIRC.csv +201 -0
- package/target-research-platform/data/immune_infiltration/KIRP.csv +201 -0
- package/target-research-platform/data/immune_infiltration/LAML.csv +201 -0
- package/target-research-platform/data/immune_infiltration/LGG.csv +201 -0
- package/target-research-platform/data/immune_infiltration/LIHC.csv +201 -0
- package/target-research-platform/data/immune_infiltration/LUAD.csv +201 -0
- package/target-research-platform/data/immune_infiltration/LUSC.csv +201 -0
- package/target-research-platform/data/immune_infiltration/MESO.csv +201 -0
- package/target-research-platform/data/immune_infiltration/OV.csv +201 -0
- package/target-research-platform/data/immune_infiltration/PAAD.csv +201 -0
- package/target-research-platform/data/immune_infiltration/PCPG.csv +201 -0
- package/target-research-platform/data/immune_infiltration/PRAD.csv +201 -0
- package/target-research-platform/data/immune_infiltration/READ.csv +201 -0
- package/target-research-platform/data/immune_infiltration/SARC.csv +201 -0
- package/target-research-platform/data/immune_infiltration/SKCM.csv +201 -0
- package/target-research-platform/data/immune_infiltration/STAD.csv +201 -0
- package/target-research-platform/data/immune_infiltration/TGCT.csv +201 -0
- package/target-research-platform/data/immune_infiltration/THCA.csv +201 -0
- package/target-research-platform/data/immune_infiltration/THYM.csv +201 -0
- package/target-research-platform/data/immune_infiltration/UCEC.csv +201 -0
- package/target-research-platform/data/immune_infiltration/UCS.csv +201 -0
- package/target-research-platform/data/immune_infiltration/UVM.csv +201 -0
- package/target-research-platform/docs/JSON_SCHEMA.md +352 -0
- package/target-research-platform/docs/PROGRESS_2026-06-09.md +140 -0
- package/target-research-platform/main.py +755 -0
- package/target-research-platform/pyproject.toml +54 -0
- package/target-research-platform/requirements.txt +9 -0
- package/target-research-platform/run_dashboard.py +5 -0
- package/target-research-platform/run_real_medical_workflow.py +28 -0
- package/target-research-platform/scripts/demo_report.py +481 -0
- package/target-research-platform/scripts/generate_evidence_package.py +75 -0
- package/target-research-platform/scripts/prepare_immune_data.py +386 -0
- package/target-research-platform/src/__init__.py +4 -0
- package/target-research-platform/src/analysis/__init__.py +3 -0
- package/target-research-platform/src/analysis/stage1_expression/__init__.py +12 -0
- package/target-research-platform/src/analysis/stage1_expression/immune_correlation.py +366 -0
- package/target-research-platform/src/analysis/stage1_expression/pipeline.py +579 -0
- package/target-research-platform/src/analysis/stage1_expression/survival_analysis.py +382 -0
- package/target-research-platform/src/analysis/stage2_screening/__init__.py +12 -0
- package/target-research-platform/src/analysis/stage2_screening/differential_expression.py +451 -0
- package/target-research-platform/src/analysis/stage2_screening/druggability_score.py +477 -0
- package/target-research-platform/src/analysis/stage2_screening/pipeline.py +822 -0
- package/target-research-platform/src/analysis/stage3_deep_research/__init__.py +12 -0
- package/target-research-platform/src/analysis/stage3_deep_research/competitive_landscape.py +479 -0
- package/target-research-platform/src/analysis/stage3_deep_research/pipeline.py +763 -0
- package/target-research-platform/src/analysis/stage3_deep_research/target_function.py +290 -0
- package/target-research-platform/src/analysis/stage4_business/__init__.py +12 -0
- package/target-research-platform/src/analysis/stage4_business/business_plan.py +816 -0
- package/target-research-platform/src/analysis/stage4_business/milestone_planner.py +844 -0
- package/target-research-platform/src/analysis/stage4_business/pipeline.py +284 -0
- package/target-research-platform/src/api_clients/__init__.py +29 -0
- package/target-research-platform/src/api_clients/aminer_client.py +163 -0
- package/target-research-platform/src/api_clients/base_client.py +186 -0
- package/target-research-platform/src/api_clients/clinicaltrials_client.py +411 -0
- package/target-research-platform/src/api_clients/geo_client.py +1420 -0
- package/target-research-platform/src/api_clients/gtex_client.py +209 -0
- package/target-research-platform/src/api_clients/hpa_client.py +170 -0
- package/target-research-platform/src/api_clients/immune_data_manager.py +247 -0
- package/target-research-platform/src/api_clients/openalex_client.py +86 -0
- package/target-research-platform/src/api_clients/opentargets_client.py +558 -0
- package/target-research-platform/src/api_clients/pubmed_client.py +361 -0
- package/target-research-platform/src/api_clients/tcga_client.py +712 -0
- package/target-research-platform/src/api_clients/timer_client.py +169 -0
- package/target-research-platform/src/dashboard/app.py +2283 -0
- package/target-research-platform/src/dashboard/deliverables.py +710 -0
- package/target-research-platform/src/dashboard/static/artifactPreview.js +96 -0
- package/target-research-platform/src/dashboard/static/index.html +1292 -0
- package/target-research-platform/src/dashboard/status_tracker.py +237 -0
- package/target-research-platform/src/output/__init__.py +42 -0
- package/target-research-platform/src/output/agent_llm_provider.py +171 -0
- package/target-research-platform/src/output/chart_generator.py +550 -0
- package/target-research-platform/src/output/data_exporter.py +215 -0
- package/target-research-platform/src/output/delivery_packager.py +791 -0
- package/target-research-platform/src/output/evidence_package.py +230 -0
- package/target-research-platform/src/output/journal_templates.py +193 -0
- package/target-research-platform/src/output/literature_enricher.py +395 -0
- package/target-research-platform/src/output/literature_reviewer.py +420 -0
- package/target-research-platform/src/output/manuscript_fact_checker.py +279 -0
- package/target-research-platform/src/output/manuscript_generator.py +1189 -0
- package/target-research-platform/src/output/manuscript_quality.py +401 -0
- package/target-research-platform/src/output/medical_skills_bridge.py +140 -0
- package/target-research-platform/src/output/report_generator.py +542 -0
- package/target-research-platform/src/output/usage_envelope.py +193 -0
- package/target-research-platform/src/utils/__init__.py +1 -0
- package/target-research-platform/src/utils/config.py +125 -0
- package/target-research-platform/src/utils/logger.py +71 -0
- package/target-research-platform/src/validators/__init__.py +13 -0
- package/target-research-platform/src/validators/cross_validator.py +394 -0
- package/target-research-platform/src/validators/data_provenance.py +298 -0
|
@@ -0,0 +1,1420 @@
|
|
|
1
|
+
"""
|
|
2
|
+
GEO (Gene Expression Omnibus) API客户端
|
|
3
|
+
用于获取基因表达数据集
|
|
4
|
+
API文档:https://www.ncbi.nlm.nih.gov/geo/info/geo_acqu.html
|
|
5
|
+
"""
|
|
6
|
+
import gzip
|
|
7
|
+
import re
|
|
8
|
+
import tempfile
|
|
9
|
+
from pathlib import Path
|
|
10
|
+
from typing import Optional
|
|
11
|
+
from .base_client import BaseAPIClient, APIResponse
|
|
12
|
+
|
|
13
|
+
|
|
14
|
+
class GEOClient(BaseAPIClient):
|
|
15
|
+
"""GEO API客户端"""
|
|
16
|
+
|
|
17
|
+
@property
|
|
18
|
+
def source_name(self) -> str:
|
|
19
|
+
return "GEO"
|
|
20
|
+
|
|
21
|
+
@property
|
|
22
|
+
def base_url(self) -> str:
|
|
23
|
+
return "https://eutils.ncbi.nlm.nih.gov/entrez/eutils"
|
|
24
|
+
|
|
25
|
+
def health_check(self) -> bool:
|
|
26
|
+
"""检查GEO API可用性"""
|
|
27
|
+
response = self._make_request(
|
|
28
|
+
"GET",
|
|
29
|
+
"/einfo.fcgi",
|
|
30
|
+
params={"db": "gds", "retmode": "json"},
|
|
31
|
+
use_cache=False
|
|
32
|
+
)
|
|
33
|
+
return response.success
|
|
34
|
+
|
|
35
|
+
def search_datasets(
|
|
36
|
+
self,
|
|
37
|
+
disease: str,
|
|
38
|
+
organism: str = "Homo sapiens",
|
|
39
|
+
dataset_type: str = "Expression profiling by array",
|
|
40
|
+
max_results: int = 20
|
|
41
|
+
) -> APIResponse:
|
|
42
|
+
"""
|
|
43
|
+
搜索GEO数据集
|
|
44
|
+
|
|
45
|
+
Args:
|
|
46
|
+
disease: 疾病名称
|
|
47
|
+
organism: 物种
|
|
48
|
+
dataset_type: 数据集类型
|
|
49
|
+
max_results: 最大返回数量
|
|
50
|
+
|
|
51
|
+
Returns:
|
|
52
|
+
包含数据集列表的APIResponse
|
|
53
|
+
"""
|
|
54
|
+
# 构建搜索查询
|
|
55
|
+
query = f"{disease} AND {organism}[orgn] AND {dataset_type}[gdstype] AND gds[entry_type]"
|
|
56
|
+
|
|
57
|
+
params = {
|
|
58
|
+
"db": "gds",
|
|
59
|
+
"term": query,
|
|
60
|
+
"retmax": max_results,
|
|
61
|
+
"retmode": "json"
|
|
62
|
+
}
|
|
63
|
+
|
|
64
|
+
response = self._make_request("GET", "/esearch.fcgi", params=params)
|
|
65
|
+
|
|
66
|
+
if not response.success:
|
|
67
|
+
return response
|
|
68
|
+
|
|
69
|
+
return self._parse_search_response(response, disease, query)
|
|
70
|
+
|
|
71
|
+
def _parse_search_response(
|
|
72
|
+
self,
|
|
73
|
+
response: APIResponse,
|
|
74
|
+
disease: str,
|
|
75
|
+
query: str
|
|
76
|
+
) -> APIResponse:
|
|
77
|
+
"""解析搜索结果"""
|
|
78
|
+
try:
|
|
79
|
+
raw_data = response.data
|
|
80
|
+
if not raw_data or 'esearchresult' not in raw_data:
|
|
81
|
+
return response
|
|
82
|
+
|
|
83
|
+
result = raw_data['esearchresult']
|
|
84
|
+
ids = result.get('idlist', [])
|
|
85
|
+
count = int(result.get('count', 0))
|
|
86
|
+
|
|
87
|
+
return APIResponse(
|
|
88
|
+
success=True,
|
|
89
|
+
data={
|
|
90
|
+
"disease": disease,
|
|
91
|
+
"query": query,
|
|
92
|
+
"total_count": count,
|
|
93
|
+
"returned_count": len(ids),
|
|
94
|
+
"dataset_ids": ids
|
|
95
|
+
},
|
|
96
|
+
source=self.source_name,
|
|
97
|
+
endpoint="/esearch.fcgi",
|
|
98
|
+
params={"disease": disease},
|
|
99
|
+
timestamp=response.timestamp
|
|
100
|
+
)
|
|
101
|
+
|
|
102
|
+
except (KeyError, ValueError, TypeError) as e:
|
|
103
|
+
return APIResponse(
|
|
104
|
+
success=False,
|
|
105
|
+
data=None,
|
|
106
|
+
source=self.source_name,
|
|
107
|
+
endpoint="/esearch.fcgi",
|
|
108
|
+
params={"disease": disease},
|
|
109
|
+
timestamp=response.timestamp,
|
|
110
|
+
error=f"搜索结果解析错误: {str(e)}"
|
|
111
|
+
)
|
|
112
|
+
|
|
113
|
+
def get_dataset_details(self, dataset_ids: list[str]) -> APIResponse:
|
|
114
|
+
"""
|
|
115
|
+
获取数据集详细信息
|
|
116
|
+
|
|
117
|
+
Args:
|
|
118
|
+
dataset_ids: 数据集ID列表
|
|
119
|
+
|
|
120
|
+
Returns:
|
|
121
|
+
包含数据集详情的APIResponse
|
|
122
|
+
"""
|
|
123
|
+
if not dataset_ids:
|
|
124
|
+
return APIResponse(
|
|
125
|
+
success=True,
|
|
126
|
+
data={"datasets": []},
|
|
127
|
+
source=self.source_name,
|
|
128
|
+
endpoint="/esummary.fcgi",
|
|
129
|
+
params={},
|
|
130
|
+
timestamp=""
|
|
131
|
+
)
|
|
132
|
+
|
|
133
|
+
params = {
|
|
134
|
+
"db": "gds",
|
|
135
|
+
"id": ",".join(dataset_ids[:50]),
|
|
136
|
+
"retmode": "json"
|
|
137
|
+
}
|
|
138
|
+
|
|
139
|
+
response = self._make_request("GET", "/esummary.fcgi", params=params)
|
|
140
|
+
|
|
141
|
+
if not response.success:
|
|
142
|
+
return response
|
|
143
|
+
|
|
144
|
+
return self._parse_details_response(response, dataset_ids)
|
|
145
|
+
|
|
146
|
+
def _parse_details_response(
|
|
147
|
+
self,
|
|
148
|
+
response: APIResponse,
|
|
149
|
+
dataset_ids: list[str]
|
|
150
|
+
) -> APIResponse:
|
|
151
|
+
"""解析数据集详情"""
|
|
152
|
+
try:
|
|
153
|
+
raw_data = response.data
|
|
154
|
+
if not raw_data or 'result' not in raw_data:
|
|
155
|
+
return response
|
|
156
|
+
|
|
157
|
+
result = raw_data['result']
|
|
158
|
+
datasets = []
|
|
159
|
+
|
|
160
|
+
for ds_id in dataset_ids:
|
|
161
|
+
if ds_id in result:
|
|
162
|
+
ds_info = result[ds_id]
|
|
163
|
+
# NCBI E-utilities v2: accession 是数据库记录 ID
|
|
164
|
+
# GDS 记录: accession=GDSxxx, gse=数字 → 构造 GSE accession
|
|
165
|
+
# GSE 记录: accession=GSExxx, gse=数字
|
|
166
|
+
gds_acc = ds_info.get('accession', '')
|
|
167
|
+
gse_num = ds_info.get('gse', '')
|
|
168
|
+
if gds_acc.startswith('GDS') and gse_num:
|
|
169
|
+
# GDS 策展数据集 → 用对应的 GSE 下载
|
|
170
|
+
download_acc = f"GSE{gse_num}"
|
|
171
|
+
else:
|
|
172
|
+
download_acc = gds_acc
|
|
173
|
+
datasets.append({
|
|
174
|
+
"accession": download_acc,
|
|
175
|
+
"gds_accession": gds_acc,
|
|
176
|
+
"title": ds_info.get('title', ''),
|
|
177
|
+
"summary": (ds_info.get('summary', '') or '')[:500],
|
|
178
|
+
"organism": ds_info.get('taxon', ''),
|
|
179
|
+
"platform": ds_info.get('gpl', ''),
|
|
180
|
+
"sample_count": self._parse_sample_count(ds_info),
|
|
181
|
+
"dataset_type": ds_info.get('gdstype', ''),
|
|
182
|
+
"pubmed_ids": ds_info.get('pmids', []),
|
|
183
|
+
"ftp_link": ds_info.get('ftplink', '')
|
|
184
|
+
})
|
|
185
|
+
|
|
186
|
+
return APIResponse(
|
|
187
|
+
success=True,
|
|
188
|
+
data={
|
|
189
|
+
"datasets": datasets,
|
|
190
|
+
"count": len(datasets)
|
|
191
|
+
},
|
|
192
|
+
source=self.source_name,
|
|
193
|
+
endpoint="/esummary.fcgi",
|
|
194
|
+
params={"ids": dataset_ids},
|
|
195
|
+
timestamp=response.timestamp
|
|
196
|
+
)
|
|
197
|
+
|
|
198
|
+
except (KeyError, ValueError, TypeError) as e:
|
|
199
|
+
return APIResponse(
|
|
200
|
+
success=False,
|
|
201
|
+
data=None,
|
|
202
|
+
source=self.source_name,
|
|
203
|
+
endpoint="/esummary.fcgi",
|
|
204
|
+
params={"ids": dataset_ids},
|
|
205
|
+
timestamp=response.timestamp,
|
|
206
|
+
error=f"详情解析错误: {str(e)}"
|
|
207
|
+
)
|
|
208
|
+
|
|
209
|
+
def find_differential_expression_datasets(
|
|
210
|
+
self,
|
|
211
|
+
disease: str,
|
|
212
|
+
tissue: Optional[str] = None,
|
|
213
|
+
max_results: int = 10
|
|
214
|
+
) -> APIResponse:
|
|
215
|
+
"""
|
|
216
|
+
查找差异表达数据集
|
|
217
|
+
|
|
218
|
+
优先搜索 RNA-seq 数据集(基因符号做行ID,无需探针映射),
|
|
219
|
+
再回退到微阵列数据集。
|
|
220
|
+
|
|
221
|
+
Args:
|
|
222
|
+
disease: 疾病名称
|
|
223
|
+
tissue: 组织类型(可选)
|
|
224
|
+
max_results: 最大返回数量
|
|
225
|
+
|
|
226
|
+
Returns:
|
|
227
|
+
包含差异表达数据集的APIResponse
|
|
228
|
+
"""
|
|
229
|
+
# 优先搜索 RNA-seq 数据集(行ID是基因符号,无需探针映射)
|
|
230
|
+
query_parts = [disease]
|
|
231
|
+
if tissue:
|
|
232
|
+
query_parts.append(tissue)
|
|
233
|
+
|
|
234
|
+
query = " AND ".join(query_parts)
|
|
235
|
+
query += " AND expression profiling by high throughput sequencing[gdstype]"
|
|
236
|
+
query += " AND Homo sapiens[orgn] AND gse[entry_type]"
|
|
237
|
+
|
|
238
|
+
params = {
|
|
239
|
+
"db": "gds",
|
|
240
|
+
"term": query,
|
|
241
|
+
"retmax": max_results,
|
|
242
|
+
"retmode": "json"
|
|
243
|
+
}
|
|
244
|
+
|
|
245
|
+
response = self._make_request("GET", "/esearch.fcgi", params=params)
|
|
246
|
+
|
|
247
|
+
if response.success:
|
|
248
|
+
parsed = self._parse_search_response(response, disease, query)
|
|
249
|
+
if parsed.success and parsed.data.get("total_count", 0) > 0:
|
|
250
|
+
parsed.data["dataset_type"] = "rnaseq"
|
|
251
|
+
return parsed
|
|
252
|
+
|
|
253
|
+
# 回退到微阵列数据集
|
|
254
|
+
return self._search_microarray_datasets(disease, tissue, max_results)
|
|
255
|
+
|
|
256
|
+
def _search_microarray_datasets(
|
|
257
|
+
self,
|
|
258
|
+
disease: str,
|
|
259
|
+
tissue: Optional[str],
|
|
260
|
+
max_results: int
|
|
261
|
+
) -> APIResponse:
|
|
262
|
+
"""搜索微阵列数据集"""
|
|
263
|
+
query_parts = [disease]
|
|
264
|
+
if tissue:
|
|
265
|
+
query_parts.append(tissue)
|
|
266
|
+
|
|
267
|
+
query = " AND ".join(query_parts)
|
|
268
|
+
query += " AND expression profiling by array[gdstype]"
|
|
269
|
+
query += " AND Homo sapiens[orgn] AND gse[entry_type]"
|
|
270
|
+
|
|
271
|
+
params = {
|
|
272
|
+
"db": "gds",
|
|
273
|
+
"term": query,
|
|
274
|
+
"retmax": max_results,
|
|
275
|
+
"retmode": "json"
|
|
276
|
+
}
|
|
277
|
+
|
|
278
|
+
return self._make_request("GET", "/esearch.fcgi", params=params)
|
|
279
|
+
|
|
280
|
+
def get_geo_to_sra(self, geo_accession: str) -> APIResponse:
|
|
281
|
+
"""
|
|
282
|
+
获取GEO数据集关联的SRA数据
|
|
283
|
+
|
|
284
|
+
Args:
|
|
285
|
+
geo_accession: GEO登录号(如GSE123456)
|
|
286
|
+
|
|
287
|
+
Returns:
|
|
288
|
+
包含SRA链接的APIResponse
|
|
289
|
+
"""
|
|
290
|
+
# 先搜索GEO
|
|
291
|
+
search_params = {
|
|
292
|
+
"db": "gds",
|
|
293
|
+
"term": f"{geo_accession}[accn]",
|
|
294
|
+
"retmode": "json"
|
|
295
|
+
}
|
|
296
|
+
|
|
297
|
+
search_response = self._make_request("GET", "/esearch.fcgi", params=search_params)
|
|
298
|
+
|
|
299
|
+
if not search_response.success:
|
|
300
|
+
return search_response
|
|
301
|
+
|
|
302
|
+
try:
|
|
303
|
+
ids = search_response.data.get('esearchresult', {}).get('idlist', [])
|
|
304
|
+
if not ids:
|
|
305
|
+
return APIResponse(
|
|
306
|
+
success=False,
|
|
307
|
+
data=None,
|
|
308
|
+
source=self.source_name,
|
|
309
|
+
endpoint="/elink.fcgi",
|
|
310
|
+
params={"accession": geo_accession},
|
|
311
|
+
timestamp=search_response.timestamp,
|
|
312
|
+
error=f"未找到GEO数据集: {geo_accession}"
|
|
313
|
+
)
|
|
314
|
+
|
|
315
|
+
# 链接到SRA
|
|
316
|
+
link_params = {
|
|
317
|
+
"dbfrom": "gds",
|
|
318
|
+
"db": "sra",
|
|
319
|
+
"id": ids[0]
|
|
320
|
+
}
|
|
321
|
+
|
|
322
|
+
link_response = self._make_request("GET", "/elink.fcgi", params=link_params)
|
|
323
|
+
|
|
324
|
+
if not link_response.success:
|
|
325
|
+
return link_response
|
|
326
|
+
|
|
327
|
+
# 解析SRA链接
|
|
328
|
+
sra_ids = []
|
|
329
|
+
if link_response.data and 'linksets' in link_response.data:
|
|
330
|
+
for linkset in link_response.data['linksets']:
|
|
331
|
+
for linkdb in linkset.get('linksetdbs', []):
|
|
332
|
+
for link in linkdb.get('links', []):
|
|
333
|
+
sra_ids.append(str(link))
|
|
334
|
+
|
|
335
|
+
return APIResponse(
|
|
336
|
+
success=True,
|
|
337
|
+
data={
|
|
338
|
+
"geo_accession": geo_accession,
|
|
339
|
+
"sra_ids": sra_ids[:20],
|
|
340
|
+
"sra_count": len(sra_ids)
|
|
341
|
+
},
|
|
342
|
+
source=self.source_name,
|
|
343
|
+
endpoint="/elink.fcgi",
|
|
344
|
+
params={"accession": geo_accession},
|
|
345
|
+
timestamp=link_response.timestamp
|
|
346
|
+
)
|
|
347
|
+
|
|
348
|
+
except (KeyError, ValueError, TypeError) as e:
|
|
349
|
+
return APIResponse(
|
|
350
|
+
success=False,
|
|
351
|
+
data=None,
|
|
352
|
+
source=self.source_name,
|
|
353
|
+
endpoint="/elink.fcgi",
|
|
354
|
+
params={"accession": geo_accession},
|
|
355
|
+
timestamp=search_response.timestamp,
|
|
356
|
+
error=f"SRA链接解析错误: {str(e)}"
|
|
357
|
+
)
|
|
358
|
+
|
|
359
|
+
@staticmethod
|
|
360
|
+
def _parse_sample_count(ds_info: dict) -> int:
|
|
361
|
+
"""从 NCBI summary 响应解析样本数"""
|
|
362
|
+
# GDS 记录有 n_samples 字段
|
|
363
|
+
n = ds_info.get('n_samples')
|
|
364
|
+
if n is not None:
|
|
365
|
+
return int(n)
|
|
366
|
+
# GSE 记录样本数在 ssinfo 字段中
|
|
367
|
+
ssinfo = ds_info.get('ssinfo', '')
|
|
368
|
+
if ssinfo:
|
|
369
|
+
import re as _re
|
|
370
|
+
m = _re.search(r'(\d+)', str(ssinfo))
|
|
371
|
+
if m:
|
|
372
|
+
return int(m.group(1))
|
|
373
|
+
return 0
|
|
374
|
+
|
|
375
|
+
def validate_dataset(self, dataset: dict) -> tuple[bool, list[str]]:
|
|
376
|
+
"""验证数据集质量"""
|
|
377
|
+
issues = []
|
|
378
|
+
|
|
379
|
+
# 检查样本量
|
|
380
|
+
sample_count = dataset.get("sample_count", 0)
|
|
381
|
+
if sample_count < 10:
|
|
382
|
+
issues.append(f"样本量不足: {sample_count} < 10")
|
|
383
|
+
|
|
384
|
+
# 检查物种
|
|
385
|
+
organism = dataset.get("organism", "")
|
|
386
|
+
if "Homo sapiens" not in organism and "human" not in organism.lower():
|
|
387
|
+
issues.append(f"非人类数据集: {organism}")
|
|
388
|
+
|
|
389
|
+
# 检查数据集类型
|
|
390
|
+
dataset_type = dataset.get("dataset_type", "")
|
|
391
|
+
if "expression" not in dataset_type.lower():
|
|
392
|
+
issues.append(f"非表达数据集: {dataset_type}")
|
|
393
|
+
|
|
394
|
+
usable, reason = self.is_usable_expression_dataset(dataset)
|
|
395
|
+
if not usable:
|
|
396
|
+
issues.append(reason)
|
|
397
|
+
|
|
398
|
+
return len(issues) == 0, issues
|
|
399
|
+
|
|
400
|
+
@staticmethod
|
|
401
|
+
def is_usable_expression_dataset(dataset: dict) -> tuple[bool, str]:
|
|
402
|
+
"""排除 SuperSeries 等无本地表达矩阵的数据集。"""
|
|
403
|
+
title = (dataset.get("title") or "").lower()
|
|
404
|
+
summary = (dataset.get("summary") or "").lower()
|
|
405
|
+
dtype = (dataset.get("dataset_type") or "").lower()
|
|
406
|
+
|
|
407
|
+
if "superseries" in title or "superseries" in summary:
|
|
408
|
+
return False, "SuperSeries 无本地表达矩阵"
|
|
409
|
+
if "composed of the subseries" in summary:
|
|
410
|
+
return False, "SuperSeries 无本地表达矩阵"
|
|
411
|
+
if "refer to individual series" in summary and "expression" not in dtype:
|
|
412
|
+
return False, "父级汇总数据集,无表达矩阵"
|
|
413
|
+
if dtype == "other" and "expression" not in title and "expression" not in summary:
|
|
414
|
+
return False, "非表达数据集 (Other)"
|
|
415
|
+
if (
|
|
416
|
+
"expression" not in dtype
|
|
417
|
+
and "high throughput" not in dtype
|
|
418
|
+
and "array" not in dtype
|
|
419
|
+
):
|
|
420
|
+
return False, f"非表达数据集: {dataset.get('dataset_type', 'unknown')}"
|
|
421
|
+
return True, ""
|
|
422
|
+
|
|
423
|
+
def filter_expression_datasets(self, datasets: list[dict]) -> list[dict]:
|
|
424
|
+
"""仅保留可用于差异表达分析的数据集。"""
|
|
425
|
+
kept: list[dict] = []
|
|
426
|
+
for dataset in datasets:
|
|
427
|
+
usable, reason = self.is_usable_expression_dataset(dataset)
|
|
428
|
+
if usable:
|
|
429
|
+
kept.append(dataset)
|
|
430
|
+
return kept
|
|
431
|
+
|
|
432
|
+
@staticmethod
|
|
433
|
+
def series_matrix_has_expression_table(file_path: str) -> bool:
|
|
434
|
+
"""快速检测 series matrix 是否含表达表(避免 SuperSeries 元数据文件)。"""
|
|
435
|
+
path = Path(file_path)
|
|
436
|
+
if not path.exists():
|
|
437
|
+
return False
|
|
438
|
+
try:
|
|
439
|
+
open_func = gzip.open if str(file_path).endswith(".gz") else open
|
|
440
|
+
mode = "rt" if str(file_path).endswith(".gz") else "r"
|
|
441
|
+
in_table = False
|
|
442
|
+
with open_func(file_path, mode, encoding="utf-8", errors="replace") as handle:
|
|
443
|
+
for _ in range(5000):
|
|
444
|
+
line = handle.readline()
|
|
445
|
+
if not line:
|
|
446
|
+
break
|
|
447
|
+
stripped = line.strip()
|
|
448
|
+
if stripped.startswith("!series_matrix_table_begin") or stripped.startswith(
|
|
449
|
+
"!sample_table_begin"
|
|
450
|
+
):
|
|
451
|
+
in_table = True
|
|
452
|
+
continue
|
|
453
|
+
if stripped.startswith("!series_matrix_table_end") or stripped.startswith(
|
|
454
|
+
"!sample_table_end"
|
|
455
|
+
):
|
|
456
|
+
break
|
|
457
|
+
if not in_table:
|
|
458
|
+
continue
|
|
459
|
+
if stripped.startswith("!") or stripped.startswith("#") or not stripped:
|
|
460
|
+
continue
|
|
461
|
+
unquoted = stripped.strip('"')
|
|
462
|
+
if unquoted.startswith("ID_REF"):
|
|
463
|
+
return True
|
|
464
|
+
parts = stripped.split("\t")
|
|
465
|
+
if len(parts) > 1:
|
|
466
|
+
probe = parts[0].strip('"')
|
|
467
|
+
if probe and probe != "ID_REF":
|
|
468
|
+
try:
|
|
469
|
+
float(parts[1].strip('"'))
|
|
470
|
+
return True
|
|
471
|
+
except ValueError:
|
|
472
|
+
pass
|
|
473
|
+
return False
|
|
474
|
+
except OSError:
|
|
475
|
+
return False
|
|
476
|
+
|
|
477
|
+
def rank_datasets(
|
|
478
|
+
self,
|
|
479
|
+
datasets: list[dict],
|
|
480
|
+
disease: str
|
|
481
|
+
) -> list[dict]:
|
|
482
|
+
"""
|
|
483
|
+
对数据集进行质量排序
|
|
484
|
+
|
|
485
|
+
Args:
|
|
486
|
+
datasets: 数据集列表
|
|
487
|
+
disease: 疾病名称
|
|
488
|
+
|
|
489
|
+
Returns:
|
|
490
|
+
排序后的数据集列表
|
|
491
|
+
"""
|
|
492
|
+
scored_datasets = []
|
|
493
|
+
datasets = self.filter_expression_datasets(datasets)
|
|
494
|
+
|
|
495
|
+
for ds in datasets:
|
|
496
|
+
score = 0
|
|
497
|
+
|
|
498
|
+
# 样本量得分
|
|
499
|
+
sample_count = ds.get("sample_count", 0)
|
|
500
|
+
if sample_count >= 100:
|
|
501
|
+
score += 3
|
|
502
|
+
elif sample_count >= 50:
|
|
503
|
+
score += 2
|
|
504
|
+
elif sample_count >= 20:
|
|
505
|
+
score += 1
|
|
506
|
+
|
|
507
|
+
# 数据类型得分
|
|
508
|
+
dataset_type = ds.get("dataset_type", "").lower()
|
|
509
|
+
if "high throughput sequencing" in dataset_type:
|
|
510
|
+
score += 3 # RNA-seq优先
|
|
511
|
+
elif "array" in dataset_type:
|
|
512
|
+
score += 2
|
|
513
|
+
|
|
514
|
+
# 疾病相关性得分
|
|
515
|
+
title = ds.get("title", "").lower()
|
|
516
|
+
if disease.lower() in title:
|
|
517
|
+
score += 2
|
|
518
|
+
|
|
519
|
+
# 有PubMed文献支持
|
|
520
|
+
if ds.get("pubmed_ids"):
|
|
521
|
+
score += 1
|
|
522
|
+
|
|
523
|
+
ds["quality_score"] = score
|
|
524
|
+
scored_datasets.append(ds)
|
|
525
|
+
|
|
526
|
+
# 按得分排序
|
|
527
|
+
scored_datasets.sort(key=lambda x: x["quality_score"], reverse=True)
|
|
528
|
+
|
|
529
|
+
return scored_datasets
|
|
530
|
+
|
|
531
|
+
def download_series_matrix(
|
|
532
|
+
self,
|
|
533
|
+
geo_accession: str,
|
|
534
|
+
output_dir: Optional[str] = None
|
|
535
|
+
) -> APIResponse:
|
|
536
|
+
"""
|
|
537
|
+
下载 GEO Series Matrix 文件
|
|
538
|
+
|
|
539
|
+
Args:
|
|
540
|
+
geo_accession: GEO 登录号,如 "GSE12345"
|
|
541
|
+
output_dir: 输出目录(默认使用临时目录)
|
|
542
|
+
|
|
543
|
+
Returns:
|
|
544
|
+
APIResponse 包含 {"file_path": str, "accession": str}
|
|
545
|
+
"""
|
|
546
|
+
import requests as req
|
|
547
|
+
|
|
548
|
+
# 构建 URL
|
|
549
|
+
# GSE12345 → GSE12nnn
|
|
550
|
+
num = int(geo_accession.replace("GSE", ""))
|
|
551
|
+
series_dir = f"GSE{num // 1000}nnn"
|
|
552
|
+
base_url = f"https://ftp.ncbi.nlm.nih.gov/geo/series/{series_dir}/{geo_accession}/matrix"
|
|
553
|
+
|
|
554
|
+
# 尝试下载
|
|
555
|
+
output_path = Path(output_dir) if output_dir else Path(tempfile.gettempdir())
|
|
556
|
+
output_path.mkdir(parents=True, exist_ok=True)
|
|
557
|
+
|
|
558
|
+
file_path = output_path / f"{geo_accession}_series_matrix.txt.gz"
|
|
559
|
+
|
|
560
|
+
# 检查缓存(无效 SuperSeries 缓存需剔除)
|
|
561
|
+
if file_path.exists():
|
|
562
|
+
if self.series_matrix_has_expression_table(str(file_path)):
|
|
563
|
+
return APIResponse(
|
|
564
|
+
success=True,
|
|
565
|
+
data={"file_path": str(file_path), "accession": geo_accession},
|
|
566
|
+
source=self.source_name,
|
|
567
|
+
endpoint=base_url,
|
|
568
|
+
params={"accession": geo_accession},
|
|
569
|
+
timestamp=""
|
|
570
|
+
)
|
|
571
|
+
try:
|
|
572
|
+
file_path.unlink()
|
|
573
|
+
except OSError:
|
|
574
|
+
pass
|
|
575
|
+
|
|
576
|
+
try:
|
|
577
|
+
# 先获取目录列表找到确切文件名
|
|
578
|
+
dir_resp = req.get(base_url + "/", timeout=30)
|
|
579
|
+
dir_resp.raise_for_status()
|
|
580
|
+
|
|
581
|
+
# 查找 series_matrix.txt.gz(兼容 GSE12345 与 GSE12345-GPLxxxx 命名)
|
|
582
|
+
candidates = re.findall(
|
|
583
|
+
rf'({re.escape(geo_accession)}(?:-GPL\d+)?_series_matrix\.txt\.gz)',
|
|
584
|
+
dir_resp.text,
|
|
585
|
+
)
|
|
586
|
+
if not candidates:
|
|
587
|
+
return APIResponse(
|
|
588
|
+
success=False, data=None, source=self.source_name,
|
|
589
|
+
endpoint=base_url, params={"accession": geo_accession},
|
|
590
|
+
timestamp="",
|
|
591
|
+
error=f"未找到 {geo_accession} 的 series matrix 文件"
|
|
592
|
+
)
|
|
593
|
+
|
|
594
|
+
def _size_hint(name: str) -> int:
|
|
595
|
+
pattern = rf'{re.escape(name)}</a>\s+[\d-]+\s+[\d:]+\s+([\d.]+)([KMG]?)'
|
|
596
|
+
m = re.search(pattern, dir_resp.text)
|
|
597
|
+
if not m:
|
|
598
|
+
return 0
|
|
599
|
+
value = float(m.group(1))
|
|
600
|
+
unit = m.group(2).upper()
|
|
601
|
+
multiplier = {"K": 1024, "M": 1024 ** 2, "G": 1024 ** 3}.get(unit, 1)
|
|
602
|
+
return int(value * multiplier)
|
|
603
|
+
|
|
604
|
+
filename = max(set(candidates), key=_size_hint)
|
|
605
|
+
file_url = f"{base_url}/{filename}"
|
|
606
|
+
|
|
607
|
+
# 下载文件
|
|
608
|
+
self._wait_for_rate_limit()
|
|
609
|
+
dl_resp = req.get(file_url, timeout=120, stream=True)
|
|
610
|
+
dl_resp.raise_for_status()
|
|
611
|
+
|
|
612
|
+
with open(file_path, 'wb') as f:
|
|
613
|
+
for chunk in dl_resp.iter_content(chunk_size=8192):
|
|
614
|
+
f.write(chunk)
|
|
615
|
+
|
|
616
|
+
if not self.series_matrix_has_expression_table(str(file_path)):
|
|
617
|
+
try:
|
|
618
|
+
file_path.unlink()
|
|
619
|
+
except OSError:
|
|
620
|
+
pass
|
|
621
|
+
return APIResponse(
|
|
622
|
+
success=False, data=None, source=self.source_name,
|
|
623
|
+
endpoint=file_url, params={"accession": geo_accession},
|
|
624
|
+
timestamp="",
|
|
625
|
+
error=f"{geo_accession} 下载文件无表达矩阵(可能为 SuperSeries)"
|
|
626
|
+
)
|
|
627
|
+
|
|
628
|
+
return APIResponse(
|
|
629
|
+
success=True,
|
|
630
|
+
data={"file_path": str(file_path), "accession": geo_accession},
|
|
631
|
+
source=self.source_name,
|
|
632
|
+
endpoint=file_url,
|
|
633
|
+
params={"accession": geo_accession},
|
|
634
|
+
timestamp=""
|
|
635
|
+
)
|
|
636
|
+
|
|
637
|
+
except Exception as e:
|
|
638
|
+
return APIResponse(
|
|
639
|
+
success=False, data=None, source=self.source_name,
|
|
640
|
+
endpoint=base_url, params={"accession": geo_accession},
|
|
641
|
+
timestamp="",
|
|
642
|
+
error=f"下载失败: {str(e)}"
|
|
643
|
+
)
|
|
644
|
+
|
|
645
|
+
def download_platform_annotation(
|
|
646
|
+
self,
|
|
647
|
+
platform_id: str,
|
|
648
|
+
output_dir: Optional[str] = None
|
|
649
|
+
) -> APIResponse:
|
|
650
|
+
"""
|
|
651
|
+
下载 GPL 平台注释文件,用于探针 ID → 基因符号映射
|
|
652
|
+
|
|
653
|
+
Args:
|
|
654
|
+
platform_id: GPL 编号,如 "GPL570"
|
|
655
|
+
output_dir: 输出目录
|
|
656
|
+
|
|
657
|
+
Returns:
|
|
658
|
+
APIResponse 包含 {"file_path": str, "platform_id": str}
|
|
659
|
+
"""
|
|
660
|
+
import requests as req
|
|
661
|
+
|
|
662
|
+
output_path = Path(output_dir) if output_dir else Path(tempfile.gettempdir())
|
|
663
|
+
output_path.mkdir(parents=True, exist_ok=True)
|
|
664
|
+
file_path = output_path / f"{platform_id}_annot.txt.gz"
|
|
665
|
+
|
|
666
|
+
# 检查缓存
|
|
667
|
+
if file_path.exists():
|
|
668
|
+
return APIResponse(
|
|
669
|
+
success=True,
|
|
670
|
+
data={"file_path": str(file_path), "platform_id": platform_id},
|
|
671
|
+
source=self.source_name,
|
|
672
|
+
endpoint="platform_annotation",
|
|
673
|
+
params={"platform_id": platform_id},
|
|
674
|
+
timestamp=""
|
|
675
|
+
)
|
|
676
|
+
|
|
677
|
+
# 尝试从 GEO FTP 下载平台注释文件
|
|
678
|
+
num = int(platform_id.replace("GPL", ""))
|
|
679
|
+
platform_dir = f"GPL{num // 1000}nnn"
|
|
680
|
+
base_url = f"https://ftp.ncbi.nlm.nih.gov/geo/platform/{platform_dir}/{platform_id}/annot"
|
|
681
|
+
|
|
682
|
+
try:
|
|
683
|
+
# 列出目录,找到注释文件
|
|
684
|
+
dir_resp = req.get(base_url + "/", timeout=30)
|
|
685
|
+
if dir_resp.status_code != 200:
|
|
686
|
+
# 尝试软平台格式 (SOFT 格式)
|
|
687
|
+
soft_url = f"https://ftp.ncbi.nlm.nih.gov/geo/platform/{platform_dir}/{platform_id}/soft/{platform_id}"
|
|
688
|
+
soft_file = output_path / f"{platform_id}_annot.txt.gz"
|
|
689
|
+
soft_resp = req.get(soft_url, timeout=60, stream=True)
|
|
690
|
+
if soft_resp.status_code == 200:
|
|
691
|
+
with open(soft_file, 'wb') as f:
|
|
692
|
+
for chunk in soft_resp.iter_content(chunk_size=8192):
|
|
693
|
+
f.write(chunk)
|
|
694
|
+
return APIResponse(
|
|
695
|
+
success=True,
|
|
696
|
+
data={"file_path": str(soft_file), "platform_id": platform_id},
|
|
697
|
+
source=self.source_name,
|
|
698
|
+
endpoint=soft_url,
|
|
699
|
+
params={"platform_id": platform_id},
|
|
700
|
+
timestamp=""
|
|
701
|
+
)
|
|
702
|
+
return APIResponse(
|
|
703
|
+
success=False, data=None, source=self.source_name,
|
|
704
|
+
endpoint=base_url, params={"platform_id": platform_id},
|
|
705
|
+
timestamp="", error=f"无法下载 {platform_id} 注释文件"
|
|
706
|
+
)
|
|
707
|
+
|
|
708
|
+
# 查找注释文件
|
|
709
|
+
match = re.search(
|
|
710
|
+
rf'({platform_id}[.-].*?\.txt\.gz)',
|
|
711
|
+
dir_resp.text
|
|
712
|
+
)
|
|
713
|
+
if not match:
|
|
714
|
+
# 回退:使用 NCBI E-utilities 获取平台信息
|
|
715
|
+
return self._fetch_platform_via_eutils(platform_id, output_path)
|
|
716
|
+
|
|
717
|
+
filename = match.group(1)
|
|
718
|
+
file_url = f"{base_url}/{filename}"
|
|
719
|
+
|
|
720
|
+
self._wait_for_rate_limit()
|
|
721
|
+
dl_resp = req.get(file_url, timeout=120, stream=True)
|
|
722
|
+
dl_resp.raise_for_status()
|
|
723
|
+
|
|
724
|
+
with open(file_path, 'wb') as f:
|
|
725
|
+
for chunk in dl_resp.iter_content(chunk_size=8192):
|
|
726
|
+
f.write(chunk)
|
|
727
|
+
|
|
728
|
+
return APIResponse(
|
|
729
|
+
success=True,
|
|
730
|
+
data={"file_path": str(file_path), "platform_id": platform_id},
|
|
731
|
+
source=self.source_name,
|
|
732
|
+
endpoint=file_url,
|
|
733
|
+
params={"platform_id": platform_id},
|
|
734
|
+
timestamp=""
|
|
735
|
+
)
|
|
736
|
+
|
|
737
|
+
except Exception as e:
|
|
738
|
+
# 最终回退:通过 E-utilities 获取
|
|
739
|
+
return self._fetch_platform_via_eutils(platform_id, output_path)
|
|
740
|
+
|
|
741
|
+
def _fetch_platform_via_eutils(
|
|
742
|
+
self,
|
|
743
|
+
platform_id: str,
|
|
744
|
+
output_path: Path
|
|
745
|
+
) -> APIResponse:
|
|
746
|
+
"""通过 NCBI E-utilities 获取平台注释数据"""
|
|
747
|
+
import requests as req
|
|
748
|
+
|
|
749
|
+
# 使用 efetch 获取 GPL SOFT 格式
|
|
750
|
+
gpl_num = platform_id.replace("GPL", "")
|
|
751
|
+
params = {
|
|
752
|
+
"db": "gpl",
|
|
753
|
+
"id": gpl_num,
|
|
754
|
+
"rettype": "soft",
|
|
755
|
+
"retmode": "text"
|
|
756
|
+
}
|
|
757
|
+
|
|
758
|
+
try:
|
|
759
|
+
self._wait_for_rate_limit()
|
|
760
|
+
resp = req.get(f"{self.base_url}/efetch.fcgi", params=params, timeout=60)
|
|
761
|
+
resp.raise_for_status()
|
|
762
|
+
|
|
763
|
+
file_path = output_path / f"{platform_id}_annot.txt"
|
|
764
|
+
with open(file_path, 'w', encoding='utf-8') as f:
|
|
765
|
+
f.write(resp.text)
|
|
766
|
+
|
|
767
|
+
return APIResponse(
|
|
768
|
+
success=True,
|
|
769
|
+
data={"file_path": str(file_path), "platform_id": platform_id},
|
|
770
|
+
source=self.source_name,
|
|
771
|
+
endpoint="/efetch.fcgi",
|
|
772
|
+
params={"platform_id": platform_id},
|
|
773
|
+
timestamp=""
|
|
774
|
+
)
|
|
775
|
+
except Exception as e:
|
|
776
|
+
return APIResponse(
|
|
777
|
+
success=False, data=None, source=self.source_name,
|
|
778
|
+
endpoint="/efetch.fcgi", params={"platform_id": platform_id},
|
|
779
|
+
timestamp="", error=f"通过 E-utilities 获取 {platform_id} 失败: {str(e)}"
|
|
780
|
+
)
|
|
781
|
+
|
|
782
|
+
def build_probe_gene_map(
|
|
783
|
+
self,
|
|
784
|
+
platform_id: str,
|
|
785
|
+
cache_dir: Optional[str] = None
|
|
786
|
+
) -> dict:
|
|
787
|
+
"""
|
|
788
|
+
构建 探针 ID → 基因符号 映射表
|
|
789
|
+
|
|
790
|
+
Args:
|
|
791
|
+
platform_id: GPL 编号,如 "GPL570"
|
|
792
|
+
cache_dir: 缓存目录
|
|
793
|
+
|
|
794
|
+
Returns:
|
|
795
|
+
{"probe_id": "gene_symbol", ...} 映射字典
|
|
796
|
+
"""
|
|
797
|
+
import pandas as pd
|
|
798
|
+
|
|
799
|
+
annot_dir = str(Path(cache_dir) / "platform_annotations") if cache_dir else None
|
|
800
|
+
|
|
801
|
+
# 1. 先检查是否有本地缓存映射
|
|
802
|
+
if cache_dir:
|
|
803
|
+
map_cache = Path(cache_dir) / "probe_maps" / f"{platform_id}_probe_map.json"
|
|
804
|
+
if map_cache.exists():
|
|
805
|
+
import json
|
|
806
|
+
with open(map_cache, 'r', encoding='utf-8') as f:
|
|
807
|
+
return json.load(f)
|
|
808
|
+
|
|
809
|
+
# 2. 下载注释文件
|
|
810
|
+
dl_result = self.download_platform_annotation(platform_id, output_dir=annot_dir)
|
|
811
|
+
if not dl_result.success:
|
|
812
|
+
return {}
|
|
813
|
+
|
|
814
|
+
file_path = dl_result.data["file_path"]
|
|
815
|
+
probe_map = {}
|
|
816
|
+
|
|
817
|
+
try:
|
|
818
|
+
# 判断文件格式并解析
|
|
819
|
+
open_func = gzip.open if file_path.endswith('.gz') else open
|
|
820
|
+
mode = 'rt' if file_path.endswith('.gz') else 'r'
|
|
821
|
+
|
|
822
|
+
in_data = False
|
|
823
|
+
header_line = None
|
|
824
|
+
id_col_idx = None
|
|
825
|
+
gene_col_idx = None
|
|
826
|
+
gene_symbol_patterns = [
|
|
827
|
+
"gene symbol", "gene_symbol", "genesymbol",
|
|
828
|
+
"gene assignment", "gene_assignment",
|
|
829
|
+
"symbol", "gene title", "gene_title",
|
|
830
|
+
"GENE_SYMBOL", "Gene Symbol"
|
|
831
|
+
]
|
|
832
|
+
|
|
833
|
+
with open_func(file_path, mode, encoding='utf-8', errors='replace') as f:
|
|
834
|
+
for line in f:
|
|
835
|
+
line = line.strip()
|
|
836
|
+
|
|
837
|
+
# SOFT 格式:找到数据表开始
|
|
838
|
+
if line.startswith('^DATABASE') or line.startswith('^PLATFORM'):
|
|
839
|
+
continue
|
|
840
|
+
|
|
841
|
+
if line.startswith('!platform_table_begin'):
|
|
842
|
+
in_data = True
|
|
843
|
+
continue
|
|
844
|
+
if line.startswith('!platform_table_end'):
|
|
845
|
+
break
|
|
846
|
+
|
|
847
|
+
# 非 SOFT 格式的 tab 分隔注释文件
|
|
848
|
+
if not in_data and not line.startswith('#') and '\t' in line:
|
|
849
|
+
# 检查是否是表头行
|
|
850
|
+
parts = [p.strip('"').strip() for p in line.split('\t')]
|
|
851
|
+
lower_parts = [p.lower() for p in parts]
|
|
852
|
+
# 找 ID 和 Gene Symbol 列
|
|
853
|
+
for idx, lp in enumerate(lower_parts):
|
|
854
|
+
if lp == "id" or lp == "probe_id" or lp == "id_ref":
|
|
855
|
+
id_col_idx = idx
|
|
856
|
+
for pattern in gene_symbol_patterns:
|
|
857
|
+
if pattern in lp:
|
|
858
|
+
gene_col_idx = idx
|
|
859
|
+
break
|
|
860
|
+
if id_col_idx is not None and gene_col_idx is not None:
|
|
861
|
+
in_data = True
|
|
862
|
+
header_line = parts
|
|
863
|
+
continue
|
|
864
|
+
|
|
865
|
+
if not in_data:
|
|
866
|
+
continue
|
|
867
|
+
|
|
868
|
+
# 跳过表头行
|
|
869
|
+
if header_line is not None and line.startswith(header_line[0]):
|
|
870
|
+
continue
|
|
871
|
+
|
|
872
|
+
if not line or line.startswith('#') or line.startswith('!'):
|
|
873
|
+
continue
|
|
874
|
+
|
|
875
|
+
parts = [p.strip('"').strip() for p in line.split('\t')]
|
|
876
|
+
|
|
877
|
+
# 如果还没找到列索引,第一行就是表头
|
|
878
|
+
if id_col_idx is None:
|
|
879
|
+
lower_parts = [p.lower() for p in parts]
|
|
880
|
+
for idx, lp in enumerate(lower_parts):
|
|
881
|
+
if lp == "id" or lp == "probe_id" or lp == "id_ref":
|
|
882
|
+
id_col_idx = idx
|
|
883
|
+
for pattern in gene_symbol_patterns:
|
|
884
|
+
if pattern in lp:
|
|
885
|
+
gene_col_idx = idx
|
|
886
|
+
break
|
|
887
|
+
continue
|
|
888
|
+
|
|
889
|
+
# 提取映射
|
|
890
|
+
if id_col_idx < len(parts):
|
|
891
|
+
probe_id = parts[id_col_idx]
|
|
892
|
+
if gene_col_idx is not None and gene_col_idx < len(parts):
|
|
893
|
+
gene_field = parts[gene_col_idx]
|
|
894
|
+
# 解析基因符号 — 多种格式:
|
|
895
|
+
# 直接: "TP53"
|
|
896
|
+
# Affymetrix: "TP53 /// MDM2" (多基因)
|
|
897
|
+
# Illumina: "NM_001126112 /// TP53" (转录本+基因)
|
|
898
|
+
# 赋值格式: "GB_ACC:NM_001126112 // STRAND:+ // SYMBOL:TP53"
|
|
899
|
+
gene_symbol = self._parse_gene_symbol(gene_field)
|
|
900
|
+
if gene_symbol:
|
|
901
|
+
probe_map[probe_id] = gene_symbol
|
|
902
|
+
|
|
903
|
+
except Exception as e:
|
|
904
|
+
# 解析失败,返回空映射
|
|
905
|
+
pass
|
|
906
|
+
|
|
907
|
+
# 3. 缓存映射结果
|
|
908
|
+
if cache_dir and probe_map:
|
|
909
|
+
map_cache = Path(cache_dir) / "probe_maps"
|
|
910
|
+
map_cache.mkdir(parents=True, exist_ok=True)
|
|
911
|
+
map_file = map_cache / f"{platform_id}_probe_map.json"
|
|
912
|
+
import json
|
|
913
|
+
with open(map_file, 'w', encoding='utf-8') as f:
|
|
914
|
+
json.dump(probe_map, f, ensure_ascii=False)
|
|
915
|
+
|
|
916
|
+
return probe_map
|
|
917
|
+
|
|
918
|
+
@staticmethod
|
|
919
|
+
def _parse_gene_symbol(gene_field: str) -> str:
|
|
920
|
+
"""
|
|
921
|
+
从平台注释字段中解析基因符号
|
|
922
|
+
|
|
923
|
+
支持多种格式:
|
|
924
|
+
- 直接基因符号: "TP53"
|
|
925
|
+
- Affymetrix 多基因: "TP53 /// MDM2" → 取第一个
|
|
926
|
+
- Illumina 赋值: "GB_ACC:NM_001126112 // STRAND:+ // SYMBOL:TP53" → 提取 SYMBOL
|
|
927
|
+
- 转录本+基因: "NM_001126112 /// TP53" → 取基因符号部分
|
|
928
|
+
"""
|
|
929
|
+
if not gene_field or gene_field in ('---', 'nan', '', 'null', 'NA'):
|
|
930
|
+
return ""
|
|
931
|
+
|
|
932
|
+
# 赋值格式: "KEY:VALUE // KEY2:VALUE2"
|
|
933
|
+
if '//' in gene_field and ':' in gene_field:
|
|
934
|
+
parts = gene_field.split('//')
|
|
935
|
+
for part in parts:
|
|
936
|
+
part = part.strip()
|
|
937
|
+
if part.upper().startswith('SYMBOL:') or part.upper().startswith('GENE SYMBOL:'):
|
|
938
|
+
symbol = part.split(':', 1)[1].strip()
|
|
939
|
+
if symbol and not symbol.startswith('NM_') and not symbol.startswith('NR_'):
|
|
940
|
+
return symbol
|
|
941
|
+
# 没有 SYMBOL 键,尝试取非转录本部分
|
|
942
|
+
for part in parts:
|
|
943
|
+
part = part.strip()
|
|
944
|
+
if ':' in part:
|
|
945
|
+
val = part.split(':', 1)[1].strip()
|
|
946
|
+
else:
|
|
947
|
+
val = part.strip()
|
|
948
|
+
if val and not val.startswith('NM_') and not val.startswith('NR_') and not val.startswith('ENST'):
|
|
949
|
+
return val
|
|
950
|
+
return ""
|
|
951
|
+
|
|
952
|
+
# Affymetrix 多基因格式: "TP53 /// MDM2"
|
|
953
|
+
if '///' in gene_field:
|
|
954
|
+
parts = gene_field.split('///')
|
|
955
|
+
for part in parts:
|
|
956
|
+
part = part.strip()
|
|
957
|
+
# 跳过转录本 ID
|
|
958
|
+
if part and not part.startswith('NM_') and not part.startswith('NR_') and not part.startswith('ENST'):
|
|
959
|
+
# 去掉引号
|
|
960
|
+
part = part.strip('"').strip("'")
|
|
961
|
+
if part:
|
|
962
|
+
return part
|
|
963
|
+
return ""
|
|
964
|
+
|
|
965
|
+
# 直接基因符号
|
|
966
|
+
gene_field = gene_field.strip().strip('"').strip("'")
|
|
967
|
+
# 如果是纯转录本 ID,跳过
|
|
968
|
+
if gene_field.startswith('NM_') or gene_field.startswith('NR_') or gene_field.startswith('ENST'):
|
|
969
|
+
return ""
|
|
970
|
+
|
|
971
|
+
return gene_field
|
|
972
|
+
|
|
973
|
+
def _parse_gene_symbol_from_data_table(
|
|
974
|
+
self,
|
|
975
|
+
data_lines: list[str],
|
|
976
|
+
header_samples: list[str]
|
|
977
|
+
) -> dict:
|
|
978
|
+
"""
|
|
979
|
+
从 series matrix 数据表中直接提取 探针ID → 基因符号 映射
|
|
980
|
+
|
|
981
|
+
很多 GEO 数据集的表达数据行格式为:
|
|
982
|
+
ID_REF Sample1 Sample2 ... (但某些平台会在数据行中包含基因符号)
|
|
983
|
+
|
|
984
|
+
也处理 SOFT 格式中 !platform_table_begin 区域的基因符号列。
|
|
985
|
+
"""
|
|
986
|
+
probe_map = {}
|
|
987
|
+
# 常见的基因符号列名模式
|
|
988
|
+
gene_col_patterns = [
|
|
989
|
+
"gene symbol", "gene_symbol", "genesymbol", "symbol",
|
|
990
|
+
"gene_assignment", "gene title", "gene_title",
|
|
991
|
+
"GENE_SYMBOL", "Gene Symbol", "gene", "gene name"
|
|
992
|
+
]
|
|
993
|
+
|
|
994
|
+
for line in data_lines[:5]: # 只检查前几行来判断格式
|
|
995
|
+
parts = [p.strip('"').strip() for p in line.split('\t')]
|
|
996
|
+
if len(parts) < 3:
|
|
997
|
+
continue
|
|
998
|
+
# 如果第二列看起来是基因符号(非数字、长度合理)
|
|
999
|
+
candidate = parts[1] if len(parts) > 1 else ""
|
|
1000
|
+
if (candidate and not candidate.replace('.', '').replace('-', '').isdigit()
|
|
1001
|
+
and len(candidate) <= 30 and not candidate.startswith('GSM')):
|
|
1002
|
+
# 可能是基因符号列
|
|
1003
|
+
# 验证:检查更多行
|
|
1004
|
+
gene_col_idx = 1
|
|
1005
|
+
mapped = 0
|
|
1006
|
+
for dl in data_lines[:200]:
|
|
1007
|
+
dp = [p.strip('"').strip() for p in dl.split('\t')]
|
|
1008
|
+
if len(dp) > gene_col_idx:
|
|
1009
|
+
probe_id = dp[0]
|
|
1010
|
+
gene_sym = dp[gene_col_idx]
|
|
1011
|
+
if gene_sym and not gene_sym.replace('.', '').replace('-', '').isdigit():
|
|
1012
|
+
# 验证看起来像基因符号
|
|
1013
|
+
if len(gene_sym) <= 30 and not gene_sym.startswith('GSM'):
|
|
1014
|
+
parsed = self._parse_gene_symbol(gene_sym)
|
|
1015
|
+
if parsed:
|
|
1016
|
+
probe_map[probe_id] = parsed
|
|
1017
|
+
mapped += 1
|
|
1018
|
+
if mapped > len(data_lines) * 0.1: # 至少10%映射成功
|
|
1019
|
+
return probe_map
|
|
1020
|
+
|
|
1021
|
+
return probe_map
|
|
1022
|
+
|
|
1023
|
+
def parse_series_matrix(
|
|
1024
|
+
self,
|
|
1025
|
+
file_path: str,
|
|
1026
|
+
target_genes: Optional[list[str]] = None,
|
|
1027
|
+
probe_id_map: Optional[dict] = None,
|
|
1028
|
+
cache_dir: Optional[str] = None
|
|
1029
|
+
) -> APIResponse:
|
|
1030
|
+
"""
|
|
1031
|
+
解析 GEO Series Matrix 文件
|
|
1032
|
+
|
|
1033
|
+
Args:
|
|
1034
|
+
file_path: series_matrix.txt.gz 文件路径
|
|
1035
|
+
target_genes: 目标基因列表(None 则解析全部)
|
|
1036
|
+
probe_id_map: 探针→基因映射(None 则自动从平台注释构建)
|
|
1037
|
+
cache_dir: 缓存目录(用于下载/缓存平台注释)
|
|
1038
|
+
|
|
1039
|
+
Returns:
|
|
1040
|
+
APIResponse 包含 {
|
|
1041
|
+
"expression_matrix": pd.DataFrame, # gene_symbols x samples
|
|
1042
|
+
"sample_metadata": dict,
|
|
1043
|
+
"platform": str,
|
|
1044
|
+
"gene_count": int,
|
|
1045
|
+
"sample_count": int,
|
|
1046
|
+
"probe_mapping_stats": dict
|
|
1047
|
+
}
|
|
1048
|
+
"""
|
|
1049
|
+
try:
|
|
1050
|
+
import pandas as pd
|
|
1051
|
+
except ImportError:
|
|
1052
|
+
return APIResponse(
|
|
1053
|
+
success=False, data=None, source=self.source_name,
|
|
1054
|
+
endpoint="parse_series_matrix", params={"file_path": file_path},
|
|
1055
|
+
timestamp="", error="需要安装 pandas"
|
|
1056
|
+
)
|
|
1057
|
+
|
|
1058
|
+
try:
|
|
1059
|
+
open_func = gzip.open if file_path.endswith('.gz') else open
|
|
1060
|
+
mode = 'rt' if file_path.endswith('.gz') else 'r'
|
|
1061
|
+
|
|
1062
|
+
metadata = {}
|
|
1063
|
+
sample_titles = {}
|
|
1064
|
+
sample_characteristics = {} # sample_index -> list of characteristic strings
|
|
1065
|
+
data_lines = []
|
|
1066
|
+
header_samples = []
|
|
1067
|
+
in_data = False
|
|
1068
|
+
# 用于从SOFT格式平台表提取基因符号
|
|
1069
|
+
platform_probe_map = {}
|
|
1070
|
+
in_platform_table = False
|
|
1071
|
+
platform_header_parsed = False
|
|
1072
|
+
platform_id_col_idx = None
|
|
1073
|
+
platform_gene_col_idx = None
|
|
1074
|
+
|
|
1075
|
+
with open_func(file_path, mode, encoding='utf-8', errors='replace') as f:
|
|
1076
|
+
for line in f:
|
|
1077
|
+
line = line.strip()
|
|
1078
|
+
|
|
1079
|
+
# SOFT 格式平台表
|
|
1080
|
+
if line.startswith('!platform_table_begin'):
|
|
1081
|
+
in_platform_table = True
|
|
1082
|
+
platform_header_parsed = False
|
|
1083
|
+
continue
|
|
1084
|
+
if line.startswith('!platform_table_end'):
|
|
1085
|
+
in_platform_table = False
|
|
1086
|
+
continue
|
|
1087
|
+
|
|
1088
|
+
if in_platform_table:
|
|
1089
|
+
if not line or line.startswith('#') or line.startswith('!'):
|
|
1090
|
+
continue
|
|
1091
|
+
parts = [p.strip('"').strip() for p in line.split('\t')]
|
|
1092
|
+
if not platform_header_parsed:
|
|
1093
|
+
# 解析表头,找 ID 和 Gene Symbol 列
|
|
1094
|
+
lower_parts = [p.lower() for p in parts]
|
|
1095
|
+
gene_symbol_patterns = [
|
|
1096
|
+
"gene symbol", "gene_symbol", "genesymbol",
|
|
1097
|
+
"gene assignment", "gene_assignment",
|
|
1098
|
+
"symbol", "gene title", "gene_title",
|
|
1099
|
+
"GENE_SYMBOL", "Gene Symbol"
|
|
1100
|
+
]
|
|
1101
|
+
for idx, lp in enumerate(lower_parts):
|
|
1102
|
+
if lp in ("id", "probe_id", "id_ref"):
|
|
1103
|
+
platform_id_col_idx = idx
|
|
1104
|
+
for pattern in gene_symbol_patterns:
|
|
1105
|
+
if pattern in lp:
|
|
1106
|
+
platform_gene_col_idx = idx
|
|
1107
|
+
break
|
|
1108
|
+
platform_header_parsed = True
|
|
1109
|
+
continue
|
|
1110
|
+
|
|
1111
|
+
# 数据行
|
|
1112
|
+
if platform_id_col_idx is not None and platform_gene_col_idx is not None:
|
|
1113
|
+
if platform_id_col_idx < len(parts) and platform_gene_col_idx < len(parts):
|
|
1114
|
+
probe_id = parts[platform_id_col_idx]
|
|
1115
|
+
gene_field = parts[platform_gene_col_idx]
|
|
1116
|
+
gene_symbol = self._parse_gene_symbol(gene_field)
|
|
1117
|
+
if gene_symbol:
|
|
1118
|
+
platform_probe_map[probe_id] = gene_symbol
|
|
1119
|
+
continue
|
|
1120
|
+
|
|
1121
|
+
if line.startswith('!series_matrix_table_begin') or line.startswith('!sample_table_begin'):
|
|
1122
|
+
in_data = True
|
|
1123
|
+
continue
|
|
1124
|
+
if line.startswith('!series_matrix_table_end') or line.startswith('!sample_table_end'):
|
|
1125
|
+
break
|
|
1126
|
+
|
|
1127
|
+
if not in_data:
|
|
1128
|
+
# 解析元数据
|
|
1129
|
+
if line.startswith('!Sample_title'):
|
|
1130
|
+
parts = line.split('\t')
|
|
1131
|
+
if len(parts) > 1:
|
|
1132
|
+
metadata['_titles'] = [p.strip('"') for p in parts[1:]]
|
|
1133
|
+
|
|
1134
|
+
elif line.startswith('!Sample_geo_accession'):
|
|
1135
|
+
parts = line.split('\t')
|
|
1136
|
+
if len(parts) > 1:
|
|
1137
|
+
metadata['_accessions'] = [p.strip('"') for p in parts[1:]]
|
|
1138
|
+
|
|
1139
|
+
elif line.startswith('!Sample_source_name_ch1'):
|
|
1140
|
+
parts = line.split('\t')
|
|
1141
|
+
if len(parts) > 1:
|
|
1142
|
+
metadata['_source_names'] = [p.strip('"') for p in parts[1:]]
|
|
1143
|
+
|
|
1144
|
+
elif line.startswith('!Sample_characteristics_ch1'):
|
|
1145
|
+
# characteristics 可能有多行,需要合并
|
|
1146
|
+
parts = line.split('\t')
|
|
1147
|
+
if len(parts) > 1:
|
|
1148
|
+
char_values = [p.strip('"') for p in parts[1:]]
|
|
1149
|
+
if '_characteristics_list' not in metadata:
|
|
1150
|
+
metadata['_characteristics_list'] = {}
|
|
1151
|
+
for i, cv in enumerate(char_values):
|
|
1152
|
+
if i not in metadata['_characteristics_list']:
|
|
1153
|
+
metadata['_characteristics_list'][i] = []
|
|
1154
|
+
metadata['_characteristics_list'][i].append(cv)
|
|
1155
|
+
|
|
1156
|
+
elif line.startswith('!Sample_group'):
|
|
1157
|
+
parts = line.split('\t')
|
|
1158
|
+
if len(parts) > 1:
|
|
1159
|
+
metadata['_groups'] = [p.strip('"') for p in parts[1:]]
|
|
1160
|
+
|
|
1161
|
+
elif line.startswith('!Sample_platform_id') or line.startswith('!Series_platform_id'):
|
|
1162
|
+
parts = line.split('\t')
|
|
1163
|
+
if len(parts) > 1:
|
|
1164
|
+
metadata['platform'] = parts[1].strip('"')
|
|
1165
|
+
|
|
1166
|
+
else:
|
|
1167
|
+
# 数据行
|
|
1168
|
+
if line.startswith('!') or line.startswith('#') or not line:
|
|
1169
|
+
continue
|
|
1170
|
+
# 去掉引号后检查 ID_REF
|
|
1171
|
+
unquoted = line.strip('"')
|
|
1172
|
+
if unquoted.startswith('ID_REF'):
|
|
1173
|
+
# 表头行
|
|
1174
|
+
parts = line.split('\t')
|
|
1175
|
+
header_samples = [p.strip('"') for p in parts[1:]]
|
|
1176
|
+
continue
|
|
1177
|
+
data_lines.append(line)
|
|
1178
|
+
|
|
1179
|
+
# 构建 sample metadata(合并多行 characteristics)
|
|
1180
|
+
accessions = metadata.get('_accessions', [])
|
|
1181
|
+
titles = metadata.get('_titles', [])
|
|
1182
|
+
source_names = metadata.get('_source_names', [])
|
|
1183
|
+
groups = metadata.get('_groups', [])
|
|
1184
|
+
char_lists = metadata.get('_characteristics_list', {})
|
|
1185
|
+
|
|
1186
|
+
sample_metadata = {}
|
|
1187
|
+
for i, acc in enumerate(accessions):
|
|
1188
|
+
# 合并该样本的所有 characteristics 行
|
|
1189
|
+
merged_chars = '; '.join(char_lists.get(i, []))
|
|
1190
|
+
sample_metadata[acc] = {
|
|
1191
|
+
"title": titles[i] if i < len(titles) else "",
|
|
1192
|
+
"characteristics": merged_chars,
|
|
1193
|
+
"source_name": source_names[i] if i < len(source_names) else "",
|
|
1194
|
+
"group": groups[i] if i < len(groups) else ""
|
|
1195
|
+
}
|
|
1196
|
+
|
|
1197
|
+
# 解析表达矩阵
|
|
1198
|
+
if not data_lines or not header_samples:
|
|
1199
|
+
return APIResponse(
|
|
1200
|
+
success=False, data=None, source=self.source_name,
|
|
1201
|
+
endpoint="parse_series_matrix",
|
|
1202
|
+
params={"file_path": file_path}, timestamp="",
|
|
1203
|
+
error="无法解析表达数据"
|
|
1204
|
+
)
|
|
1205
|
+
|
|
1206
|
+
# 构建 DataFrame
|
|
1207
|
+
rows = []
|
|
1208
|
+
gene_ids = []
|
|
1209
|
+
for line in data_lines:
|
|
1210
|
+
parts = line.split('\t')
|
|
1211
|
+
gene_id = parts[0].strip('"')
|
|
1212
|
+
values = []
|
|
1213
|
+
for v in parts[1:]:
|
|
1214
|
+
v = v.strip('"')
|
|
1215
|
+
try:
|
|
1216
|
+
values.append(float(v))
|
|
1217
|
+
except ValueError:
|
|
1218
|
+
values.append(float('nan'))
|
|
1219
|
+
gene_ids.append(gene_id)
|
|
1220
|
+
rows.append(values)
|
|
1221
|
+
|
|
1222
|
+
df = pd.DataFrame(rows, index=gene_ids, columns=header_samples[:len(rows[0]) if rows else 0])
|
|
1223
|
+
|
|
1224
|
+
# === 探针 ID → 基因符号映射 ===
|
|
1225
|
+
mapping_stats = {
|
|
1226
|
+
"total_probes": len(df),
|
|
1227
|
+
"mapped_probes": 0,
|
|
1228
|
+
"unmapped_probes": 0,
|
|
1229
|
+
"unique_genes": 0,
|
|
1230
|
+
"platform_id": metadata.get('platform', ''),
|
|
1231
|
+
"mapping_applied": False
|
|
1232
|
+
}
|
|
1233
|
+
|
|
1234
|
+
platform_id = metadata.get('platform', '')
|
|
1235
|
+
|
|
1236
|
+
# 优先级1:SOFT文件内嵌的平台表映射(最可靠,因为它与数据完全对应)
|
|
1237
|
+
probe_map_to_use = None
|
|
1238
|
+
mapping_source = ""
|
|
1239
|
+
|
|
1240
|
+
if platform_probe_map:
|
|
1241
|
+
probe_map_to_use = platform_probe_map
|
|
1242
|
+
mapping_source = "soft_platform_table"
|
|
1243
|
+
|
|
1244
|
+
# 优先级2:外部提供的映射表
|
|
1245
|
+
if probe_map_to_use is None and probe_id_map:
|
|
1246
|
+
probe_map_to_use = probe_id_map
|
|
1247
|
+
mapping_source = "provided"
|
|
1248
|
+
|
|
1249
|
+
# 优先级3:自动下载平台注释
|
|
1250
|
+
if probe_map_to_use is None and platform_id:
|
|
1251
|
+
downloaded_map = self.build_probe_gene_map(platform_id, cache_dir=cache_dir)
|
|
1252
|
+
if downloaded_map:
|
|
1253
|
+
probe_map_to_use = downloaded_map
|
|
1254
|
+
mapping_source = "platform_annotation_download"
|
|
1255
|
+
|
|
1256
|
+
# 优先级4:从数据表结构推断基因符号列
|
|
1257
|
+
if probe_map_to_use is None:
|
|
1258
|
+
inferred_map = self._parse_gene_symbol_from_data_table(data_lines, header_samples)
|
|
1259
|
+
if inferred_map:
|
|
1260
|
+
probe_map_to_use = inferred_map
|
|
1261
|
+
mapping_source = "data_table_inference"
|
|
1262
|
+
|
|
1263
|
+
if probe_map_to_use:
|
|
1264
|
+
# 应用映射
|
|
1265
|
+
mapped_index = []
|
|
1266
|
+
unmapped_count = 0
|
|
1267
|
+
for idx in df.index:
|
|
1268
|
+
gene_symbol = probe_map_to_use.get(idx, "")
|
|
1269
|
+
if gene_symbol:
|
|
1270
|
+
mapped_index.append(gene_symbol)
|
|
1271
|
+
else:
|
|
1272
|
+
unmapped_count += 1
|
|
1273
|
+
mapped_index.append(None)
|
|
1274
|
+
|
|
1275
|
+
# 替换索引
|
|
1276
|
+
df.index = mapped_index
|
|
1277
|
+
|
|
1278
|
+
# 删除未映射的行
|
|
1279
|
+
unmapped_count_before = len(df)
|
|
1280
|
+
df = df[df.index.notna()]
|
|
1281
|
+
unmapped_count = unmapped_count_before - len(df)
|
|
1282
|
+
|
|
1283
|
+
# 多探针对同一基因:取均值
|
|
1284
|
+
duplicated_genes = df.index.duplicated(keep=False)
|
|
1285
|
+
if duplicated_genes.any():
|
|
1286
|
+
df = df.groupby(df.index).mean()
|
|
1287
|
+
|
|
1288
|
+
mapping_stats["mapped_probes"] = len(df)
|
|
1289
|
+
mapping_stats["unmapped_probes"] = unmapped_count
|
|
1290
|
+
mapping_stats["unique_genes"] = len(df)
|
|
1291
|
+
mapping_stats["mapping_applied"] = True
|
|
1292
|
+
mapping_stats["mapping_source"] = mapping_source
|
|
1293
|
+
else:
|
|
1294
|
+
# 无映射 — 行索引保持原始 probe ID
|
|
1295
|
+
mapping_stats["unmapped_probes"] = len(df)
|
|
1296
|
+
mapping_stats["mapping_applied"] = False
|
|
1297
|
+
|
|
1298
|
+
# 如果指定了目标基因,只保留目标基因
|
|
1299
|
+
if target_genes:
|
|
1300
|
+
available_genes = [g for g in target_genes if g in df.index]
|
|
1301
|
+
if available_genes:
|
|
1302
|
+
df = df.loc[available_genes]
|
|
1303
|
+
|
|
1304
|
+
return APIResponse(
|
|
1305
|
+
success=True,
|
|
1306
|
+
data={
|
|
1307
|
+
"expression_matrix": df,
|
|
1308
|
+
"sample_metadata": sample_metadata,
|
|
1309
|
+
"platform": metadata.get('platform', ''),
|
|
1310
|
+
"gene_count": len(df),
|
|
1311
|
+
"sample_count": len(df.columns),
|
|
1312
|
+
"accession": Path(file_path).stem.replace('_series_matrix.txt', ''),
|
|
1313
|
+
"probe_mapping_stats": mapping_stats
|
|
1314
|
+
},
|
|
1315
|
+
source=self.source_name,
|
|
1316
|
+
endpoint="parse_series_matrix",
|
|
1317
|
+
params={"file_path": file_path},
|
|
1318
|
+
timestamp=""
|
|
1319
|
+
)
|
|
1320
|
+
|
|
1321
|
+
except Exception as e:
|
|
1322
|
+
return APIResponse(
|
|
1323
|
+
success=False, data=None, source=self.source_name,
|
|
1324
|
+
endpoint="parse_series_matrix",
|
|
1325
|
+
params={"file_path": file_path}, timestamp="",
|
|
1326
|
+
error=f"解析错误: {str(e)}"
|
|
1327
|
+
)
|
|
1328
|
+
|
|
1329
|
+
def infer_sample_groups(
|
|
1330
|
+
self,
|
|
1331
|
+
sample_metadata: dict,
|
|
1332
|
+
disease: str
|
|
1333
|
+
) -> dict:
|
|
1334
|
+
"""
|
|
1335
|
+
从样本元数据推断 case/control 分组
|
|
1336
|
+
|
|
1337
|
+
策略(按优先级):
|
|
1338
|
+
1. group 标签直接分组
|
|
1339
|
+
2. characteristics 中包含 disease/healthy 关键词
|
|
1340
|
+
3. title + source_name 中包含 disease/normal/control 关键词
|
|
1341
|
+
4. 按位置前半/后半分组(最后手段)
|
|
1342
|
+
|
|
1343
|
+
Returns:
|
|
1344
|
+
{"disease": [sample_ids], "control": [sample_ids], "method": str}
|
|
1345
|
+
"""
|
|
1346
|
+
disease_samples = []
|
|
1347
|
+
control_samples = []
|
|
1348
|
+
unassigned_samples = []
|
|
1349
|
+
|
|
1350
|
+
disease_lower = disease.lower()
|
|
1351
|
+
# 疾病关键词:完整疾病名 + 单个词(长度>2)+ 通用癌症关键词
|
|
1352
|
+
disease_words = [w for w in disease_lower.split() if len(w) > 2]
|
|
1353
|
+
disease_keywords = [
|
|
1354
|
+
disease_lower, "tumor", "tumour", "cancer", "carcinoma",
|
|
1355
|
+
"adenocarcinoma", "malignant", "case", "patient"
|
|
1356
|
+
] + disease_words
|
|
1357
|
+
# 去重
|
|
1358
|
+
disease_keywords = list(dict.fromkeys(disease_keywords))
|
|
1359
|
+
|
|
1360
|
+
control_keywords = [
|
|
1361
|
+
"normal", "control", "healthy", "adjacent", "benign",
|
|
1362
|
+
"non-tumor", "non_tumor", "noncancer", "healthy volunteer",
|
|
1363
|
+
"non-neoplastic", "non_neoplastic", "parenchyma"
|
|
1364
|
+
]
|
|
1365
|
+
|
|
1366
|
+
for sample_id, meta in sample_metadata.items():
|
|
1367
|
+
# 构建完整文本(所有可用字段拼接)
|
|
1368
|
+
text_parts = [
|
|
1369
|
+
meta.get('title', ''),
|
|
1370
|
+
meta.get('characteristics', ''),
|
|
1371
|
+
meta.get('source_name', '')
|
|
1372
|
+
]
|
|
1373
|
+
text = ' '.join(text_parts).lower()
|
|
1374
|
+
group_label = meta.get('group', '').lower()
|
|
1375
|
+
|
|
1376
|
+
is_disease = any(kw in text for kw in disease_keywords)
|
|
1377
|
+
is_control = any(kw in text for kw in control_keywords)
|
|
1378
|
+
|
|
1379
|
+
# 也检查 group 标签
|
|
1380
|
+
if group_label:
|
|
1381
|
+
if not is_disease and any(kw in group_label for kw in disease_keywords):
|
|
1382
|
+
is_disease = True
|
|
1383
|
+
if not is_control and any(kw in group_label for kw in control_keywords):
|
|
1384
|
+
is_control = True
|
|
1385
|
+
|
|
1386
|
+
# 特殊处理:如果文本包含 disease 名但也被标记为 normal/adjacent,
|
|
1387
|
+
# 优先识别为 control(如 "breast cancer adjacent normal")
|
|
1388
|
+
if is_disease and is_control:
|
|
1389
|
+
# 检查是否更偏向 control
|
|
1390
|
+
control_indicators = ["adjacent", "normal", "benign", "non-tumor", "non-neoplastic"]
|
|
1391
|
+
if any(ci in text for ci in control_indicators):
|
|
1392
|
+
is_disease = False
|
|
1393
|
+
else:
|
|
1394
|
+
is_control = False
|
|
1395
|
+
|
|
1396
|
+
if is_disease and not is_control:
|
|
1397
|
+
disease_samples.append(sample_id)
|
|
1398
|
+
elif is_control and not is_disease:
|
|
1399
|
+
control_samples.append(sample_id)
|
|
1400
|
+
else:
|
|
1401
|
+
unassigned_samples.append(sample_id)
|
|
1402
|
+
|
|
1403
|
+
# 如果分组失败,尝试按位置分组
|
|
1404
|
+
if not disease_samples or not control_samples:
|
|
1405
|
+
all_samples = list(sample_metadata.keys())
|
|
1406
|
+
mid = len(all_samples) // 2
|
|
1407
|
+
if len(all_samples) >= 4:
|
|
1408
|
+
return {
|
|
1409
|
+
"disease": all_samples[:mid],
|
|
1410
|
+
"control": all_samples[mid:],
|
|
1411
|
+
"method": "positional",
|
|
1412
|
+
"warning": "无法从元数据推断分组,按位置前后分组(结果可能不准确)"
|
|
1413
|
+
}
|
|
1414
|
+
|
|
1415
|
+
return {
|
|
1416
|
+
"disease": disease_samples,
|
|
1417
|
+
"control": control_samples,
|
|
1418
|
+
"unassigned": unassigned_samples,
|
|
1419
|
+
"method": "metadata"
|
|
1420
|
+
}
|