npm - @youhaozhao/cninfo-mcp - Versions diffs - 1.0.2 → 1.0.4 - Mend

@youhaozhao/cninfo-mcp 1.0.2 → 1.0.4

This diff shows the changes between publicly available versions of this package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in their respective public registries.

Files changed (8) hide show

package/LICENSE +21 -0
package/README.md +2 -0
package/bin/cninfo-mcp.js +12 -27
package/package.json +9 -7
package/python/__pycache__/spider.cpython-314.pyc +0 -0
package/python/mcp_server.py +156 -64
package/python/spider.py +203 -159
package/scripts/install-python-deps.js +56 -35

package/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2026 youhaozhao
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

package/README.md CHANGED Viewed

@@ -1,5 +1,7 @@
 # cninfo-mcp
+[![npm version](https://img.shields.io/npm/v/@youhaozhao/cninfo-mcp)](https://www.npmjs.com/package/@youhaozhao/cninfo-mcp)
 通过 MCP 协议查询和下载巨潮资讯网上市公司年报的工具，适用于 Claude Desktop。
 ## 使用方法

package/bin/cninfo-mcp.js CHANGED Viewed

@@ -1,23 +1,19 @@
 #!/usr/bin/env node
 /**
- * CNINFO MCP Server Launcher
- *
- * This script launches the Python MCP Server and handles stdio communication.
- * It automatically detects Python and installs dependencies if needed.
+ * 巨潮资讯 MCP 服务器启动器
+ * 自动检测 Python 并安装依赖，然后启动 Python MCP 服务器。
  */
 const { spawn } = require('child_process');
 const path = require('path');
 const fs = require('fs');
-// Configuration
+// 配置路径
 const PYTHON_SCRIPT = path.join(__dirname, '..', 'python', 'mcp_server.py');
 const PYTHON_REQUIREMENTS = path.join(__dirname, '..', 'python', 'requirements.txt');
-/**
- * Find Python executable
- */
+// 查找可用的 Python 可执行文件
 async function findPython() {
   const pythonCommands = ['python3', 'python', 'python3.12', 'python3.11', 'python3.10'];
@@ -28,7 +24,7 @@ async function findPython() {
         return cmd;
       }
     } catch (error) {
-      // Continue to next command
+      // 继续尝试下一个命令
     }
   }
@@ -38,9 +34,7 @@ async function findPython() {
   );
 }
-/**
- * Check and install Python dependencies
- */
+// 检查并安装 Python 依赖
 async function ensureDependencies(pythonCmd) {
   const requirementsPath = PYTHON_REQUIREMENTS;
@@ -50,10 +44,10 @@ async function ensureDependencies(pythonCmd) {
   }
   try {
-    // Check if mcp package is installed
+    // 检查 mcp 包是否已安装
     const checkResult = await spawnAsync(pythonCmd, ['-c', 'import mcp']);
   } catch (error) {
-    // Dependencies not installed, install them
+    // 未安装，执行安装
     console.error('Installing Python dependencies...');
     const installResult = await spawnAsync(pythonCmd, ['-m', 'pip', 'install', '-r', requirementsPath], {
       stdio: 'inherit'
@@ -70,9 +64,7 @@ async function ensureDependencies(pythonCmd) {
   }
 }
-/**
- * Spawn a process and return result
- */
+// 启动子进程并返回结果
 function spawnAsync(command, args, options = {}) {
   return new Promise((resolve, reject) => {
     const child = spawn(command, args, {
@@ -116,24 +108,18 @@ function spawnAsync(command, args, options = {}) {
   });
 }
-/**
- * Main execution
- */
 async function main() {
   try {
-    // Check if Python script exists
+    // 检查 Python 脚本是否存在
     if (!fs.existsSync(PYTHON_SCRIPT)) {
       console.error('Error: mcp_server.py not found at', PYTHON_SCRIPT);
       process.exit(1);
     }
-    // Find Python
     const pythonCmd = await findPython();
-    // Ensure dependencies are installed
     await ensureDependencies(pythonCmd);
-    // Launch MCP Server with stdio
+    // 启动 MCP 服务器
     console.error('巨潮资讯 MCP 服务器已启动，等待连接...');
     const child = spawn(pythonCmd, [PYTHON_SCRIPT], {
       stdio: 'inherit',
@@ -144,7 +130,7 @@ async function main() {
       }
     });
-    // Handle child process exit
+    // 处理子进程退出
     child.on('error', (error) => {
       console.error('Failed to start MCP Server:', error.message);
       process.exit(1);
@@ -160,5 +146,4 @@ async function main() {
   }
 }
-// Run
 main();

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@youhaozhao/cninfo-mcp",
-  "version": "1.0.2",
+  "version": "1.0.4",
   "description": "MCP Server for querying and downloading Chinese listed companies' annual reports from CNINFO (巨潮资讯网)",
   "keywords": [
     "mcp",
@@ -11,16 +11,17 @@
     "finance",
     "python"
   ],
-  "homepage": "https://github.com/youhaozhao/cninfo_mcp#readme",
+  "homepage": "https://github.com/youhaozhao/cninfo-mcp#readme",
   "repository": {
     "type": "git",
-    "url": "git+https://github.com/youhaozhao/cninfo_mcp.git"
+    "url": "git+https://github.com/youhaozhao/cninfo-mcp.git"
   },
   "bugs": {
-    "url": "https://github.com/youhaozhao/cninfo_mcp/issues"
+    "url": "https://github.com/youhaozhao/cninfo-mcp/issues"
   },
+  "license": "MIT",
   "bin": {
-    "cninfo-mcp": "./bin/cninfo-mcp.js"
+    "cninfo-mcp": "bin/cninfo-mcp.js"
   },
   "scripts": {
     "postinstall": "node scripts/install-python-deps.js",
@@ -46,6 +47,7 @@
     "bin/",
     "python/",
     "scripts/",
-    "README.md"
+    "README.md",
+    "LICENSE"
   ]
-}
+}

package/python/__pycache__/spider.cpython-314.pyc ADDED Viewed

Binary file

package/python/mcp_server.py CHANGED Viewed

@@ -1,31 +1,34 @@
 #!/usr/bin/env python3
 """
-CNINFO MCP Server
-Model Context Protocol server for querying and downloading annual reports from CNINFO
+巨潮资讯 MCP 服务器
+用于查询和下载 A 股年度报告的 MCP 工具服务
 """
 import os
 import sys
 from typing import Optional
-# Add current directory to path for imports
+# 将当前目录加入模块搜索路径
 sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
 from mcp.server import FastMCP
-from spider import query_annual_reports, download_annual_reports, saving_path
+from spider import (
+    query_annual_reports,
+    download_annual_reports,
+    query_prospectus,
+    download_prospectus,
+    saving_path,
+)
-# Create MCP server
+# 创建 MCP 服务器实例
 mcp = FastMCP(
     name="cninfo-server",
-    instructions="CNINFO annual reports server - Query and download Chinese listed companies' annual reports from cninfo.com.cn"
+    instructions="CNINFO annual reports server - Query and download Chinese listed companies' annual reports from cninfo.com.cn",
 )
 @mcp.tool()
-def query_annual_reports_tool(
-    stock_code: str,
-    year: Optional[int] = None
-) -> dict:
+def query_annual_reports_tool(stock_code: str, year: Optional[int] = None) -> dict:
     """
     Query annual reports for a Chinese listed company
@@ -46,57 +49,61 @@ def query_annual_reports_tool(
         if not reports:
             return {
-                'success': False,
-                'stock_code': stock_code,
-                'year': year,
-                'count': 0,
-                'reports': [],
-                'message': f'No annual reports found for stock {stock_code}' + (f' in year {year}' if year else '')
+                "success": False,
+                "stock_code": stock_code,
+                "year": year,
+                "count": 0,
+                "reports": [],
+                "message": f"No annual reports found for stock {stock_code}"
+                + (f" in year {year}" if year else ""),
             }
-        # Extract relevant information
+        # 提取关键字段
+        base_url = "https://static.cninfo.com.cn/"
         report_details = []
         for report in reports:
-            report_details.append({
-                'announcementTitle': report.get('announcementTitle', ''),
-                'announcementTime': report.get('announcementTime', ''),
-                'secCode': report.get('secCode', ''),
-                'secName': report.get('secName', ''),
-                'adjunctUrl': report.get('adjunctUrl', '')
-            })
+            adj = report.get("adjunctUrl", "")
+            report_details.append(
+                {
+                    "announcementTitle": report.get("announcementTitle", ""),
+                    "announcementTime": report.get("announcementTime", ""),
+                    "secCode": report.get("secCode", ""),
+                    "secName": report.get("secName", ""),
+                    "adjunctUrl": base_url + adj if adj else "",
+                }
+            )
         return {
-            'success': True,
-            'stock_code': stock_code,
-            'year': year,
-            'count': len(reports),
-            'reports': report_details,
-            'message': f'Found {len(reports)} annual report(s)' + (f' for year {year}' if year else '')
+            "success": True,
+            "stock_code": stock_code,
+            "year": year,
+            "count": len(reports),
+            "reports": report_details,
+            "message": f"Found {len(reports)} annual report(s)"
+            + (f" for year {year}" if year else ""),
         }
     except Exception as e:
         return {
-            'success': False,
-            'stock_code': stock_code,
-            'year': year,
-            'count': 0,
-            'reports': [],
-            'error': str(e),
-            'message': f'Error querying annual reports: {str(e)}'
+            "success": False,
+            "stock_code": stock_code,
+            "year": year,
+            "count": 0,
+            "reports": [],
+            "error": str(e),
+            "message": f"Error querying annual reports: {str(e)}",
         }
 @mcp.tool()
-def download_annual_reports_tool(
-    stock_code: str,
-    year: Optional[int] = None
-) -> dict:
+def download_annual_reports_tool(stock_code: str, year: Optional[int] = None, save_path: Optional[str] = None) -> dict:
     """
     Download annual reports for a Chinese listed company
     Args:
         stock_code: Stock code (e.g., '000888' for 峨眉山, '688777' for 中科德芯)
         year: Optional year to filter (e.g., 2024). If not provided, downloads all available years
+        save_path: Optional directory to save files (e.g., '/Users/me/reports'). Defaults to pdf/ in package directory
     Returns:
         Dictionary containing:
@@ -108,40 +115,125 @@ def download_annual_reports_tool(
         - message: Status message
     """
     try:
-        # Ensure download directory exists
-        os.makedirs(saving_path, exist_ok=True)
-        result = download_annual_reports(stock_code, year)
+        output_dir = save_path or saving_path
+        os.makedirs(output_dir, exist_ok=True)
-        # Add path information
-        result['stock_code'] = stock_code
-        result['year'] = year
+        result = download_annual_reports(stock_code, year, save_path=output_dir)
+        result["stock_code"] = stock_code
+        result["year"] = year
         return result
     except Exception as e:
         return {
-            'success': False,
-            'stock_code': stock_code,
-            'year': year,
-            'downloaded': 0,
-            'path': saving_path,
-            'error': str(e),
-            'message': f'Error downloading annual reports: {str(e)}'
+            "success": False,
+            "stock_code": stock_code,
+            "year": year,
+            "downloaded": 0,
+            "path": save_path or saving_path,
+            "error": str(e),
+            "message": f"Error downloading annual reports: {str(e)}",
         }
-@mcp.resource("annual-reports-list://{stock_code}")
-def get_annual_reports_list(stock_code: str) -> str:
+@mcp.tool()
+def query_prospectus_tool(stock_code: str) -> dict:
     """
-    Get a formatted list of annual reports for a stock code
+    Query prospectus documents for a Chinese listed company
     Args:
-        stock_code: Stock code (e.g., '000888')
+        stock_code: Stock code (e.g., '000888' for 峨眉山, '688777' for 中科德芯)
     Returns:
-        Formatted string with annual reports information
+        Dictionary containing:
+        - success: Boolean indicating if the query was successful
+        - stock_code: The queried stock code
+        - count: Number of documents found
+        - reports: List of document details (announcementTitle, announcementTime, secCode, secName)
     """
+    try:
+        reports = query_prospectus(stock_code)
+        if not reports:
+            return {
+                "success": False,
+                "stock_code": stock_code,
+                "count": 0,
+                "reports": [],
+                "message": f"No prospectus found for stock {stock_code}",
+            }
+        base_url = "https://static.cninfo.com.cn/"
+        report_details = [
+            {
+                "announcementTitle": r.get("announcementTitle", ""),
+                "announcementTime": r.get("announcementTime", ""),
+                "secCode": r.get("secCode", ""),
+                "secName": r.get("secName", ""),
+                "adjunctUrl": base_url + r.get("adjunctUrl", "") if r.get("adjunctUrl") else "",
+            }
+            for r in reports
+        ]
+        return {
+            "success": True,
+            "stock_code": stock_code,
+            "count": len(reports),
+            "reports": report_details,
+            "message": f"Found {len(reports)} prospectus document(s)",
+        }
+    except Exception as e:
+        return {
+            "success": False,
+            "stock_code": stock_code,
+            "count": 0,
+            "reports": [],
+            "error": str(e),
+            "message": f"Error querying prospectus: {str(e)}",
+        }
+@mcp.tool()
+def download_prospectus_tool(stock_code: str, save_path: Optional[str] = None) -> dict:
+    """
+    Download prospectus documents for a Chinese listed company
+    Args:
+        stock_code: Stock code (e.g., '000888' for 峨眉山, '688777' for 中科德芯)
+        save_path: Optional directory to save files (e.g., '/Users/me/reports'). Defaults to pdf/ in package directory
+    Returns:
+        Dictionary containing:
+        - success: Boolean indicating if download was successful
+        - stock_code: The stock code
+        - downloaded: Number of files downloaded
+        - path: Directory where files were saved
+        - message: Status message
+    """
+    try:
+        output_dir = save_path or saving_path
+        os.makedirs(output_dir, exist_ok=True)
+        result = download_prospectus(stock_code, save_path=output_dir)
+        result["stock_code"] = stock_code
+        return result
+    except Exception as e:
+        return {
+            "success": False,
+            "stock_code": stock_code,
+            "downloaded": 0,
+            "path": save_path or saving_path,
+            "error": str(e),
+            "message": f"Error downloading prospectus: {str(e)}",
+        }
+@mcp.resource("annual-reports-list://{stock_code}")
+def get_annual_reports_list(stock_code: str) -> str:
+    """返回指定股票代码的年度报告格式化列表"""
     try:
         reports = query_annual_reports(stock_code)
@@ -151,9 +243,9 @@ def get_annual_reports_list(stock_code: str) -> str:
         output = [f"Annual Reports for {stock_code}:", "=" * 60]
         for report in reports:
-            title = report.get('announcementTitle', 'N/A')
-            time = report.get('announcementTime', 'N/A')
-            name = report.get('secName', 'N/A')
+            title = report.get("announcementTitle", "N/A")
+            time = report.get("announcementTime", "N/A")
+            name = report.get("secName", "N/A")
             output.append(f"\n📄 {title}")
             output.append(f"   Company: {name}")
             output.append(f"   Date: {time}")
@@ -168,5 +260,5 @@ def get_annual_reports_list(stock_code: str) -> str:
 if __name__ == "__main__":
-    # Run the server with stdio transport
+    # 以 stdio 方式运行服务器
     mcp.run()

package/python/spider.py CHANGED Viewed

@@ -1,17 +1,17 @@
 """
-    downloads:
-    公开招股书（招股说明书/招股意向书）
-    《年度报告》 16 17 18
+从巨潮资讯下载年度报告和招股书
 """
 import os
 import random
 import time
 import requests
-download_path = 'https://static.cninfo.com.cn/'
+download_path = "https://static.cninfo.com.cn/"
 # 使用脚本所在目录的相对路径
-_saving_path = os.path.join(os.path.dirname(os.path.abspath(__file__)), 'pdf')
-saving_path = _saving_path + '/'
+_saving_path = os.path.join(os.path.dirname(os.path.abspath(__file__)), "pdf")
+saving_path = _saving_path + "/"
 User_Agent = [
     "Mozilla/5.0 (compatible; MSIE 9.0; Windows NT 6.1; Win64; x64; Trident/5.0; .NET CLR 3.5.30729; .NET CLR 3.0.30729; .NET CLR 2.0.50727; Media Center PC 6.0)",
@@ -20,169 +20,169 @@ User_Agent = [
     "Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN) AppleWebKit/523.15 (KHTML, like Gecko, Safari/419.3) Arora/0.3 (Change: 287 c9dfb30)",
     "Mozilla/5.0 (X11; U; Linux; en-US) AppleWebKit/527+ (KHTML, like Gecko, Safari/419.3) Arora/0.6",
     "Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.8.1.2pre) Gecko/20070215 K-Ninja/2.1.1",
-    "Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9) Gecko/20080705 Firefox/3.0 Kapiko/3.0"
+    "Mozilla/5.0 (Windows; U; Windows NT 5.1; zh-CN; rv:1.9) Gecko/20080705 Firefox/3.0 Kapiko/3.0",
 ]
-headers = {'Accept': 'application/json, text/javascript, */*; q=0.01',
-           "Content-Type": "application/x-www-form-urlencoded; charset=UTF-8",
-           "Accept-Encoding": "gzip, deflate",
-           "Accept-Language": "zh-CN,zh;q=0.9,en-US;q=0.8,en;q=0.7,zh-HK;q=0.6,zh-TW;q=0.5",
-           'Host': 'www.cninfo.com.cn',
-           'Origin': 'http://www.cninfo.com.cn',
-           'Referer': 'http://www.cninfo.com.cn/new/commonUrl?url=disclosure/list/notice',
-           'X-Requested-With': 'XMLHttpRequest'
-           }
+headers = {
+    "Accept": "application/json, text/javascript, */*; q=0.01",
+    "Content-Type": "application/x-www-form-urlencoded; charset=UTF-8",
+    "Accept-Encoding": "gzip, deflate",
+    "Accept-Language": "zh-CN,zh;q=0.9,en-US;q=0.8,en;q=0.7,zh-HK;q=0.6,zh-TW;q=0.5",
+    "Host": "www.cninfo.com.cn",
+    "Origin": "http://www.cninfo.com.cn",
+    "Referer": "http://www.cninfo.com.cn/new/commonUrl?url=disclosure/list/notice",
+    "X-Requested-With": "XMLHttpRequest",
+}
 # 深市 年度报告
 def szseAnnual(page, stock):
-    query_path = 'http://www.cninfo.com.cn/new/hisAnnouncement/query'
-    headers['User-Agent'] = random.choice(User_Agent)  # 定义User_Agent
-    query = {'pageNum': page,  # 页码
-             'pageSize': 30,
-             'tabName': 'fulltext',
-             'column': 'szse',  # 深交所
-             'stock': '',
-             'searchkey': stock,  # 使用searchkey查询股票代码或公司名
-             'secid': '',
-             'plate': 'sz',
-             'category': 'category_ndbg_szsh',  # 年度报告
-             'trade': '',
-             'seDate': '2020-01-01~2026-02-15'  # 时间区间
-             }
+    query_path = "http://www.cninfo.com.cn/new/hisAnnouncement/query"
+    headers["User-Agent"] = random.choice(User_Agent)  # 定义User_Agent
+    query = {
+        "pageNum": page,  # 页码
+        "pageSize": 30,
+        "tabName": "fulltext",
+        "column": "szse",  # 深交所
+        "stock": "",
+        "searchkey": stock,  # 使用searchkey查询股票代码或公司名
+        "secid": "",
+        "plate": "sz",
+        "category": "category_ndbg_szsh",  # 年度报告
+        "trade": "",
+        "seDate": "2020-01-01~2026-02-15",  # 时间区间
+    }
     namelist = requests.post(query_path, headers=headers, data=query)
     result = namelist.json()
-    if result and 'announcements' in result and result['announcements']:
-        return result['announcements']
+    if result and "announcements" in result and result["announcements"]:
+        return result["announcements"]
     return []
 # 沪市 年度报告
 def sseAnnual(page, stock):
-    query_path = 'http://www.cninfo.com.cn/new/hisAnnouncement/query'
-    headers['User-Agent'] = random.choice(User_Agent)  # 定义User_Agent
-    query = {'pageNum': page,  # 页码
-             'pageSize': 30,
-             'tabName': 'fulltext',
-             'column': 'sse',
-             'stock': '',
-             'searchkey': stock,  # 使用searchkey查询股票代码或公司名
-             'secid': '',
-             'plate': 'sh',
-             'category': 'category_ndbg_szsh',  # 年度报告
-             'trade': '',
-             'seDate': '2020-01-01~2026-02-15'  # 时间区间
-             }
+    query_path = "http://www.cninfo.com.cn/new/hisAnnouncement/query"
+    headers["User-Agent"] = random.choice(User_Agent)  # 定义User_Agent
+    query = {
+        "pageNum": page,  # 页码
+        "pageSize": 30,
+        "tabName": "fulltext",
+        "column": "sse",
+        "stock": "",
+        "searchkey": stock,  # 使用searchkey查询股票代码或公司名
+        "secid": "",
+        "plate": "sh",
+        "category": "category_ndbg_szsh",  # 年度报告
+        "trade": "",
+        "seDate": "2020-01-01~2026-02-15",  # 时间区间
+    }
     namelist = requests.post(query_path, headers=headers, data=query)
     result = namelist.json()
-    if result and 'announcements' in result and result['announcements']:
-        return result['announcements']
+    if result and "announcements" in result and result["announcements"]:
+        return result["announcements"]
     return []
 # 深市 招股
 def szseStock(page, stock):
-    query_path = 'http://www.cninfo.com.cn/new/hisAnnouncement/query'
-    headers['User-Agent'] = random.choice(User_Agent)  # 定义User_Agent
-    query = {'pageNum': page,  # 页码
-             'pageSize': 30,
-             'tabName': 'fulltext',
-             'column': 'szse',
-             'stock': '',
-             'searchkey': stock + ' 招股',  # 组合搜索：股票代码 + 招股
-             'secid': '',
-             'plate': 'sz',
-             'category': '',
-             'trade': '',
-             'seDate': '2015-01-01~2026-02-15'  # 时间区间
-             }
+    query_path = "http://www.cninfo.com.cn/new/hisAnnouncement/query"
+    headers["User-Agent"] = random.choice(User_Agent)  # 定义User_Agent
+    query = {
+        "pageNum": page,  # 页码
+        "pageSize": 30,
+        "tabName": "fulltext",
+        "column": "szse",
+        "stock": "",
+        "searchkey": stock + " 招股",  # 组合搜索：股票代码 + 招股
+        "secid": "",
+        "plate": "sz",
+        "category": "",
+        "trade": "",
+        "seDate": "2015-01-01~2026-02-15",  # 时间区间
+    }
     namelist = requests.post(query_path, headers=headers, data=query)
     result = namelist.json()
-    if result and 'announcements' in result and result['announcements']:
-        return result['announcements']
+    if result and "announcements" in result and result["announcements"]:
+        return result["announcements"]
     return []
 # 沪市 招股
 def sseStock(page, stock):
-    query_path = 'http://www.cninfo.com.cn/new/hisAnnouncement/query'
-    headers['User-Agent'] = random.choice(User_Agent)  # 定义User_Agent
-    query = {'pageNum': page,  # 页码
-             'pageSize': 30,
-             'tabName': 'fulltext',
-             'column': 'sse',
-             'stock': '',
-             'searchkey': stock + ' 招股',  # 组合搜索：股票代码 + 招股
-             'secid': '',
-             'plate': 'sh',
-             'category': '',
-             'trade': '',
-             'seDate': '2015-01-01~2026-02-15'  # 时间区间
-             }
+    query_path = "http://www.cninfo.com.cn/new/hisAnnouncement/query"
+    headers["User-Agent"] = random.choice(User_Agent)  # 定义User_Agent
+    query = {
+        "pageNum": page,  # 页码
+        "pageSize": 30,
+        "tabName": "fulltext",
+        "column": "sse",
+        "stock": "",
+        "searchkey": stock + " 招股",  # 组合搜索：股票代码 + 招股
+        "secid": "",
+        "plate": "sh",
+        "category": "",
+        "trade": "",
+        "seDate": "2015-01-01~2026-02-15",  # 时间区间
+    }
     namelist = requests.post(query_path, headers=headers, data=query)
     result = namelist.json()
-    if result and 'announcements' in result and result['announcements']:
-        return result['announcements']
+    if result and "announcements" in result and result["announcements"]:
+        return result["announcements"]
     return []
-# download PDF
-def Download(single_page, year_filter=None):
-    """
-    Download PDF files from announcement list
-    Args:
-        single_page: List of announcement dictionaries
-        year_filter: Optional year to filter (e.g., 2024). If None, downloads all years
-    """
+def Download(single_page, year_filter=None, save_path=None):
+    """下载公告列表中的 PDF 文件"""
     if single_page is None:
         return
-    headers = {'Accept': 'application/json, text/javascript, */*; q=0.01',
-               "Content-Type": "application/x-www-form-urlencoded; charset=UTF-8",
-               "Accept-Encoding": "gzip, deflate",
-               "Accept-Language": "zh-CN,zh;q=0.9,en-US;q=0.8,en;q=0.7,zh-HK;q=0.6,zh-TW;q=0.5",
-               'Host': 'www.cninfo.com.cn',
-               'Origin': 'http://www.cninfo.com.cn'
-               }
+    headers = {
+        "Accept": "application/json, text/javascript, */*; q=0.01",
+        "Content-Type": "application/x-www-form-urlencoded; charset=UTF-8",
+        "Accept-Encoding": "gzip, deflate",
+        "Accept-Language": "zh-CN,zh;q=0.9,en-US;q=0.8,en;q=0.7,zh-HK;q=0.6,zh-TW;q=0.5",
+        "Host": "www.cninfo.com.cn",
+        "Origin": "http://www.cninfo.com.cn",
+    }
-    # Build allowed list dynamically based on year_filter
+    # 按年份筛选允许下载的标题
     allowed_list = []
     if year_filter:
         allowed_list = [
-            f'{year_filter}年年度报告（更新后）',
-            f'{year_filter}年年度报告',
+            f"{year_filter}年年度报告（更新后）",
+            f"{year_filter}年年度报告",
         ]
     else:
-        # Default: all years from 2016-2025
+        # 默认下载 2016-2025 年
         for year in range(2016, 2026):
-            allowed_list.append(f'{year}年年度报告（更新后）')
-            allowed_list.append(f'{year}年年度报告')
+            allowed_list.append(f"{year}年年度报告（更新后）")
+            allowed_list.append(f"{year}年年度报告")
     allowed_list_2 = [
-        '招股书',
-        '招股说明书',
-        '招股意向书',
+        "招股书",
+        "招股说明书",
+        "招股意向书",
     ]
+    output_dir = (save_path or saving_path).rstrip("/") + "/"
+    downloaded_count = 0
     for i in single_page:
-        title = i['announcementTitle']
+        title = i["announcementTitle"]
-        # 跳过确认意见等非正式报告
-        if '确认意见' in title or '取消' in title:
+        # 跳过确认意见、取消公告、摘要等非正文文件
+        if "确认意见" in title or "取消" in title or "摘要" in title:
             continue
-        # 检查标题是否包含允许的文本
+        # 检查标题是否精确匹配（避免"摘要"等变体被误下载）
         allowed = False
         for item in allowed_list:
-            if item in title:
+            if title == item:
                 allowed = True
                 break
@@ -194,102 +194,146 @@ def Download(single_page, year_filter=None):
         if allowed:
             download = download_path + i["adjunctUrl"]
-            name = i["secCode"] + '_' + i['secName'] + '_' + i['announcementTitle'] + '.pdf'
-            if '*' in name:
-                name = name.replace('*', '')
-            file_path = saving_path + name
+            name = (
+                i["secCode"]
+                + "_"
+                + i["secName"]
+                + "_"
+                + i["announcementTitle"]
+                + ".pdf"
+            )
+            if "*" in name:
+                name = name.replace("*", "")
+            file_path = output_dir + name
             # 显示下载进度
             print(f"  ↓ {name}")
             # 确保目录存在
-            os.makedirs(os.path.dirname(file_path), exist_ok=True)
+            os.makedirs(output_dir, exist_ok=True)
             time.sleep(random.random() * 2)
-            headers['User-Agent'] = random.choice(User_Agent)
+            headers["User-Agent"] = random.choice(User_Agent)
             r = requests.get(download)
             f = open(file_path, "wb")
             f.write(r.content)
             f.close()
+            downloaded_count += 1
         else:
             continue
-    return True
+    return downloaded_count
-def query_annual_reports(stock_code, year=None):
-    """
-    Query annual reports for a specific stock code
+def query_prospectus(stock_code):
+    """查询指定股票代码的招股书公告列表"""
+    all_announcements = []
+    try:
+        announcements_sse = sseStock(1, stock_code)
+        all_announcements.extend(announcements_sse)
+    except Exception as e:
+        print(f"沪市招股书查询失败: {e}")
+    try:
+        announcements_szse = szseStock(1, stock_code)
+        all_announcements.extend(announcements_szse)
+    except Exception as e:
+        print(f"深市招股书查询失败: {e}")
+    prospectus_keywords = ["招股书", "招股说明书", "招股意向书"]
+    filtered = [
+        a for a in all_announcements
+        if any(kw in a.get("announcementTitle", "") for kw in prospectus_keywords)
+    ]
-    Args:
-        stock_code: Stock code (e.g., '000888', '688777')
-        year: Optional year filter (e.g., 2024). If None, returns all years
+    return filtered
-    Returns:
-        List of announcement dictionaries
-    """
+def download_prospectus(stock_code, save_path=None):
+    """下载指定股票的招股书"""
+    announcements = query_prospectus(stock_code)
+    if not announcements:
+        return {
+            "success": False,
+            "message": f"未找到股票 {stock_code} 的招股书",
+            "downloaded": 0,
+        }
+    output_dir = save_path or saving_path
+    count = Download(announcements, save_path=output_dir)
+    downloaded = count or 0
+    return {
+        "success": downloaded > 0,
+        "message": f"已下载 {stock_code} 招股书，共 {downloaded} 个文件"
+        if downloaded > 0
+        else f"未下载任何文件（{stock_code} 招股书）",
+        "downloaded": downloaded,
+        "path": output_dir,
+    }
+def query_annual_reports(stock_code, year=None):
+    """查询指定股票的年度报告列表"""
     all_announcements = []
-    # Try SSE (Shanghai)
+    # 查询沪市
     try:
         announcements_sse = sseAnnual(1, stock_code)
         all_announcements.extend(announcements_sse)
     except Exception as e:
-        print(f"Error querying SSE: {e}")
+        print(f"沪市年报查询失败: {e}")
-    # Try SZSE (Shenzhen)
+    # 查询深市
     try:
         announcements_szse = szseAnnual(1, stock_code)
         all_announcements.extend(announcements_szse)
     except Exception as e:
-        print(f"Error querying SZSE: {e}")
+        print(f"深市年报查询失败: {e}")
-    # Filter by year if specified
+    # 按年份过滤
     if year:
         year_str = str(year)
         filtered = []
         for announcement in all_announcements:
-            if year_str in announcement.get('announcementTitle', ''):
+            if year_str in announcement.get("announcementTitle", ""):
                 filtered.append(announcement)
         all_announcements = filtered
     return all_announcements
-def download_annual_reports(stock_code, year=None):
-    """
-    Download annual reports for a specific stock code
-    Args:
-        stock_code: Stock code (e.g., '000888', '688777')
-        year: Optional year filter (e.g., 2024). If None, downloads all years
-    Returns:
-        Dictionary with status and message
-    """
+def download_annual_reports(stock_code, year=None, save_path=None):
+    """下载指定股票的年度报告"""
     announcements = query_annual_reports(stock_code, year)
     if not announcements:
         return {
-            'success': False,
-            'message': f'No annual reports found for stock {stock_code}' + (f' in year {year}' if year else ''),
-            'downloaded': 0
+            "success": False,
+            "message": f"未找到股票 {stock_code} 的年度报告"
+            + (f"（{year} 年）" if year else ""),
+            "downloaded": 0,
         }
-    # Download PDFs
-    result = Download(announcements, year_filter=year)
+    output_dir = save_path or saving_path
+    count = Download(announcements, year_filter=year, save_path=output_dir)
+    downloaded = count or 0
+    year_suffix = f"（{year} 年）" if year else ""
     return {
-        'success': result,
-        'message': f'Downloaded reports for {stock_code}' + (f' year {year}' if year else ''),
-        'downloaded': len(announcements),
-        'path': saving_path
+        "success": downloaded > 0,
+        "message": f"已下载 {stock_code} 年度报告{year_suffix}，共 {downloaded} 个文件"
+        if downloaded > 0
+        else f"未下载任何文件（{stock_code} 年度报告{year_suffix}）",
+        "downloaded": downloaded,
+        "path": output_dir,
     }
-# given page_number & stock number
 def Run(page_number, stock):
     try:
         annual_report = szseAnnual(page_number, stock)
@@ -297,19 +341,19 @@ def Run(page_number, stock):
         annual_report_ = sseAnnual(page_number, stock)
         stock_report_ = sseStock(page_number, stock)
     except Exception:
-        print(page_number, 'page error, retrying')
+        print(page_number, "page error, retrying")
         try:
             annual_report = szseAnnual(page_number, stock)
         except Exception:
-            print(page_number, 'page error')
+            print(page_number, "page error")
     Download(annual_report)
     Download(stock_report)
     Download(annual_report_)
     Download(stock_report_)
-if __name__ == '__main__':
-    with open('company_id.txt') as file:
+if __name__ == "__main__":
+    with open("company_id.txt") as file:
         lines = file.readlines()
         for line in lines:
             stock = line

package/scripts/install-python-deps.js CHANGED Viewed

@@ -1,28 +1,36 @@
 #!/usr/bin/env node
 /**
- * Post-install script to install Python dependencies
- * This runs automatically after `npm install`
+ * npm install 后自动安装 Python 依赖
  */
-const { spawn } = require('child_process');
-const fs = require('fs');
-const path = require('path');
+const { spawn } = require("child_process");
+const fs = require("fs");
+const path = require("path");
-const REQUIREMENTS_FILE = path.join(__dirname, '..', 'python', 'requirements.txt');
+const REQUIREMENTS_FILE = path.join(
+  __dirname,
+  "..",
+  "python",
+  "requirements.txt",
+);
 async function findPython() {
-  const pythonCommands = ['python3', 'python', 'python3.12', 'python3.11', 'python3.10'];
+  const pythonCommands = [
+    "python3",
+    "python",
+    "python3.12",
+    "python3.11",
+    "python3.10",
+  ];
   for (const cmd of pythonCommands) {
     try {
-      const result = await spawnCommand(cmd, ['--version']);
-      if (result.stdout && result.stdout.includes('Python')) {
+      const result = await spawnCommand(cmd, ["--version"]);
+      if (result.stdout && result.stdout.includes("Python")) {
         return cmd;
       }
-    } catch (error) {
-      // Continue
-    }
+    } catch (error) {}
   }
   return null;
@@ -30,51 +38,64 @@ async function findPython() {
 function spawnCommand(cmd, args) {
   return new Promise((resolve, reject) => {
-    const child = spawn(cmd, args, { stdio: 'pipe', shell: process.platform === 'win32' });
-    let stdout = '';
-    let stderr = '';
+    const child = spawn(cmd, args, {
+      stdio: "pipe",
+      shell: process.platform === "win32",
+    });
+    let stdout = "";
+    let stderr = "";
-    child.stdout?.on('data', (d) => stdout += d);
-    child.stderr?.on('data', (d) => stderr += d);
+    child.stdout?.on("data", (d) => (stdout += d));
+    child.stderr?.on("data", (d) => (stderr += d));
-    child.on('close', (code) => {
+    child.on("close", (code) => {
       if (code === 0) resolve({ stdout, stderr });
-      else reject(new Error(`Command failed: ${cmd} ${args.join(' ')}`));
+      else reject(new Error(`Command failed: ${cmd} ${args.join(" ")}`));
     });
-    child.on('error', reject);
+    child.on("error", reject);
   });
 }
 async function main() {
-  // Skip if requirements.txt doesn't exist
+  // requirements.txt 不存在则跳过
   if (!fs.existsSync(REQUIREMENTS_FILE)) {
-    console.log('⚠️  requirements.txt not found, skipping Python dependencies installation');
+    console.log(
+      "⚠️  requirements.txt not found, skipping Python dependencies installation",
+    );
     return;
   }
   const pythonCmd = await findPython();
   if (!pythonCmd) {
-    console.warn('⚠️  Python not found. Python dependencies will be installed on first run.');
-    console.warn('   Please install Python 3.10+ from https://python.org');
+    console.warn(
+      "⚠️  Python not found. Python dependencies will be installed on first run.",
+    );
+    console.warn("   Please install Python 3.10+ from https://python.org");
     return;
   }
   try {
-    // Check if mcp is already installed
-    await spawnCommand(pythonCmd, ['-c', 'import mcp']);
-    console.log('✅ Python dependencies already installed');
+    // 检查 mcp 是否已安装
+    await spawnCommand(pythonCmd, ["-c", "import mcp"]);
+    console.log("✅ Python dependencies already installed");
   } catch (error) {
-    // Install dependencies
-    console.log('📦 Installing Python dependencies...');
+    // 执行安装
+    console.log("📦 Installing Python dependencies...");
     try {
-      await spawnCommand(pythonCmd, ['-m', 'pip', 'install', '-r', REQUIREMENTS_FILE], {
-        stdio: 'inherit'
-      });
-      console.log('✅ Python dependencies installed successfully');
+      await spawnCommand(
+        pythonCmd,
+        ["-m", "pip", "install", "-r", REQUIREMENTS_FILE],
+        {
+          stdio: "inherit",
+        },
+      );
+      console.log("✅ Python dependencies installed successfully");
     } catch (installError) {
-      console.warn('⚠️  Failed to install Python dependencies during npm install');
-      console.warn('   They will be installed automatically on first run');
+      console.warn(
+        "⚠️  Failed to install Python dependencies during npm install",
+      );
+      console.warn("   They will be installed automatically on first run");
     }
   }
 }