PyPI - jarvis-ai-assistant - Versions diffs - 0.5.0__py3-none-any.whl → 0.6.0__py3-none-any.whl - Mend

jarvis-ai-assistant 0.5.0__py3-none-any.whl → 0.6.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (41) hide show

jarvis/__init__.py +1 -1
jarvis/jarvis_agent/__init__.py +114 -6
jarvis/jarvis_agent/agent_manager.py +3 -0
jarvis/jarvis_agent/jarvis.py +45 -9
jarvis/jarvis_agent/run_loop.py +6 -1
jarvis/jarvis_agent/task_planner.py +219 -0
jarvis/jarvis_c2rust/__init__.py +13 -0
jarvis/jarvis_c2rust/cli.py +405 -0
jarvis/jarvis_c2rust/collector.py +209 -0
jarvis/jarvis_c2rust/library_replacer.py +933 -0
jarvis/jarvis_c2rust/llm_module_agent.py +1265 -0
jarvis/jarvis_c2rust/scanner.py +1671 -0
jarvis/jarvis_c2rust/transpiler.py +1236 -0
jarvis/jarvis_code_agent/code_agent.py +151 -18
jarvis/jarvis_data/config_schema.json +13 -3
jarvis/jarvis_sec/README.md +180 -0
jarvis/jarvis_sec/__init__.py +674 -0
jarvis/jarvis_sec/checkers/__init__.py +33 -0
jarvis/jarvis_sec/checkers/c_checker.py +1269 -0
jarvis/jarvis_sec/checkers/rust_checker.py +367 -0
jarvis/jarvis_sec/cli.py +110 -0
jarvis/jarvis_sec/prompts.py +324 -0
jarvis/jarvis_sec/report.py +260 -0
jarvis/jarvis_sec/types.py +20 -0
jarvis/jarvis_sec/workflow.py +513 -0
jarvis/jarvis_tools/cli/main.py +1 -0
jarvis/jarvis_tools/execute_script.py +1 -1
jarvis/jarvis_tools/read_code.py +11 -1
jarvis/jarvis_tools/read_symbols.py +129 -0
jarvis/jarvis_tools/registry.py +9 -1
jarvis/jarvis_tools/sub_agent.py +4 -3
jarvis/jarvis_tools/sub_code_agent.py +3 -3
jarvis/jarvis_utils/config.py +28 -6
jarvis/jarvis_utils/git_utils.py +39 -0
jarvis/jarvis_utils/utils.py +150 -7
{jarvis_ai_assistant-0.5.0.dist-info → jarvis_ai_assistant-0.6.0.dist-info}/METADATA +13 -1
{jarvis_ai_assistant-0.5.0.dist-info → jarvis_ai_assistant-0.6.0.dist-info}/RECORD +41 -22
{jarvis_ai_assistant-0.5.0.dist-info → jarvis_ai_assistant-0.6.0.dist-info}/entry_points.txt +4 -0
{jarvis_ai_assistant-0.5.0.dist-info → jarvis_ai_assistant-0.6.0.dist-info}/WHEEL +0 -0
{jarvis_ai_assistant-0.5.0.dist-info → jarvis_ai_assistant-0.6.0.dist-info}/licenses/LICENSE +0 -0
{jarvis_ai_assistant-0.5.0.dist-info → jarvis_ai_assistant-0.6.0.dist-info}/top_level.txt +0 -0

jarvis/jarvis_sec/checkers/rust_checker.py ADDED Viewed

@@ -0,0 +1,367 @@
+# -*- coding: utf-8 -*-
+"""
+OpenHarmony 安全演进多Agent套件 —— Rust 启发式安全检查器（阶段一）
+目标与范围：
+- 聚焦 unsafe 使用、原始指针、错误处理、并发与 FFI 等基础安全问题。
+- 提供可解释的启发式检测与置信度评估，面向 .rs 源文件。
+输出约定：
+- 返回 jarvis.jarvis_sec.workflow.Issue 列表（结构化，便于聚合评分与报告生成）。
+- 置信度区间 [0,1]；严重性（severity）分为 high/medium/low。
+使用方式：
+- from jarvis.jarvis_sec.checkers.rust_checker import analyze_files
+- issues = analyze_files("./repo", ["src/lib.rs", "src/foo.rs"])
+"""
+from __future__ import annotations
+import re
+from pathlib import Path
+from typing import Iterable, List, Sequence, Tuple
+from jarvis.jarvis_sec.types import Issue
+# ---------------------------
+# 规则库（正则表达式）
+# ---------------------------
+RE_UNSAFE = re.compile(r"\bunsafe\b")
+RE_RAW_PTR = re.compile(r"\*(?:mut|const)\s+[A-Za-z_]\w*")  # 类型处的原始指针
+RE_FORGET = re.compile(r"\bmem::forget\b")
+RE_TRANSMUTE = re.compile(r"\bmem::transmute\b")
+RE_MAYBE_UNINIT = re.compile(r"\bMaybeUninit\b")
+RE_ASSUME_INIT = re.compile(r"\bassume_init\s*\(")
+RE_UNWRAP = re.compile(r"\bunwrap\s*\(", re.IGNORECASE)
+RE_EXPECT = re.compile(r"\bexpect\s*\(", re.IGNORECASE)
+RE_EXTERN_C = re.compile(r'extern\s+"C"')
+RE_UNSAFE_IMPL = re.compile(r"\bunsafe\s+impl\s+(?:Send|Sync)\b|\bimpl\s+unsafe\s+(?:Send|Sync)\b", re.IGNORECASE)
+# 结果忽略/下划线绑定（可能忽略错误）
+RE_LET_UNDERSCORE = re.compile(r"\blet\s+_+\s*=\s*.+;")
+RE_MATCH_IGNORE_ERR = re.compile(r"\.ok\s*\(\s*\)|\.ok\?\s*;|\._?\s*=\s*.+\.err\(\s*\)", re.IGNORECASE)  # 粗略
+# ---------------------------
+# 公共工具
+# ---------------------------
+def _safe_line(lines: Sequence[str], idx: int) -> str:
+    if 1 <= idx <= len(lines):
+        return lines[idx - 1]
+    return ""
+def _strip_line(s: str, max_len: int = 200) -> str:
+    s = s.strip().replace("\t", " ")
+    return s if len(s) <= max_len else s[: max_len - 3] + "..."
+def _window(lines: Sequence[str], center: int, before: int = 3, after: int = 3) -> List[Tuple[int, str]]:
+    start = max(1, center - before)
+    end = min(len(lines), center + after)
+    return [(i, _safe_line(lines, i)) for i in range(start, end + 1)]
+def _has_safety_comment_around(lines: Sequence[str], line_no: int, radius: int = 5) -> bool:
+    """
+    Rust 社区约定在 unsafe 附近写 SAFETY: 注释说明前置条件。
+    如存在，适当降低置信度。
+    """
+    for _, s in _window(lines, line_no, before=radius, after=radius):
+        if "SAFETY:" in s or "Safety:" in s or "safety:" in s:
+            return True
+    return False
+def _in_test_context(lines: Sequence[str], line_no: int, radius: int = 20) -> bool:
+    """
+    近邻出现 #[test] 或 mod tests { ... } 等，可能处于测试上下文，适度降低严重度。
+    """
+    for _, s in _window(lines, line_no, before=radius, after=radius):
+        if "#[test]" in s or re.search(r"\bmod\s+tests\b", s):
+            return True
+    return False
+def _severity_from_confidence(conf: float) -> str:
+    if conf >= 0.8:
+        return "high"
+    if conf >= 0.6:
+        return "medium"
+    return "low"
+# ---------------------------
+# 规则实现
+# ---------------------------
+def _rule_unsafe(lines: Sequence[str], relpath: str) -> List[Issue]:
+    issues: List[Issue] = []
+    for idx, s in enumerate(lines, start=1):
+        if not RE_UNSAFE.search(s):
+            continue
+        conf = 0.8
+        if _has_safety_comment_around(lines, idx, radius=5):
+            conf -= 0.1
+        if _in_test_context(lines, idx):
+            conf -= 0.05
+        conf = max(0.5, min(0.95, conf))
+        issues.append(
+            Issue(
+                language="rust",
+                category="unsafe_usage",
+                pattern="unsafe",
+                file=relpath,
+                line=idx,
+                evidence=_strip_line(s),
+                description="存在 unsafe 代码块/标识，需证明内存/别名/生命周期安全性。",
+                suggestion="将不安全操作封装在最小作用域内，并提供 SAFETY 注释说明前置条件与不变式。",
+                confidence=conf,
+                severity=_severity_from_confidence(conf),
+            )
+        )
+    return issues
+def _rule_raw_pointer(lines: Sequence[str], relpath: str) -> List[Issue]:
+    issues: List[Issue] = []
+    for idx, s in enumerate(lines, start=1):
+        if not RE_RAW_PTR.search(s):
+            continue
+        conf = 0.75
+        if _has_safety_comment_around(lines, idx):
+            conf -= 0.1
+        if _in_test_context(lines, idx):
+            conf -= 0.05
+        conf = max(0.5, min(0.9, conf))
+        issues.append(
+            Issue(
+                language="rust",
+                category="unsafe_usage",
+                pattern="raw_pointer",
+                file=relpath,
+                line=idx,
+                evidence=_strip_line(s),
+                description="出现原始指针（*mut/*const），可能绕过借用/生命周期检查，带来未定义行为风险。",
+                suggestion="优先使用引用/智能指针；必须使用原始指针时，严格证明无别名、对齐与生命周期安全。",
+                confidence=conf,
+                severity=_severity_from_confidence(conf),
+            )
+        )
+    return issues
+def _rule_transmute(lines: Sequence[str], relpath: str) -> List[Issue]:
+    issues: List[Issue] = []
+    for idx, s in enumerate(lines, start=1):
+        if not RE_TRANSMUTE.search(s):
+            continue
+        conf = 0.85
+        if _has_safety_comment_around(lines, idx):
+            conf -= 0.1
+        conf = max(0.6, min(0.95, conf))
+        issues.append(
+            Issue(
+                language="rust",
+                category="unsafe_usage",
+                pattern="mem::transmute",
+                file=relpath,
+                line=idx,
+                evidence=_strip_line(s),
+                description="使用 mem::transmute 进行类型转换，若未严格保证布局/对齐/生命周期，将导致未定义行为。",
+                suggestion="避免使用 transmute，优先采用安全转换或 bytemuck 等受审计抽象；必须使用时严格注明不变式。",
+                confidence=conf,
+                severity=_severity_from_confidence(conf),
+            )
+        )
+    return issues
+def _rule_maybe_uninit(lines: Sequence[str], relpath: str) -> List[Issue]:
+    """
+    MaybeUninit + assume_init 组合常见于优化/FFI，需特别小心初始化与有效性。
+    """
+    issues: List[Issue] = []
+    for idx, s in enumerate(lines, start=1):
+        if not (RE_MAYBE_UNINIT.search(s) or RE_ASSUME_INIT.search(s)):
+            continue
+        conf = 0.7
+        # 若在邻近几行同时出现 MaybeUninit 与 assume_init，风险更高
+        win_text = " ".join(t for _, t in _window(lines, idx, before=3, after=3))
+        if RE_MAYBE_UNINIT.search(win_text) and RE_ASSUME_INIT.search(win_text):
+            conf += 0.1
+        if _has_safety_comment_around(lines, idx):
+            conf -= 0.05
+        conf = max(0.5, min(0.9, conf))
+        issues.append(
+            Issue(
+                language="rust",
+                category="unsafe_usage",
+                pattern="MaybeUninit/assume_init",
+                file=relpath,
+                line=idx,
+                evidence=_strip_line(s),
+                description="使用 MaybeUninit/assume_init 需保证正确初始化与读取顺序，否则可能导致未定义行为。",
+                suggestion="确保初始化前不读取；使用更安全的构造函数；在 SAFETY 注释中说明前置条件。",
+                confidence=conf,
+                severity=_severity_from_confidence(conf),
+            )
+        )
+    return issues
+def _rule_unwrap_expect(lines: Sequence[str], relpath: str) -> List[Issue]:
+    issues: List[Issue] = []
+    for idx, s in enumerate(lines, start=1):
+        if not (RE_UNWRAP.search(s) or RE_EXPECT.search(s)):
+            continue
+        conf = 0.65
+        if _in_test_context(lines, idx):
+            conf -= 0.1
+        conf = max(0.45, min(0.8, conf))
+        issues.append(
+            Issue(
+                language="rust",
+                category="error_handling",
+                pattern="unwrap/expect",
+                file=relpath,
+                line=idx,
+                evidence=_strip_line(s),
+                description="直接 unwrap/expect 可能在错误条件下 panic，缺少健壮的错误处理路径。",
+                suggestion="使用 ? 传播错误或 match 显式处理；为关键路径提供错误上下文与恢复策略。",
+                confidence=conf,
+                severity=_severity_from_confidence(conf),
+            )
+        )
+    return issues
+def _rule_extern_c(lines: Sequence[str], relpath: str) -> List[Issue]:
+    issues: List[Issue] = []
+    for idx, s in enumerate(lines, start=1):
+        if not RE_EXTERN_C.search(s):
+            continue
+        conf = 0.7
+        if _has_safety_comment_around(lines, idx):
+            conf -= 0.05
+        conf = max(0.5, min(0.85, conf))
+        issues.append(
+            Issue(
+                language="rust",
+                category="ffi",
+                pattern='extern "C"',
+                file=relpath,
+                line=idx,
+                evidence=_strip_line(s),
+                description="FFI 边界需要确保指针有效性、长度/对齐、生命周期、线程安全等约束，否则可能产生未定义行为。",
+                suggestion="在 FFI 边界进行严格的参数校验与安全封装；在 SAFETY 注释中记录不变式与约束。",
+                confidence=conf,
+                severity=_severity_from_confidence(conf),
+            )
+        )
+    return issues
+def _rule_unsafe_impl(lines: Sequence[str], relpath: str) -> List[Issue]:
+    issues: List[Issue] = []
+    for idx, s in enumerate(lines, start=1):
+        if not RE_UNSAFE_IMPL.search(s):
+            continue
+        conf = 0.8
+        if _has_safety_comment_around(lines, idx):
+            conf -= 0.1
+        conf = max(0.6, min(0.95, conf))
+        issues.append(
+            Issue(
+                language="rust",
+                category="concurrency",
+                pattern="unsafe_impl_Send_or_Sync",
+                file=relpath,
+                line=idx,
+                evidence=_strip_line(s),
+                description="手写 unsafe impl Send/Sync 可能破坏并发内存模型保证，带来数据竞争风险。",
+                suggestion="避免手写 unsafe impl；必要时严格证明线程安全前置条件并最小化不安全区域。",
+                confidence=conf,
+                severity=_severity_from_confidence(conf),
+            )
+        )
+    return issues
+def _rule_ignore_result(lines: Sequence[str], relpath: str) -> List[Issue]:
+    """
+    启发式：使用 let _ = xxx; 或 .ok() 等可能忽略错误。
+    该规则误报可能较高，因此置信度较低。
+    """
+    issues: List[Issue] = []
+    for idx, s in enumerate(lines, start=1):
+        if not (RE_LET_UNDERSCORE.search(s) or RE_MATCH_IGNORE_ERR.search(s)):
+            continue
+        conf = 0.55
+        if _in_test_context(lines, idx):
+            conf -= 0.1
+        conf = max(0.4, min(0.7, conf))
+        issues.append(
+            Issue(
+                language="rust",
+                category="error_handling",
+                pattern="ignored_result",
+                file=relpath,
+                line=idx,
+                evidence=_strip_line(s),
+                description="可能忽略了返回的错误结果，导致失败未被处理。",
+                suggestion="显式处理 Result（? 传播或 match），确保错误路径涵盖资源回收与日志记录。",
+                confidence=conf,
+                severity=_severity_from_confidence(conf),
+            )
+        )
+    return issues
+# ---------------------------
+# 对外主入口
+# ---------------------------
+def analyze_rust_text(relpath: str, text: str) -> List[Issue]:
+    """
+    基于提供的文本进行 Rust 启发式分析。
+    """
+    lines = text.splitlines()
+    issues: List[Issue] = []
+    issues.extend(_rule_unsafe(lines, relpath))
+    issues.extend(_rule_raw_pointer(lines, relpath))
+    issues.extend(_rule_transmute(lines, relpath))
+    issues.extend(_rule_maybe_uninit(lines, relpath))
+    issues.extend(_rule_unwrap_expect(lines, relpath))
+    issues.extend(_rule_extern_c(lines, relpath))
+    issues.extend(_rule_unsafe_impl(lines, relpath))
+    issues.extend(_rule_ignore_result(lines, relpath))
+    return issues
+def analyze_rust_file(base: Path, relpath: Path) -> List[Issue]:
+    """
+    从磁盘读取文件进行分析。
+    """
+    try:
+        text = (base / relpath).read_text(errors="ignore")
+    except Exception:
+        return []
+    return analyze_rust_text(str(relpath), text)
+def analyze_files(base_path: str, files: Iterable[str]) -> List[Issue]:
+    """
+    批量分析文件，相对路径相对于 base_path。
+    """
+    base = Path(base_path).resolve()
+    out: List[Issue] = []
+    for f in files:
+        p = Path(f)
+        if p.suffix.lower() == ".rs":
+            out.extend(analyze_rust_file(base, p))
+    return out

jarvis/jarvis_sec/cli.py ADDED Viewed

@@ -0,0 +1,110 @@
+# -*- coding: utf-8 -*-
+"""
+OpenHarmony 安全演进套件 —— 命令行入口（Typer 版本）
+用法示例：
+- Agent模式（单Agent，逐条子任务分析）
+  python -m jarvis.jarvis_sec.cli agent --path ./target_project
+可选参数：
+- --output: 最终Markdown报告输出路径（默认 ./report.md）
+"""
+from __future__ import annotations
+import sys
+from pathlib import Path
+from typing import Optional
+import typer
+from jarvis.jarvis_utils.utils import init_env
+# removed: set_config import（避免全局覆盖模型组配置）
+from jarvis.jarvis_sec.workflow import run_with_multi_agent, run_security_analysis_fast
+app = typer.Typer(
+    add_completion=False,
+    no_args_is_help=True,
+    help="OpenHarmony 安全演进套件（单Agent逐条子任务分析）",
+)
+@app.command("agent", help="Agent模式（单Agent逐条子任务分析）")
+def agent(
+    path: str = typer.Option(..., "--path", "-p", help="待分析的根目录"),
+    llm_group: Optional[str] = typer.Option(
+        None, "--llm-group", "-g", help="使用的模型组（仅对本次运行生效，不修改全局配置）"
+    ),
+    output: Optional[str] = typer.Option(
+        "report.md", "--output", "-o", help="最终Markdown报告输出路径（默认 ./report.md）"
+    ),
+) -> None:
+    # 初始化环境，确保平台/模型等全局配置就绪（避免 NoneType 平台）
+    try:
+        init_env("欢迎使用 Jarvis-OpenHarmony 安全套件！", None)
+    except Exception:
+        # 环境初始化失败不应阻塞CLI基础功能，继续后续流程
+        pass
+    # 若指定了模型组：仅对本次运行生效，透传给 Agent；不修改全局配置（无需 set_config）
+    text: Optional[str] = None
+    try:
+        text = run_with_multi_agent(
+            path,
+            llm_group=llm_group,
+        )
+    except Exception as e:
+        try:
+            typer.secho(f"[jarvis_sec] Agent 分析过程出错，将回退到直扫基线（fast）：{e}", fg=typer.colors.YELLOW, err=True)
+        except Exception:
+            pass
+        text = None
+    if not text or not str(text).strip():
+        try:
+            typer.secho("[jarvis_sec] Agent 无输出，回退到直扫基线（fast）。", fg=typer.colors.YELLOW, err=True)
+        except Exception:
+            pass
+        text = run_security_analysis_fast(path)
+    if output:
+        try:
+            md_text = text or ""
+            try:
+                lines = (text or "").splitlines()
+                idx = -1
+                for i, ln in enumerate(lines):
+                    if ln.strip().startswith("# OpenHarmony 安全问题分析报告"):
+                        idx = i
+                        break
+                if idx >= 0:
+                    md_text = "\n".join(lines[idx:])
+            except Exception:
+                md_text = text or ""
+            p = Path(output)
+            p.parent.mkdir(parents=True, exist_ok=True)
+            p.write_text(md_text, encoding="utf-8")
+            try:
+                typer.secho(f"[jarvis_sec] Markdown 报告已写入: {p}", fg=typer.colors.GREEN)
+            except Exception:
+                pass
+        except Exception as e:
+            try:
+                typer.secho(f"[jarvis_sec] 写入Markdown报告失败: {e}", fg=typer.colors.RED, err=True)
+            except Exception:
+                pass
+    typer.echo(text)
+def main() -> int:
+    app()
+    return 0
+if __name__ == "__main__":
+    sys.exit(main())

jarvis-ai-assistant 0.5.0__py3-none-any.whl → 0.6.0__py3-none-any.whl

jarvis-ai-assistant 0.5.0__py3-none-any.whl → 0.6.0__py3-none-any.whl