PyPI - noscroll - Versions diffs - 0.1.1__tar.gz - Mend

noscroll 0.1.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (49) hide show

noscroll-0.1.1/.env.example +70 -0
noscroll-0.1.1/.gitignore +22 -0
noscroll-0.1.1/LICENSE +21 -0
noscroll-0.1.1/PKG-INFO +64 -0
noscroll-0.1.1/README.md +45 -0
noscroll-0.1.1/automation/.env.example +4 -0
noscroll-0.1.1/automation/README.md +134 -0
noscroll-0.1.1/automation/__init__.py +4 -0
noscroll-0.1.1/automation/__main__.py +6 -0
noscroll-0.1.1/automation/adapters/__init__.py +98 -0
noscroll-0.1.1/automation/agents.py +253 -0
noscroll-0.1.1/automation/config.py +39 -0
noscroll-0.1.1/automation/evals/__init__.py +110 -0
noscroll-0.1.1/automation/latest +1 -0
noscroll-0.1.1/automation/loop.py +419 -0
noscroll-0.1.1/automation/prompts/diagnostic.txt +24 -0
noscroll-0.1.1/automation/prompts/executor.txt +32 -0
noscroll-0.1.1/automation/prompts/fixer.txt +29 -0
noscroll-0.1.1/automation/tasks/__init__.py +95 -0
noscroll-0.1.1/prompts/system.txt +90 -0
noscroll-0.1.1/pyproject.toml +37 -0
noscroll-0.1.1/src/noscroll/__init__.py +3 -0
noscroll-0.1.1/src/noscroll/__main__.py +5 -0
noscroll-0.1.1/src/noscroll/cli.py +1120 -0
noscroll-0.1.1/src/noscroll/config.py +189 -0
noscroll-0.1.1/src/noscroll/crawler.py +676 -0
noscroll-0.1.1/src/noscroll/duration.py +312 -0
noscroll-0.1.1/src/noscroll/fetch.py +36 -0
noscroll-0.1.1/src/noscroll/hackernews.py +737 -0
noscroll-0.1.1/src/noscroll/llm.py +741 -0
noscroll-0.1.1/src/noscroll/opml.py +76 -0
noscroll-0.1.1/src/noscroll/rss.py +161 -0
noscroll-0.1.1/src/noscroll/runner.py +359 -0
noscroll-0.1.1/src/noscroll/utils.py +88 -0
noscroll-0.1.1/subscriptions/subscriptions.toml +184 -0
noscroll-0.1.1/tests/integration/__init__.py +1 -0
noscroll-0.1.1/tests/integration/conftest.py +47 -0
noscroll-0.1.1/tests/integration/test_cli_config.py +46 -0
noscroll-0.1.1/tests/integration/test_cli_run.py +215 -0
noscroll-0.1.1/tests/integration/test_real_run.py +164 -0
noscroll-0.1.1/tests/test_cli.py +600 -0
noscroll-0.1.1/tests/test_config.py +273 -0
noscroll-0.1.1/tests/test_duration.py +323 -0
noscroll-0.1.1/tests/test_hackernews.py +531 -0
noscroll-0.1.1/tests/test_llm.py +412 -0
noscroll-0.1.1/tests/test_opml.py +293 -0
noscroll-0.1.1/tests/test_rss.py +223 -0
noscroll-0.1.1/tests/test_runner.py +497 -0
noscroll-0.1.1/tests/test_utils.py +182 -0

noscroll-0.1.1/.env.example ADDED Viewed

@@ -0,0 +1,70 @@
+# NoScroll Configuration
+# All environment variables can also be set via CLI arguments.
+# Priority: CLI > Environment Variable > Config File > Default
+# =============================================================================
+# LLM Configuration (also available as CLI: --llm-api-url, --llm-api-key, etc.)
+# =============================================================================
+# LLM API Settings
+LLM_API_URL="https://api.openai.com/v1"    # CLI: --llm-api-url
+LLM_API_KEY=""                              # CLI: --llm-api-key
+LLM_MODEL="gpt-4o"                          # CLI: --llm-model
+LLM_SUMMARY_MODEL="gpt-4o-mini"             # CLI: --llm-summary-model
+LLM_API_MODE="chat"                         # CLI: --llm-api-mode (chat/completions/responses)
+# LLM Timeout & Concurrency
+LLM_TIMEOUT_MS=600000                       # CLI: --llm-timeout
+LLM_GLOBAL_CONCURRENCY=5                    # CLI: --llm-concurrency
+# =============================================================================
+# Paths (also available as CLI arguments)
+# =============================================================================
+SUBSCRIPTIONS_PATH="subscriptions/subscriptions.toml"  # CLI: --subscriptions
+SYSTEM_PROMPT_PATH="prompts/system.txt"                # CLI: --system-prompt
+LLM_LOG_PATH="logs/llm-trace.log"                      # CLI: --llm-log
+FEED_LOG_PATH="logs/feed-items.log"                    # CLI: --feed-log
+OUTPUT_DIR="outputs"
+# Config file path (optional - defaults to ~/.config/noscroll/config.toml)
+# NOSCROLL_CONFIG="/path/to/config.toml"
+# =============================================================================
+# Proxy (uses standard environment variables)
+# =============================================================================
+# NoScroll automatically uses standard proxy environment variables:
+#   HTTPS_PROXY, HTTP_PROXY, ALL_PROXY
+# Example:
+#   export HTTPS_PROXY="http://127.0.0.1:7890"
+#   export ALL_PROXY="socks5://127.0.0.1:1080"
+# =============================================================================
+# CLI-Specific Options (NOSCROLL_* prefix)
+# These map directly to `noscroll run` arguments
+# =============================================================================
+# Time Window
+# NOSCROLL_LAST="10d"                       # CLI: --last (e.g., 10d, 36h, 2w)
+# NOSCROLL_FROM=""                          # CLI: --from (RFC3339 or YYYY-MM-DD)
+# NOSCROLL_TO=""                            # CLI: --to (default: now)
+# Output Splitting
+# NOSCROLL_BUCKET=""                        # CLI: --bucket (day, hour, or duration)
+# NOSCROLL_NAME_TEMPLATE="{start:%Y-%m-%d}.md"  # CLI: --name-template
+# Output
+# NOSCROLL_OUT="./noscroll.md"              # CLI: --out
+# NOSCROLL_FORMAT="markdown"                # CLI: --format (markdown/json)
+# Source Filtering
+# NOSCROLL_SOURCE_TYPES="rss,web,hn"        # CLI: --source-types
+# LLM Request Options
+# NOSCROLL_SERIAL="false"                   # CLI: --serial
+# NOSCROLL_DELAY=0                          # CLI: --delay (ms)
+# NOSCROLL_LANG="en"                        # CLI: --lang (en, zh, ja, etc.)
+# Debug
+# NOSCROLL_DEBUG="false"                    # CLI: --debug
+# DEBUG="false"                             # Alternative debug flag

noscroll-0.1.1/.gitignore ADDED Viewed

@@ -0,0 +1,22 @@
+.env
+node_modules/
+output.json
+# VS Code
+.vscode/settings.json
+# Python
+.venv/
+__pycache__/
+*.pyc
+*.pyo
+*.egg-info/
+.pytest_cache/
+htmlcov/
+.coverage
+# Logs and crawled content
+logs/
+crawled/
+test_outputs/
+outputs/

noscroll-0.1.1/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2026 Yuxin
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

noscroll-0.1.1/PKG-INFO ADDED Viewed

@@ -0,0 +1,64 @@
+Metadata-Version: 2.4
+Name: noscroll
+Version: 0.1.1
+Summary: Pull, don't scroll. RSS aggregator with LLM-powered summarization.
+License-File: LICENSE
+Requires-Python: >=3.11
+Requires-Dist: feedparser>=6.0.0
+Requires-Dist: httpx[socks]>=0.27.0
+Requires-Dist: platformdirs>=4.0.0
+Requires-Dist: python-dotenv>=1.0.0
+Requires-Dist: pyyaml>=6.0.0
+Provides-Extra: crawler
+Requires-Dist: crawl4ai>=0.3.0; extra == 'crawler'
+Requires-Dist: pydantic>=2.0.0; extra == 'crawler'
+Provides-Extra: dev
+Requires-Dist: pytest-asyncio>=0.23.0; extra == 'dev'
+Requires-Dist: pytest>=8.0.0; extra == 'dev'
+Description-Content-Type: text/markdown
+# NoScroll - Pull, don't scroll
+[![Python](https://img.shields.io/badge/python-3.11%2B-blue.svg)](https://www.python.org/)
+[![License](https://img.shields.io/badge/license-MIT-green.svg)](LICENSE)
+[![CLI](https://img.shields.io/badge/interface-CLI-black.svg)](https://github.com/zhuanyongxigua/noscroll)
+[![Sources](https://img.shields.io/badge/sources-RSS%20%7C%20Web%20%7C%20HN-orange.svg)](https://github.com/zhuanyongxigua/noscroll)
+## What is NoScroll
+NoScroll is a Python CLI that pulls information from RSS feeds, web pages, and Hacker News, then uses an LLM to summarize and rank the most useful items.
+It is designed for a pull-based reading workflow: define sources once, run on schedule, read only the high-signal digest.
+## Installation
+```bash
+pipx install noscroll
+```
+## Ask Command
+Use natural language directly:
+```bash
+noscroll --env-file .env ask "Collect content from the past five days, one file per day"
+```
+This will generate daily digest files in `outputs/`.
+Example generated text:
+```markdown
+## AI (3)
+1) Off Grid: Running text/image/vision models offline on mobile | Value: 4/5 | Type: Practice
+- Conclusion: This open-source project demonstrates on-device multimodal inference on smartphones, with strong privacy and offline usability.
+- Why it matters: On-device AI can reduce privacy risk and cloud inference cost, and is a good fit for offline-first products.
+- Evidence links: https://github.com/alichherawalla/off-grid-mobile
+## Other News (2)
+4) uBlock rule: hide YouTube Shorts with one click | Value: 4/5 | Domain: Tech
+## Life & Health (2)
+6) AI avatars for rural healthcare support | Value: 3/5 | Domain: Health
+```
+## License
+MIT. See [LICENSE](LICENSE).

noscroll-0.1.1/README.md ADDED Viewed

@@ -0,0 +1,45 @@
+# NoScroll - Pull, don't scroll
+[![Python](https://img.shields.io/badge/python-3.11%2B-blue.svg)](https://www.python.org/)
+[![License](https://img.shields.io/badge/license-MIT-green.svg)](LICENSE)
+[![CLI](https://img.shields.io/badge/interface-CLI-black.svg)](https://github.com/zhuanyongxigua/noscroll)
+[![Sources](https://img.shields.io/badge/sources-RSS%20%7C%20Web%20%7C%20HN-orange.svg)](https://github.com/zhuanyongxigua/noscroll)
+## What is NoScroll
+NoScroll is a Python CLI that pulls information from RSS feeds, web pages, and Hacker News, then uses an LLM to summarize and rank the most useful items.
+It is designed for a pull-based reading workflow: define sources once, run on schedule, read only the high-signal digest.
+## Installation
+```bash
+pipx install noscroll
+```
+## Ask Command
+Use natural language directly:
+```bash
+noscroll --env-file .env ask "Collect content from the past five days, one file per day"
+```
+This will generate daily digest files in `outputs/`.
+Example generated text:
+```markdown
+## AI (3)
+1) Off Grid: Running text/image/vision models offline on mobile | Value: 4/5 | Type: Practice
+- Conclusion: This open-source project demonstrates on-device multimodal inference on smartphones, with strong privacy and offline usability.
+- Why it matters: On-device AI can reduce privacy risk and cloud inference cost, and is a good fit for offline-first products.
+- Evidence links: https://github.com/alichherawalla/off-grid-mobile
+## Other News (2)
+4) uBlock rule: hide YouTube Shorts with one click | Value: 4/5 | Domain: Tech
+## Life & Health (2)
+6) AI avatars for rural healthcare support | Value: 3/5 | Domain: Health
+```
+## License
+MIT. See [LICENSE](LICENSE).

noscroll-0.1.1/automation/.env.example ADDED Viewed

@@ -0,0 +1,4 @@
+ANTHROPIC_API_KEY=sk-ant-xxx
+ANTHROPIC_BASE_URL="https://<third-party-anthropic-compatible-endpoint>"
+ANTHROPIC_MODEL="claude-3-100k"
+ANTHROPIC_DEFAULT_HAIKU_MODEL="claude-3-100k"

noscroll-0.1.1/automation/README.md ADDED Viewed

@@ -0,0 +1,134 @@
+# NoScroll Automation Harness
+An automated **run → test → eval → fix** loop built on the Claude Agent SDK.
+This is an **agent harness** layer, separate from business logic in `src/`.
+## Directory Structure
+```
+automation/
+├── __init__.py          # Package entry
+├── __main__.py          # python -m automation
+├── loop.py              # Main loop: run → test → eval → fix → repeat
+├── config.py            # Configuration
+├── agents.py            # Claude Agent SDK agents (executor, diagnostic, fixer)
+├── tasks/               # Task/scenario definitions
+│   └── __init__.py      # Predefined tasks
+├── evals/               # Evaluation logic
+│   └── __init__.py      # Output validation
+├── prompts/             # System prompts (file-based for easy editing)
+│   ├── executor.txt     # Executor agent prompt
+│   ├── diagnostic.txt   # Diagnostic agent prompt
+│   └── fixer.txt        # Fixer agent prompt
+├── adapters/            # External tool adapters
+│   └── __init__.py      # pytest, ruff, git adapters
+└── artifacts/           # Loop outputs: logs, diffs, reports
+```
+## The Loop
+```
+┌─────────────────────────────────────────────────────────────┐
+│                     Start Task                               │
+└─────────────────────────────────────────────────────────────┘
+                            │
+                            ▼
+┌─────────────────────────────────────────────────────────────┐
+│  1. Execute: Translate instruction → Run noscroll command    │
+└─────────────────────────────────────────────────────────────┘
+                            │
+                            ▼
+┌─────────────────────────────────────────────────────────────┐
+│  2. Evaluate: Check output files, validate content           │
+└─────────────────────────────────────────────────────────────┘
+                            │
+                            ▼
+                    ┌───────────────┐
+                    │    Passed?    │
+                    └───────────────┘
+                      │           │
+                  Yes │           │ No
+                      ▼           ▼
+              ┌─────────────┐  ┌─────────────────────────────────┐
+              │   SUCCESS   │  │  3. Diagnose: Analyze failure    │
+              │   (break)   │  │     (describe phenomena only)    │
+              └─────────────┘  └─────────────────────────────────┘
+                                          │
+                                          ▼
+                               ┌─────────────────────────────────┐
+                               │  4. Fix: Apply code changes      │
+                               └─────────────────────────────────┘
+                                          │
+                                          ▼
+                                  ┌───────────────┐
+                                  │  Max loops?   │
+                                  └───────────────┘
+                                    │           │
+                                Yes │           │ No
+                                    ▼           ▼
+                              ┌─────────┐   (back to 1)
+                              │  FAIL   │
+                              └─────────┘
+```
+## Stop Conditions
+1. **Success**: Evaluation passes ✓
+2. **Max loops**: Reached iteration limit (default: 3)
+3. **Fix failed**: Fixer couldn't apply changes
+## Installation
+```bash
+# The Claude Agent SDK requires the Claude Code CLI
+pip install claude-agent-sdk
+```
+## Usage
+```bash
+# List available tasks
+python -m automation --list
+# Run a specific task
+python -m automation --task basic_run_5d
+# Run a suite
+python -m automation --suite basic
+# Custom task
+python -m automation --custom "运行 noscroll，获取过去 3 天的 HN 内容"
+# Options
+python -m automation --task basic_run_5d --max-loops 5
+python -m automation --task basic_run_5d --quiet
+```
+## Artifacts
+Each run produces artifacts in `automation/artifacts/<task_name>/`:
+- `loop_result.json` - Full iteration history
+- Output files from the noscroll command
+## Design Principles
+1. **Separation of concerns**: This is a harness layer, not business logic
+2. **File-based prompts**: Easy to edit and version control
+3. **Adapters for tools**: Clean interface to pytest, git, etc.
+4. **Artifacts tracking**: Every run produces traceable outputs
+## Why Not in `src/`?
+The `src/` layout convention keeps only publishable package code in `src/`.
+Automation tools, scripts, and harnesses belong at the project root level:
+```
+project/
+├── src/noscroll/     # Business logic (pip installable)
+├── tests/            # Unit/integration tests
+└── automation/       # Agent harness (development tool)
+```
+This keeps import paths clean and separates runtime code from development tooling.

noscroll-0.1.1/automation/__init__.py ADDED Viewed

@@ -0,0 +1,4 @@
+"""Automation harness for NoScroll using Claude Agent SDK.
+This package provides an automated run → test → eval → fix loop.
+"""

noscroll-0.1.1/automation/__main__.py ADDED Viewed

@@ -0,0 +1,6 @@
+"""Allow running automation as a module: python -m automation"""
+from .loop import main
+# Start the loop only when executed directly (python -m automation), not on import.
+if __name__ == "__main__":
+    main()

noscroll-0.1.1/automation/adapters/__init__.py ADDED Viewed

@@ -0,0 +1,98 @@
+"""Adapters for external tools (pytest, ruff, git)."""
+from __future__ import annotations
+import subprocess
+from dataclasses import dataclass
+from pathlib import Path
+from typing import Optional
+@dataclass
+class CommandResult:
+    """Outcome of a single external command invocation.
+    Groups the command line, its exit status and the captured output streams
+    so callers can inspect a run without touching ``subprocess`` directly.
+    """
+    # The command line rendered as one display string.
+    command: str
+    # Process exit status; run_command stores -1 when the command timed out
+    # or could not be run at all.
+    return_code: int
+    # Captured standard output as text.
+    stdout: str
+    # Captured standard error as text, or an error description when
+    # run_command could not complete the command.
+    stderr: str
+    # Overall pass/fail flag; run_command sets it to ``return_code == 0``.
+    success: bool
+def run_command(
+    command: list[str],
+    cwd: Optional[Path] = None,
+    timeout: int = 300,
+) -> CommandResult:
+    """Run an external command (argument list, no shell) and capture its output.
+    Timeouts and failures to run the command are reported through the returned
+    CommandResult (``return_code=-1``, ``success=False``) instead of raising.
+    Args:
+        command: Program and arguments, one list element per argument.
+        cwd: Working directory for the command; ``None`` keeps the current one.
+        timeout: Seconds to wait before the command is treated as timed out.
+    Returns:
+        A CommandResult holding the exit status and captured stdout/stderr text.
+    """
+    import shlex  # local import so this function brings its own dependency
+    # shlex.join quotes arguments containing spaces or shell metacharacters, so
+    # the recorded string is unambiguous; simple arguments are rendered exactly
+    # as a plain space-join would render them.
+    cmd_str = shlex.join(command)
+    try:
+        result = subprocess.run(
+            command,
+            cwd=str(cwd) if cwd else None,
+            capture_output=True,
+            text=True,
+            timeout=timeout,
+        )
+    except subprocess.TimeoutExpired:
+        return CommandResult(
+            command=cmd_str,
+            return_code=-1,
+            stdout="",
+            stderr=f"Command timed out after {timeout}s",
+            success=False,
+        )
+    except Exception as e:
+        # Deliberate best-effort boundary: any failure to run the command
+        # (missing executable, bad cwd, ...) becomes a failed result.
+        return CommandResult(
+            command=cmd_str,
+            return_code=-1,
+            stdout="",
+            stderr=str(e),
+            success=False,
+        )
+    return CommandResult(
+        command=cmd_str,
+        return_code=result.returncode,
+        stdout=result.stdout,
+        stderr=result.stderr,
+        success=result.returncode == 0,
+    )
+def run_pytest(
+    test_path: Optional[Path] = None,
+    cwd: Optional[Path] = None,
+    args: Optional[list[str]] = None,
+) -> CommandResult:
+    """Run pytest as ``<interpreter> -m pytest`` and return the command result.
+    Args:
+        test_path: File or directory to pass to pytest; omitted when ``None``.
+        cwd: Working directory for the pytest process.
+        args: Extra command-line arguments appended after ``test_path``.
+    Returns:
+        The CommandResult produced by run_command.
+    """
+    import sys  # local import so this function brings its own dependency
+    # Use the interpreter running this harness so pytest comes from the same
+    # environment; a bare "python" may be absent from PATH or point at another
+    # installation. Fall back to "python" if the interpreter path is unknown.
+    command = [sys.executable or "python", "-m", "pytest"]
+    if test_path:
+        command.append(str(test_path))
+    if args:
+        command.extend(args)
+    return run_command(command, cwd=cwd)
+def run_ruff(
+    path: Optional[Path] = None,
+    cwd: Optional[Path] = None,
+    fix: bool = False,
+) -> CommandResult:
+    """Run ``ruff check`` as ``<interpreter> -m ruff`` and return the command result.
+    Args:
+        path: File or directory to lint; ``"."`` is passed when ``None``.
+        cwd: Working directory for the ruff process.
+        fix: When true, pass ``--fix`` to ruff.
+    Returns:
+        The CommandResult produced by run_command.
+    """
+    import sys  # local import so this function brings its own dependency
+    # Use the interpreter running this harness so ruff comes from the same
+    # environment; a bare "python" may be absent from PATH or point at another
+    # installation. Fall back to "python" if the interpreter path is unknown.
+    command = [sys.executable or "python", "-m", "ruff", "check"]
+    if fix:
+        command.append("--fix")
+    command.append(str(path) if path else ".")
+    return run_command(command, cwd=cwd)
+def git_diff(cwd: Optional[Path] = None) -> CommandResult:
+    """Run ``git diff`` with no extra arguments in *cwd* and return the result."""
+    diff_cmd = ["git", "diff"]
+    return run_command(diff_cmd, cwd=cwd)
+def git_status(cwd: Optional[Path] = None) -> CommandResult:
+    """Run ``git status --porcelain`` in *cwd* and return the result."""
+    status_cmd = ["git", "status", "--porcelain"]
+    return run_command(status_cmd, cwd=cwd)