crossref-local 0.4.0-py3-none-any.whl → 0.5.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (48)
  1. crossref_local/__init__.py +18 -10
  2. crossref_local/_aio/__init__.py +30 -0
  3. crossref_local/_aio/_impl.py +238 -0
  4. crossref_local/_cache/__init__.py +15 -0
  5. crossref_local/{cache_export.py → _cache/export.py} +27 -10
  6. crossref_local/_cache/utils.py +93 -0
  7. crossref_local/_cli/__init__.py +9 -0
  8. crossref_local/_cli/cli.py +512 -0
  9. crossref_local/_cli/mcp.py +351 -0
  10. crossref_local/_cli/mcp_server.py +413 -0
  11. crossref_local/_core/__init__.py +58 -0
  12. crossref_local/{api.py → _core/api.py} +24 -5
  13. crossref_local/{citations.py → _core/citations.py} +55 -26
  14. crossref_local/{config.py → _core/config.py} +40 -22
  15. crossref_local/{db.py → _core/db.py} +32 -26
  16. crossref_local/{fts.py → _core/fts.py} +18 -14
  17. crossref_local/{models.py → _core/models.py} +11 -6
  18. crossref_local/_remote/__init__.py +56 -0
  19. crossref_local/_remote/base.py +356 -0
  20. crossref_local/_remote/collections.py +175 -0
  21. crossref_local/_server/__init__.py +140 -0
  22. crossref_local/_server/middleware.py +25 -0
  23. crossref_local/_server/models.py +129 -0
  24. crossref_local/_server/routes_citations.py +98 -0
  25. crossref_local/_server/routes_collections.py +282 -0
  26. crossref_local/_server/routes_compat.py +102 -0
  27. crossref_local/_server/routes_works.py +128 -0
  28. crossref_local/_server/server.py +19 -0
  29. crossref_local/aio.py +30 -206
  30. crossref_local/cache.py +100 -100
  31. crossref_local/cli.py +5 -515
  32. crossref_local/jobs.py +169 -0
  33. crossref_local/mcp_server.py +5 -410
  34. crossref_local/remote.py +5 -266
  35. crossref_local/server.py +5 -349
  36. {crossref_local-0.4.0.dist-info → crossref_local-0.5.0.dist-info}/METADATA +36 -11
  37. crossref_local-0.5.0.dist-info/RECORD +47 -0
  38. {crossref_local-0.4.0.dist-info → crossref_local-0.5.0.dist-info}/entry_points.txt +1 -1
  39. crossref_local/cli_mcp.py +0 -275
  40. crossref_local-0.4.0.dist-info/RECORD +0 -27
  41. crossref_local/{cache_viz.py → _cache/viz.py} +0 -0
  42. crossref_local/{cli_cache.py → _cli/cache.py} +0 -0
  43. crossref_local/{cli_completion.py → _cli/completion.py} +0 -0
  44. crossref_local/{cli_main.py → _cli/main.py} +0 -0
  45. crossref_local/{impact_factor → _impact_factor}/__init__.py +0 -0
  46. crossref_local/{impact_factor → _impact_factor}/calculator.py +0 -0
  47. crossref_local/{impact_factor → _impact_factor}/journal_lookup.py +0 -0
  48. {crossref_local-0.4.0.dist-info → crossref_local-0.5.0.dist-info}/WHEEL +0 -0
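The counts above tell a consistent story: 0.5.0 moves the implementation into private subpackages (_core, _cache, _cli, _server, _remote, _impact_factor), while the old top-level modules shrink to a handful of lines (cli.py +5 -515, mcp_server.py +5 -410, remote.py +5 -266, server.py +5 -349), which suggests they survive only as re-export shims so existing imports keep working. A minimal sketch of what such a shim presumably looks like — the shim module bodies themselves are not shown in this diff, so the exact form is an assumption:

    # Hypothetical contents of crossref_local/server.py after the move.
    # The diff only shows "+5 -515"-style counts for these modules, so this
    # illustrates the re-export pattern, not the released source.
    from ._server import *  # noqa: F401,F403  - re-export the moved implementation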
crossref_local/cache.py CHANGED
@@ -18,38 +18,37 @@ Usage:
     >>> stats = cache.stats("epilepsy")
 """
 
-import json
-import os
-import time
-from dataclasses import dataclass
-from pathlib import Path
-from typing import Any, Dict, List, Optional
+import json as _json
+import time as _time
+from dataclasses import dataclass as _dataclass
+from typing import Any as _Any
+from typing import Dict as _Dict
+from typing import List as _List
+from typing import Optional as _Optional
+
+from ._core.api import get_many as _get_many
+from ._core.api import search as _search
+from ._cache.utils import cache_path as _cache_path
+from ._cache.utils import get_cache_dir as _get_cache_dir
+from ._cache.utils import meta_path as _meta_path
 
-from .api import get_many, search
-
-
-def _get_cache_dir() -> Path:
-    """Get cache directory, creating if needed."""
-    cache_dir = Path(
-        os.environ.get(
-            "CROSSREF_LOCAL_CACHE_DIR", Path.home() / ".cache" / "crossref-local"
-        )
-    )
-    cache_dir.mkdir(parents=True, exist_ok=True)
-    return cache_dir
-
-
-def _cache_path(name: str) -> Path:
-    """Get path for a named cache."""
-    return _get_cache_dir() / f"{name}.json"
-
-
-def _meta_path(name: str) -> Path:
-    """Get path for cache metadata."""
-    return _get_cache_dir() / f"{name}.meta.json"
+__all__ = [
+    "CacheInfo",
+    "create",
+    "append",
+    "load",
+    "query",
+    "query_dois",
+    "stats",
+    "info",
+    "exists",
+    "list_caches",
+    "delete",
+    "export",
+]
 
 
-@dataclass
+@_dataclass
 class CacheInfo:
     """Information about a cache."""
 
@@ -58,7 +57,7 @@ class CacheInfo:
     size_bytes: int
     paper_count: int
    created_at: str
-    query: Optional[str] = None
+    query: _Optional[str] = None
 
     def to_dict(self) -> dict:
         return {
@@ -74,11 +73,12 @@ class CacheInfo:
 
 def create(
     name: str,
-    query: Optional[str] = None,
-    dois: Optional[List[str]] = None,
-    papers: Optional[List[Dict[str, Any]]] = None,
+    query: _Optional[str] = None,
+    dois: _Optional[_List[str]] = None,
+    papers: _Optional[_List[_Dict[str, _Any]]] = None,
     limit: int = 1000,
     offset: int = 0,
+    user_id: _Optional[str] = None,
 ) -> CacheInfo:
     """Create a cache from search query, DOI list, or pre-fetched papers.
 
@@ -89,6 +89,7 @@ def create(
         papers: Pre-fetched paper dicts (skips API calls)
         limit: Max papers to fetch (for query mode)
         offset: Offset for pagination (for query mode)
+        user_id: _Optional user ID for multi-tenant scoping
 
     Returns:
         CacheInfo with cache details
@@ -105,31 +106,31 @@ def create(
         raise ValueError("Must provide 'query', 'dois', or 'papers'")
     elif dois is None:
         # Get DOIs from search
-        results = search(query, limit=limit, offset=offset)
+        results = _search(query, limit=limit, offset=offset)
         dois = [w.doi for w in results.works]
         # Fetch full metadata
-        works = get_many(dois)
+        works = _get_many(dois)
         papers = [w.to_dict() for w in works]
     else:
         # Fetch full metadata for DOIs
-        works = get_many(dois)
+        works = _get_many(dois)
         papers = [w.to_dict() for w in works]
 
     # Save cache
-    cache_file = _cache_path(name)
+    cache_file = _cache_path(name, user_id)
     with open(cache_file, "w") as f:
-        json.dump(papers, f)
+        _json.dump(papers, f)
 
     # Save metadata
     meta = {
         "name": name,
         "query": query,
-        "created_at": time.strftime("%Y-%m-%d %H:%M:%S"),
+        "created_at": _time.strftime("%Y-%m-%d %H:%M:%S"),
         "paper_count": len(papers),
         "dois_requested": len(dois) if dois else len(papers),
     }
-    with open(_meta_path(name), "w") as f:
-        json.dump(meta, f, indent=2)
+    with open(_meta_path(name, user_id), "w") as f:
+        _json.dump(meta, f, indent=2)
 
     return CacheInfo(
         name=name,
@@ -143,10 +144,11 @@ def create(
 
 def append(
     name: str,
-    query: Optional[str] = None,
-    dois: Optional[List[str]] = None,
+    query: _Optional[str] = None,
+    dois: _Optional[_List[str]] = None,
     limit: int = 1000,
     offset: int = 0,
+    user_id: _Optional[str] = None,
 ) -> CacheInfo:
     """Append papers to existing cache.
 
@@ -156,20 +158,23 @@ def append(
         dois: Explicit list of DOIs to add
         limit: Max papers to fetch (for query mode)
         offset: Offset for pagination (for query mode)
+        user_id: _Optional user ID for multi-tenant scoping
 
     Returns:
         Updated CacheInfo
     """
-    if not exists(name):
-        return create(name, query=query, dois=dois, limit=limit, offset=offset)
+    if not exists(name, user_id=user_id):
+        return create(
+            name, query=query, dois=dois, limit=limit, offset=offset, user_id=user_id
+        )
 
     # Load existing
-    existing = load(name)
+    existing = load(name, user_id=user_id)
     existing_dois = {p["doi"] for p in existing}
 
     # Get new DOIs
     if dois is None and query is not None:
-        results = search(query, limit=limit, offset=offset)
+        results = _search(query, limit=limit, offset=offset)
         dois = [w.doi for w in results.works]
     elif dois is None:
         raise ValueError("Must provide either 'query' or 'dois'")
@@ -179,62 +184,64 @@ def append(
 
     if new_dois:
         # Fetch new metadata
-        new_works = get_many(new_dois)
+        new_works = _get_many(new_dois)
         new_papers = [w.to_dict() for w in new_works]
 
         # Combine and save
         all_papers = existing + new_papers
-        cache_file = _cache_path(name)
+        cache_file = _cache_path(name, user_id)
         with open(cache_file, "w") as f:
-            json.dump(all_papers, f)
+            _json.dump(all_papers, f)
 
         # Update metadata
-        meta_file = _meta_path(name)
+        meta_file = _meta_path(name, user_id)
         if meta_file.exists():
             with open(meta_file) as f:
-                meta = json.load(f)
+                meta = _json.load(f)
         else:
             meta = {"name": name}
 
-        meta["updated_at"] = time.strftime("%Y-%m-%d %H:%M:%S")
+        meta["updated_at"] = _time.strftime("%Y-%m-%d %H:%M:%S")
         meta["paper_count"] = len(all_papers)
 
         with open(meta_file, "w") as f:
-            json.dump(meta, f, indent=2)
+            _json.dump(meta, f, indent=2)
 
-        return info(name)
+        return info(name, user_id=user_id)
 
-    return info(name)
+    return info(name, user_id=user_id)
 
 
-def load(name: str) -> List[Dict[str, Any]]:
+def load(name: str, user_id: _Optional[str] = None) -> _List[_Dict[str, _Any]]:
     """Load raw cache data.
 
     Args:
         name: Cache name
+        user_id: _Optional user ID for multi-tenant scoping
 
     Returns:
         List of paper dictionaries with full metadata
     """
-    cache_file = _cache_path(name)
+    cache_file = _cache_path(name, user_id)
     if not cache_file.exists():
         raise FileNotFoundError(f"Cache not found: {name}")
 
     with open(cache_file) as f:
-        return json.load(f)
+        return _json.load(f)
 
 
 def query(
     name: str,
-    fields: Optional[List[str]] = None,
+    fields: _Optional[_List[str]] = None,
     include_abstract: bool = False,
     include_references: bool = False,
     include_citations: bool = False,
-    year_min: Optional[int] = None,
-    year_max: Optional[int] = None,
-    journal: Optional[str] = None,
-    limit: Optional[int] = None,
-) -> List[Dict[str, Any]]:
+    year_min: _Optional[int] = None,
+    year_max: _Optional[int] = None,
+    journal: _Optional[str] = None,
+    limit: _Optional[int] = None,
+    user_id: _Optional[str] = None,
+) -> _List[_Dict[str, _Any]]:
     """Query cache with field filtering.
 
     Args:
@@ -247,6 +254,7 @@ def query(
         year_max: Filter by maximum year
         journal: Filter by journal name (substring match)
         limit: Max results to return
+        user_id: _Optional user ID for multi-tenant scoping
 
     Returns:
         Filtered list of paper dictionaries
@@ -257,7 +265,7 @@ def query(
        >>> # With filters
        >>> papers = query("epilepsy", year_min=2020, include_citations=True)
    """
-    papers = load(name)
+    papers = load(name, user_id=user_id)
 
     # Apply filters
     if year_min is not None:
@@ -295,29 +303,31 @@ def query(
     return papers
 
 
-def query_dois(name: str) -> List[str]:
+def query_dois(name: str, user_id: _Optional[str] = None) -> _List[str]:
     """Get just DOIs from cache.
 
     Args:
         name: Cache name
+        user_id: _Optional user ID for multi-tenant scoping
 
     Returns:
         List of DOIs
     """
-    papers = load(name)
+    papers = load(name, user_id=user_id)
     return [p["doi"] for p in papers if p.get("doi")]
 
 
-def stats(name: str) -> Dict[str, Any]:
+def stats(name: str, user_id: _Optional[str] = None) -> _Dict[str, _Any]:
     """Get cache statistics.
 
     Args:
         name: Cache name
+        user_id: _Optional user ID for multi-tenant scoping
 
     Returns:
         Dictionary with statistics
     """
-    papers = load(name)
+    papers = load(name, user_id=user_id)
 
     # Year distribution
     years = [p.get("year") for p in papers if p.get("year")]
@@ -360,26 +370,27 @@ def stats(name: str) -> Dict[str, Any]:
     }
 
 
-def info(name: str) -> CacheInfo:
+def info(name: str, user_id: _Optional[str] = None) -> CacheInfo:
     """Get cache information.
 
     Args:
         name: Cache name
+        user_id: _Optional user ID for multi-tenant scoping
 
     Returns:
         CacheInfo object
     """
-    cache_file = _cache_path(name)
+    cache_file = _cache_path(name, user_id)
     if not cache_file.exists():
         raise FileNotFoundError(f"Cache not found: {name}")
 
-    meta_file = _meta_path(name)
+    meta_file = _meta_path(name, user_id)
     meta = {}
     if meta_file.exists():
         with open(meta_file) as f:
-            meta = json.load(f)
+            meta = _json.load(f)
 
-    papers = load(name)
+    papers = load(name, user_id=user_id)
 
     return CacheInfo(
         name=name,
@@ -391,25 +402,29 @@ def info(name: str) -> CacheInfo:
     )
 
 
-def exists(name: str) -> bool:
+def exists(name: str, user_id: _Optional[str] = None) -> bool:
     """Check if cache exists.
 
     Args:
         name: Cache name
+        user_id: _Optional user ID for multi-tenant scoping
 
     Returns:
         True if cache exists
     """
-    return _cache_path(name).exists()
+    return _cache_path(name, user_id).exists()
 
 
-def list_caches() -> List[CacheInfo]:
+def list_caches(user_id: _Optional[str] = None) -> _List[CacheInfo]:
     """List all available caches.
 
+    Args:
+        user_id: _Optional user ID for multi-tenant scoping
+
     Returns:
         List of CacheInfo objects
     """
-    cache_dir = _get_cache_dir()
+    cache_dir = _get_cache_dir(user_id)
     caches = []
 
     for f in cache_dir.glob("*.json"):
@@ -417,24 +432,25 @@ def list_caches() -> List[CacheInfo]:
             continue
         name = f.stem
         try:
-            caches.append(info(name))
+            caches.append(info(name, user_id=user_id))
        except Exception:
            pass
 
     return sorted(caches, key=lambda c: c.name)
 
 
-def delete(name: str) -> bool:
+def delete(name: str, user_id: _Optional[str] = None) -> bool:
     """Delete a cache.
 
     Args:
         name: Cache name
+        user_id: _Optional user ID for multi-tenant scoping
 
     Returns:
         True if deleted
     """
-    cache_file = _cache_path(name)
-    meta_file = _meta_path(name)
+    cache_file = _cache_path(name, user_id)
+    meta_file = _meta_path(name, user_id)
 
     deleted = False
     if cache_file.exists():
@@ -446,21 +462,5 @@ def delete(name: str) -> bool:
     return deleted
 
 
-
 # Re-export from cache_export for backwards compatibility
-from .cache_export import export
-
-__all__ = [
-    "CacheInfo",
-    "create",
-    "append",
-    "load",
-    "query",
-    "query_dois",
-    "stats",
-    "info",
-    "exists",
-    "list_caches",
-    "delete",
-    "export",
-]
+from ._cache.export import export
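
The cache.py diff above has two distinct strands: every module-level import is aliased to an underscore-prefixed name and the public surface is pinned by an explicit __all__, and every public function gains an optional user_id parameter whose path handling now lives in _cache.utils (cache_path, get_cache_dir, meta_path). Based only on the signatures visible above, multi-tenant use would presumably look like the sketch below — the query strings and user IDs are invented for illustration:

    from crossref_local import cache

    # Default single-tenant behaviour: same call shape as in 0.4.0.
    base = cache.create("epilepsy", query="epilepsy", limit=100)

    # With user_id, each tenant presumably gets its own scoped cache
    # location, so identical cache names no longer collide.
    cache.create("epilepsy", query="epilepsy", limit=100, user_id="alice")
    cache.create("epilepsy", query="epilepsy", limit=100, user_id="bob")

    assert cache.exists("epilepsy", user_id="alice")
    alice_recent = cache.query("epilepsy", year_min=2020, user_id="alice")

Passing no user_id keeps the 0.4.0 behaviour, since every new parameter defaults to None and is simply forwarded to the _cache.utils path helpers.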