academic-refchecker 1.2.61__tar.gz → 1.2.63__tar.gz
This diff shows the differences between the contents of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects the changes between those package versions as they appear in their respective public registries.
- {academic_refchecker-1.2.61/src/academic_refchecker.egg-info → academic_refchecker-1.2.63}/PKG-INFO +1 -1
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63/src/academic_refchecker.egg-info}/PKG-INFO +1 -1
- academic_refchecker-1.2.63/src/refchecker/__version__.py +5 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/semantic_scholar.py +3 -3
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/arxiv_utils.py +10 -1
- academic_refchecker-1.2.61/src/refchecker/__version__.py +0 -5
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/LICENSE +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/MANIFEST.in +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/README.md +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/pyproject.toml +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/requirements.txt +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/scripts/download_db.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/scripts/run_tests.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/scripts/start_vllm_server.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/setup.cfg +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/academic_refchecker.egg-info/SOURCES.txt +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/academic_refchecker.egg-info/dependency_links.txt +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/academic_refchecker.egg-info/entry_points.txt +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/academic_refchecker.egg-info/requires.txt +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/academic_refchecker.egg-info/top_level.txt +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/__init__.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/__main__.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/__init__.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/crossref.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/enhanced_hybrid_checker.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/github_checker.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/local_semantic_scholar.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/openalex.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/openreview_checker.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/pdf_paper_checker.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/webpage_checker.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/config/__init__.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/config/logging.conf +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/config/settings.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/core/__init__.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/core/db_connection_pool.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/core/parallel_processor.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/core/refchecker.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/database/__init__.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/database/download_semantic_scholar_db.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/llm/__init__.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/llm/base.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/llm/providers.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/scripts/__init__.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/scripts/start_vllm_server.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/services/__init__.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/services/pdf_processor.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/__init__.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/author_utils.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/biblatex_parser.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/bibliography_utils.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/bibtex_parser.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/config_validator.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/db_utils.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/doi_utils.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/error_utils.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/mock_objects.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/text_utils.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/unicode_utils.py +0 -0
- {academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/url_utils.py +0 -0
|
@@ -95,7 +95,7 @@ class NonArxivReferenceChecker:
|
|
|
95
95
|
# Make the request with retries and backoff
|
|
96
96
|
for attempt in range(max_retries_for_this_query):
|
|
97
97
|
try:
|
|
98
|
-
response = requests.get(endpoint, headers=self.headers, params=params)
|
|
98
|
+
response = requests.get(endpoint, headers=self.headers, params=params, timeout=30)
|
|
99
99
|
|
|
100
100
|
# Check for rate limiting
|
|
101
101
|
if response.status_code == 429:
|
|
@@ -141,7 +141,7 @@ class NonArxivReferenceChecker:
|
|
|
141
141
|
# Make the request with retries and backoff
|
|
142
142
|
for attempt in range(self.max_retries):
|
|
143
143
|
try:
|
|
144
|
-
response = requests.get(endpoint, headers=self.headers, params=params)
|
|
144
|
+
response = requests.get(endpoint, headers=self.headers, params=params, timeout=30)
|
|
145
145
|
|
|
146
146
|
# Check for rate limiting
|
|
147
147
|
if response.status_code == 429:
|
|
@@ -264,7 +264,7 @@ class NonArxivReferenceChecker:
|
|
|
264
264
|
|
|
265
265
|
for attempt in range(self.max_retries):
|
|
266
266
|
try:
|
|
267
|
-
response = requests.get(endpoint, headers=self.headers, params=params)
|
|
267
|
+
response = requests.get(endpoint, headers=self.headers, params=params, timeout=30)
|
|
268
268
|
|
|
269
269
|
if response.status_code == 429:
|
|
270
270
|
wait_time = self.request_delay * (self.backoff_factor ** attempt)
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/arxiv_utils.py
RENAMED
|
@@ -458,7 +458,16 @@ def get_bibtex_content(paper):
|
|
|
458
458
|
|
|
459
459
|
logger.debug(f"Bibliography comparison: .bbl has {bbl_entry_count} entries, .bib has {bib_entry_count} entries")
|
|
460
460
|
|
|
461
|
-
|
|
461
|
+
# IMPORTANT: Prefer .bbl when .bib is excessively large (e.g., includes full ACL Anthology)
|
|
462
|
+
# The .bbl file contains only the actually-cited references, while .bib may contain
|
|
463
|
+
# entire bibliography databases. Parsing 80k+ entries would cause the tool to hang.
|
|
464
|
+
# Use .bbl if: (1) .bbl has entries AND (2) .bib has >10x more entries than .bbl OR >1000 entries
|
|
465
|
+
excessive_bib = bib_entry_count > 1000 or (bbl_entry_count > 0 and bib_entry_count > bbl_entry_count * 10)
|
|
466
|
+
|
|
467
|
+
if bbl_entry_count > 0 and excessive_bib:
|
|
468
|
+
logger.info(f"Using .bbl files from ArXiv source (.bib has {bib_entry_count} entries which is excessive, .bbl has {bbl_entry_count})")
|
|
469
|
+
return bbl_content
|
|
470
|
+
elif uses_bibtex and bib_entry_count > 0 and not excessive_bib:
|
|
462
471
|
logger.info(f"Using .bib files from ArXiv source (main TeX uses \\bibliography{{...}})")
|
|
463
472
|
return bib_content
|
|
464
473
|
elif bbl_entry_count > 0:
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/__init__.py
RENAMED
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/crossref.py
RENAMED
|
File without changes
|
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/github_checker.py
RENAMED
|
File without changes
|
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/openalex.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/checkers/webpage_checker.py
RENAMED
|
File without changes
|
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/config/logging.conf
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/core/db_connection_pool.py
RENAMED
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/core/parallel_processor.py
RENAMED
|
File without changes
|
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/database/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/scripts/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/services/__init__.py
RENAMED
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/services/pdf_processor.py
RENAMED
|
File without changes
|
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/author_utils.py
RENAMED
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/biblatex_parser.py
RENAMED
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/bibliography_utils.py
RENAMED
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/bibtex_parser.py
RENAMED
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/config_validator.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/error_utils.py
RENAMED
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/mock_objects.py
RENAMED
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/text_utils.py
RENAMED
|
File without changes
|
{academic_refchecker-1.2.61 → academic_refchecker-1.2.63}/src/refchecker/utils/unicode_utils.py
RENAMED
|
File without changes
|
|
File without changes
|