PyPI - arxiv-to-prompt - Versions diffs - 0.5.0__tar.gz → 0.5.1__tar.gz - Mend

arxiv-to-prompt 0.5.0.tar.gz → 0.5.1.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15) hide show

{arxiv_to_prompt-0.5.0/src/arxiv_to_prompt.egg-info → arxiv_to_prompt-0.5.1}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: arxiv-to-prompt
-Version: 0.5.0
+Version: 0.5.1
 Summary: transform arXiv papers into a single latex prompt for LLMs
 Author: Takashi Ishida
 License: MIT

{arxiv_to_prompt-0.5.0 → arxiv_to_prompt-0.5.1}/pyproject.toml RENAMED Viewed

@@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta"
 [project]
 name = "arxiv-to-prompt"
-version = "0.5.0"
+version = "0.5.1"
 description = "transform arXiv papers into a single latex prompt for LLMs"
 readme = "README.md"
 authors = [{ name = "Takashi Ishida" }]

{arxiv_to_prompt-0.5.0 → arxiv_to_prompt-0.5.1}/src/arxiv_to_prompt/core.py RENAMED Viewed

@@ -92,40 +92,55 @@ def download_arxiv_source(arxiv_id: str, cache_dir: Optional[str] = None, use_ca
 def find_main_tex(directory: str) -> Optional[str]:
     """
-    Find the main .tex file containing documentclass.
+    Find the main .tex file containing documentclass.
+    Searches recursively through subdirectories.
     First checks for common naming conventions (main.tex, paper.tex, index.tex).
-    If none found, returns the filename of the longest .tex file containing documentclass,
-    since shorter files are typically conference templates or supplementary documents
+    If none found, returns the path of the longest .tex file containing documentclass,
+    since shorter files are typically conference templates or supplementary documents
     rather than the main manuscript.
     """
     common_names = ['main.tex', 'paper.tex', 'index.tex']
     main_tex_file = None
     max_line_count = 0
-    # First pass: check for common naming conventions
-    for file_name in os.listdir(directory):
-        if file_name in common_names:
-            try:
-                with open(os.path.join(directory, file_name), 'r', encoding='utf-8') as file:
-                    lines = file.readlines()
-                    if any('\\documentclass' in line for line in lines):
-                        return file_name
-            except Exception as e:
-                logging.warning(f"Could not read file {file_name}: {e}")
+    # Walk through directory and subdirectories
+    for root, dirs, files in os.walk(directory):
+        rel_root = os.path.relpath(root, directory)
+        # First pass: check for common naming conventions
+        for file_name in files:
+            if file_name in common_names:
+                file_path = os.path.join(root, file_name)
+                try:
+                    with open(file_path, 'r', encoding='utf-8') as file:
+                        lines = file.readlines()
+                        if any('\\documentclass' in line for line in lines):
+                            if rel_root == '.':
+                                return file_name
+                            return os.path.join(rel_root, file_name)
+                except Exception as e:
+                    logging.warning(f"Could not read file {file_path}: {e}")
     # Second pass: find the longest .tex file containing documentclass
-    for file_name in os.listdir(directory):
-        if file_name.endswith('.tex'):
-            try:
-                with open(os.path.join(directory, file_name), 'r', encoding='utf-8') as file:
-                    lines = file.readlines()
-                    if any('\\documentclass' in line for line in lines):
-                        line_count = len(lines)
-                        if line_count > max_line_count:
-                            main_tex_file = file_name
-                            max_line_count = line_count
-            except Exception as e:
-                logging.warning(f"Could not read file {file_name}: {e}")
+    for root, dirs, files in os.walk(directory):
+        rel_root = os.path.relpath(root, directory)
+        for file_name in files:
+            if file_name.endswith('.tex'):
+                file_path = os.path.join(root, file_name)
+                try:
+                    with open(file_path, 'r', encoding='utf-8') as file:
+                        lines = file.readlines()
+                        if any('\\documentclass' in line for line in lines):
+                            line_count = len(lines)
+                            if line_count > max_line_count:
+                                if rel_root == '.':
+                                    main_tex_file = file_name
+                                else:
+                                    main_tex_file = os.path.join(rel_root, file_name)
+                                max_line_count = line_count
+                except Exception as e:
+                    logging.warning(f"Could not read file {file_path}: {e}")
     return main_tex_file

{arxiv_to_prompt-0.5.0 → arxiv_to_prompt-0.5.1/src/arxiv_to_prompt.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: arxiv-to-prompt
-Version: 0.5.0
+Version: 0.5.1
 Summary: transform arXiv papers into a single latex prompt for LLMs
 Author: Takashi Ishida
 License: MIT

{arxiv_to_prompt-0.5.0 → arxiv_to_prompt-0.5.1}/tests/test_core.py RENAMED Viewed

@@ -153,6 +153,23 @@ def test_find_main_tex(temp_cache_dir):
     assert found_main == "main.tex"
+def test_find_main_tex_in_subdirectory(temp_cache_dir):
+    """Test finding main tex file in a subdirectory."""
+    # Create test directory with subdirectory
+    tex_dir = temp_cache_dir / "test_tex_subdir"
+    tex_dir.mkdir(parents=True)
+    subdir = tex_dir / "paper"
+    subdir.mkdir()
+    # Create main.tex in subdirectory
+    main_file = subdir / "main.tex"
+    main_file.write_text("\\documentclass{article}\n\\begin{document}\nHello\n\\end{document}")
+    # Test finding main file in subdirectory
+    found_main = find_main_tex(str(tex_dir))
+    assert found_main == os.path.join("paper", "main.tex")
 def test_commented_input_commands(temp_cache_dir):
     """Test that commented-out \\include and \\input commands are ignored."""
     # Create test directory and files