txt2ebook 0.1.159__tar.gz → 0.1.161__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {txt2ebook-0.1.159/src/txt2ebook.egg-info → txt2ebook-0.1.161}/PKG-INFO +3 -3
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/pyproject.toml +3 -3
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/__init__.py +2 -1
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/cli.py +2 -2
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/exceptions.py +4 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/formats/base.py +8 -6
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/formats/epub.py +2 -2
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/formats/txt.py +12 -8
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/formats/typ.py +2 -1
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/helpers/__init__.py +2 -1
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/models/book.py +2 -2
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/parser.py +165 -88
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/subcommands/epub.py +7 -5
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/subcommands/gmi.py +39 -3
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/subcommands/md.py +39 -3
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/subcommands/parse.py +6 -3
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/subcommands/pdf.py +39 -3
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/subcommands/tex.py +7 -5
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/subcommands/typ.py +37 -7
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/tokenizer.py +11 -6
- {txt2ebook-0.1.159 → txt2ebook-0.1.161/src/txt2ebook.egg-info}/PKG-INFO +3 -3
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/LICENSE.md +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/README.md +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/setup.cfg +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/__main__.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/formats/__init__.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/formats/gmi.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/formats/md.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/formats/pdf.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/formats/templates/__init__.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/formats/templates/epub/__init__.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/formats/tex.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/languages/__init__.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/languages/en.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/languages/zh_cn.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/languages/zh_tw.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/models/__init__.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/models/chapter.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/models/volume.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/subcommands/__init__.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/subcommands/env.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/subcommands/massage.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook/zh_utils.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook.egg-info/SOURCES.txt +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook.egg-info/dependency_links.txt +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook.egg-info/entry_points.txt +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook.egg-info/requires.txt +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/src/txt2ebook.egg-info/top_level.txt +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/tests/test_parser.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/tests/test_tokenizer.py +0 -0
- {txt2ebook-0.1.159 → txt2ebook-0.1.161}/tests/test_txt2ebook.py +0 -0

{txt2ebook-0.1.159/src/txt2ebook.egg-info → txt2ebook-0.1.161}/PKG-INFO

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: txt2ebook
-Version: 0.1.159
+Version: 0.1.161
 Summary: CLI tool to convert txt file to ebook format
 Author-email: Kian-Meng Ang <kianmeng@cpan.org>
 License-Expression: AGPL-3.0-or-later
@@ -13,17 +13,17 @@ Classifier: Natural Language :: Chinese (Simplified)
 Classifier: Natural Language :: Chinese (Traditional)
 Classifier: Programming Language :: Python
 Classifier: Programming Language :: Python :: 3 :: Only
-Classifier: Programming Language :: Python :: 3.9
 Classifier: Programming Language :: Python :: 3.10
 Classifier: Programming Language :: Python :: 3.11
 Classifier: Programming Language :: Python :: 3.12
 Classifier: Programming Language :: Python :: 3.13
+Classifier: Programming Language :: Python :: 3.14
 Classifier: Topic :: Text Processing
 Classifier: Topic :: Text Processing :: Filters
 Classifier: Topic :: Text Processing :: General
 Classifier: Topic :: Text Processing :: Markup :: HTML
 Classifier: Topic :: Text Processing :: Markup :: Markdown
-Requires-Python: >=3.9
+Requires-Python: >=3.10
 Description-Content-Type: text/markdown
 License-File: LICENSE.md
 Requires-Dist: CJKwrap~=2.2

pyproject.toml

@@ -1,9 +1,9 @@
 [project]
 name = "txt2ebook"
-version = "0.1.159"
+version = "0.1.161"
 description = "CLI tool to convert txt file to ebook format"
 authors = [{ name = "Kian-Meng Ang", email = "kianmeng@cpan.org" }]
-requires-python = ">=3.9"
+requires-python = ">=3.10"
 readme = "README.md"
 license = "AGPL-3.0-or-later"
 license-files = ["LICENSE.md"]
@@ -25,11 +25,11 @@ classifiers = [
     "Natural Language :: Chinese (Traditional)",
     "Programming Language :: Python",
     "Programming Language :: Python :: 3 :: Only",
-    "Programming Language :: Python :: 3.9",
     "Programming Language :: Python :: 3.10",
     "Programming Language :: Python :: 3.11",
     "Programming Language :: Python :: 3.12",
     "Programming Language :: Python :: 3.13",
+    "Programming Language :: Python :: 3.14",
     "Topic :: Text Processing",
     "Topic :: Text Processing :: Filters",
     "Topic :: Text Processing :: General",

src/txt2ebook/__init__.py

@@ -15,6 +15,7 @@
 
 """Common shared functions."""
 
+from importlib import metadata
 import argparse
 import logging
 import platform
@@ -24,7 +25,7 @@ import langdetect
 
 logger = logging.getLogger(__name__)
 
-__version__ = "0.1.159"
+__version__ = metadata.version("txt2ebook")
 
 
 def setup_logger(config: argparse.Namespace) -> None:
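
The hard-coded version string in `__init__.py` is replaced with a lookup against the installed distribution's metadata, making `pyproject.toml` the single source of truth for the version. A minimal sketch of the same pattern; the fallback branch is an assumption for uninstalled source checkouts, not part of this diff:

# Single-source the package version from distribution metadata.
from importlib import metadata

try:
    __version__ = metadata.version("txt2ebook")
except metadata.PackageNotFoundError:
    # Assumed fallback: running from a source checkout that was never installed.
    __version__ = "0.0.0"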

src/txt2ebook/cli.py

@@ -23,7 +23,7 @@ issues: https://github.com/kianmeng/txt2ebook/issues
 import argparse
 import logging
 import sys
-from typing import Optional, Sequence
+from typing import Sequence
 
 import txt2ebook.subcommands
 from txt2ebook import __version__, setup_logger
@@ -134,7 +134,7 @@ def build_parser() -> argparse.ArgumentParser:
     return parser
 
 
-def main(args: Optional[Sequence[str]] = None):
+def main(args: Sequence[str] | None = None):
     """Set the main entrypoint of the CLI script."""
     args = args or sys.argv[1:]
 
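
Dropping Python 3.9 is what allows this annotation change: PEP 604 union syntax in a runtime-evaluated annotation raises a TypeError on 3.9. The old side of this hunk is truncated in the source, so the `Optional` spelling above is a reconstruction. A minimal sketch of the equivalence:

from typing import Optional, Sequence

# Both signatures accept the same arguments; the second form needs
# Python 3.10+ when the annotation is evaluated at runtime.
def main_old(args: Optional[Sequence[str]] = None) -> None: ...
def main_new(args: Sequence[str] | None = None) -> None: ...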

src/txt2ebook/formats/base.py

@@ -24,8 +24,8 @@ import shutil
 import subprocess
 import sys
 from abc import ABC, abstractmethod
-from importlib import import_module
 from pathlib import Path
+from types import ModuleType
 
 from txt2ebook.helpers import lower_underscore
 from txt2ebook.models import Book, Chapter, Volume
@@ -36,22 +36,23 @@ logger = logging.getLogger(__name__)
 class BaseWriter(ABC):
     """Base class for writing to ebook format."""
 
-    def __init__(self, book: Book, opts: argparse.Namespace) -> None:
+    def __init__(
+        self, book: Book, opts: argparse.Namespace, langconf: ModuleType
+    ) -> None:
         """Create a Writer module.
 
         Args:
            book(Book): The book model which contains metadata and table of
            contents of volumes and chapters.
            opts(argparse.Namespace): The configs from the command-line.
+           langconf(ModuleType): The language configuration module.
 
        Returns:
            None
        """
        self.book = book
        self.config = opts
-
-        config_lang = self.config.language.replace("-", "_")
-        self.langconf = import_module(f"txt2ebook.languages.{config_lang}")
+        self.langconf = langconf
 
        if not self.config.output_file:
            self._refresh_output_folder()
@@ -84,7 +85,8 @@ class BaseWriter(ABC):
             shutil.rmtree(cwd)
         else:
             answer = input(
-                f"Are you sure to purge output folder: {cwd.absolute()}? [y/N] "
+                f"Are you sure to purge output folder: {cwd.absolute()}? "
+                "[y/N] "
             )
             if answer.lower() == "y":
                 logger.debug("Purge output folder: %s", cwd.absolute())
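
Writers no longer resolve their language configuration module themselves; the already-imported module is injected through the constructor. A sketch of the wiring before and after, using names from the diff and assuming txt2ebook is installed; the "zh-cn" value is only an example:

import argparse
from importlib import import_module

config = argparse.Namespace(language="zh-cn")

# Before: every BaseWriter subclass re-imported the module on its own.
config_lang = config.language.replace("-", "_")
langconf = import_module(f"txt2ebook.languages.{config_lang}")

# After: the parse step resolves langconf once and each writer receives it,
# e.g. EpubWriter(book, config, langconf).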

src/txt2ebook/formats/epub.py

@@ -19,7 +19,7 @@ import logging
 import uuid
 from importlib.resources import contents, read_text
 from pathlib import Path
-from typing import Optional
+
 
 from ebooklib import epub
 
@@ -181,7 +181,7 @@ class EpubWriter(BaseWriter):
         return epub_html
 
     def _build_chapter(
-        self, chapter: Chapter, volume: Optional[Volume] = None
+        self, chapter: Chapter, volume: Volume | None = None
     ) -> epub.EpubHtml:
         """Generate the whole chapter to HTML."""
         if volume:

src/txt2ebook/formats/txt.py

@@ -155,17 +155,21 @@ class TxtWriter(BaseWriter):
             chapter_seq = 0
             for chapter in section.chapters:
                 chapter_seq += 1
-                output_filename = self._get_volume_chapter_filename_for_split(
-                    txt_filename,
-                    str(section_seq).rjust(2, "0"),
-                    str(chapter_seq).rjust(2, "0"),
-                    section,
-                    chapter,
-                    ".txt",
+                output_filename = (
+                    self._get_volume_chapter_filename_for_split(
+                        txt_filename,
+                        str(section_seq).rjust(2, "0"),
+                        str(chapter_seq).rjust(2, "0"),
+                        section,
+                        chapter,
+                        ".txt",
+                    )
                 )
                 with open(output_filename, "w", encoding="utf8") as file:
                     logger.info("Creating %s", output_filename.resolve())
-                    file.write(self._to_volume_chapter_txt(section, chapter))
+                    file.write(
+                        self._to_volume_chapter_txt(section, chapter)
+                    )
         elif isinstance(section, Chapter):
             section_seq += 1
             output_filename = self._get_chapter_filename_for_split(

src/txt2ebook/formats/typ.py

@@ -140,7 +140,8 @@ class TypWriter(BaseWriter):
             f"""
             #set page(paper: "{self._get_pagesize()}", numbering: none)
             #align(center + horizon, text(17pt)[{self.book.title}])
-            #align(center + horizon, text(17pt)[{", ".join(self.book.authors)}])
+            #align(center + horizon, text(17pt)[
+            {", ".join(self.book.authors)}])
             #pagebreak()
 
             """

src/txt2ebook/helpers/__init__.py

@@ -22,7 +22,8 @@ logger = logging.getLogger(__name__)
 
 
 def lower_underscore(string: str) -> str:
-    """Convert a string to lower case and replace multiple spaces to single underscore.
+    """Convert a string to lower case and replace multiple spaces to single
+    underscore.
 
     Args:
         string (str): A string.

src/txt2ebook/models/book.py

@@ -18,7 +18,7 @@
 import logging
 from collections import Counter
 from dataclasses import dataclass, field
-from typing import List, Union
+from typing import List
 
 from txt2ebook.models.chapter import Chapter
 from txt2ebook.models.volume import Volume
@@ -38,7 +38,7 @@ class Book:
     language: str = field(default="")
     cover: str = field(default="", repr=False)
     raw_content: str = field(default="", repr=False)
-    toc: List[Union[Volume, Chapter]] = field(default_factory=list, repr=False)
+    toc: List[Volume | Chapter] = field(default_factory=list, repr=False)
 
     def stats(self) -> Counter:
         """Returns the statistics count for the parsed tokens.

src/txt2ebook/parser.py

@@ -17,14 +17,15 @@
 
 import argparse
 import logging
+from collections import Counter
 from dataclasses import dataclass
 from types import ModuleType
-from typing import List, Tuple, Union
+from typing import List, Tuple
 
 import regex as re
 
 from txt2ebook.models import Book, Chapter, Volume
-from txt2ebook.tokenizer import Tokenizer
+from txt2ebook.tokenizer import Token, Tokenizer
 from txt2ebook.zh_utils import zh_halfwidth_to_fullwidth, zh_words_to_numbers
 
 logger = logging.getLogger(__name__)
@@ -55,7 +56,7 @@ class Parser:
         Returns:
             txt2ebook.models.Book: The Book model.
         """
-        tokenizer = Tokenizer(self.raw_content, self.config)
+        tokenizer = Tokenizer(self.raw_content, self.config, self.langconf)
 
         (book_title, authors, translators, tags, index, toc) = (
             self.parse_tokens(tokenizer)
@@ -79,6 +80,28 @@ class Parser:
 
         return book
 
+    def _pad_header_number(self, words: str, length: int) -> str:
+        """Left pad the section number if found as halfwidth or fullwidth
+        integer.
+        """
+        # left pad the section number if found as halfwidth integer
+        match = re.match(rf"第([{self.langconf.HALFWIDTH_NUMS}]*)", words)
+        if match and match.group(1) != "":
+            header_nums = match.group(1)
+            return words.replace(
+                header_nums, str(header_nums).rjust(length, "0")
+            )
+
+        # left pad the section number if found as fullwidth integer
+        match = re.match(rf"第([{self.langconf.FULLWIDTH_NUMS}]*)", words)
+        if match and match.group(1) != "":
+            header_nums = match.group(1)
+            return words.replace(
+                header_nums, str(header_nums).rjust(length, "0")
+            )
+
+        return words
+
     def words_to_nums(self, words: str, length: int) -> str:
         """Convert header from words to numbers.
 
@@ -99,22 +122,13 @@ class Parser:
         ):
             return words
 
-        # left pad the section number if found as halfwidth integer
-        match = re.match(rf"第([{self.langconf.HALFWIDTH_NUMS}]*)", words)
-        if match and match.group(1) != "":
-            header_nums = match.group(1)
-            return words.replace(
-                header_nums, str(header_nums).rjust(length, "0")
-            )
-
-        # left pad the section number if found as fullwidth integer
-        match = re.match(rf"第([{self.langconf.FULLWIDTH_NUMS}]*)", words)
-        if match and match.group(1) != "":
-            header_nums = match.group(1)
-            return words.replace(
-                header_nums, str(header_nums).rjust(length, "0")
-            )
+        # Check if the header is already a number and pad it
+        padded_words = self._pad_header_number(words, length)
+        if padded_words != words:
+            return padded_words
 
+        # Convert words to numbers and then apply fullwidth conversion if
+        # configured
         replaced_words = zh_words_to_numbers(words, length=length)
 
         if hasattr(self.config, "fullwidth") and self.config.fullwidth:
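
The two duplicated padding blocks move into `_pad_header_number`, and `words_to_nums` now tries padding first, falling back to word-to-number conversion only when the header is not already numeric. A standalone sketch of the halfwidth branch, assuming the language module's `HALFWIDTH_NUMS` expands to the ASCII digits:

import re

def pad_header_number(words: str, length: int) -> str:
    # Left pad the number after the section prefix "第" with zeros.
    match = re.match(r"第([0-9]*)", words)
    if match and match.group(1) != "":
        header_nums = match.group(1)
        return words.replace(header_nums, header_nums.rjust(length, "0"))
    return words

print(pad_header_number("第7章", 2))   # 第07章
print(pad_header_number("第12章", 2))  # 第12章, already wide enough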
@@ -127,14 +141,102 @@ class Parser:
             )
         return replaced_words
 
+    def _process_metadata_token(self, token: Token, book_data: dict) -> None:
+        """Process metadata tokens (TITLE, AUTHOR, TAG, INDEX, TRANSLATOR)."""
+        if token.type == "TITLE":
+            book_data["book_title"] = token.value
+        elif token.type == "AUTHOR":
+            book_data["authors"].append(token.value)
+        elif token.type == "TAG":
+            book_data["tags"].append(token.value)
+        elif token.type == "INDEX":
+            book_data["index"] = token.value.split(" ")
+        elif token.type == "TRANSLATOR":
+            book_data["translators"].append(token.value)
+
+    def _process_volume_chapter_token(
+        self,
+        token: Token,
+        toc: List[Volume | Chapter],
+        stats: Counter,
+        current_volume: Volume,
+        current_chapter: Chapter,
+    ) -> Tuple[Volume, Chapter]:
+        """Process VOLUME_CHAPTER token and update current volume/chapter."""
+        [volume, chapter] = token.value
+
+        volume_title = self.words_to_nums(volume.value, 2)
+        if current_volume.title != volume_title:
+            current_volume = Volume(title=volume_title)
+            toc.append(current_volume)
+
+        chapter_title = self.words_to_nums(
+            chapter.value, len(str(stats.get("VOLUME_CHAPTER")))
+        )
+        if current_chapter.title != chapter_title:
+            current_chapter = Chapter(title=chapter_title)
+            if isinstance(toc[-1], Volume):
+                toc[-1].add_chapter(current_chapter)
+
+        return current_volume, current_chapter
+
+    def _process_volume_token(
+        self,
+        token: Token,
+        toc: List[Volume | Chapter],
+        stats: Counter,
+        current_volume: Volume,
+    ) -> Volume:
+        """Process VOLUME token and update current volume."""
+        volume_title = self.words_to_nums(
+            token.value, len(str(stats.get("VOLUME")))
+        )
+        if current_volume.title != volume_title:
+            current_volume = Volume(title=volume_title)
+            toc.append(current_volume)
+        return current_volume
+
+    def _process_chapter_token(
+        self,
+        token: Token,
+        toc: List[Volume | Chapter],
+        stats: Counter,
+        current_chapter: Chapter,
+    ) -> Chapter:
+        """Process CHAPTER token and update current chapter."""
+        chapter_title = self.words_to_nums(
+            token.value, len(str(stats.get("CHAPTER")))
+        )
+        if current_chapter.title != chapter_title:
+            current_chapter = Chapter(title=chapter_title)
+
+            if toc and isinstance(toc[-1], Volume):
+                toc[-1].add_chapter(current_chapter)
+            else:
+                toc.append(current_chapter)
+        return current_chapter
+
+    def _process_paragraph_token(
+        self, token: Token, toc: List[Volume | Chapter]
+    ) -> None:
+        """Process PARAGRAPH token and add it to the current chapter."""
+        if toc:
+            if isinstance(toc[-1], Volume):
+                toc[-1].chapters[-1].add_paragraph(token.value)
+
+            if isinstance(toc[-1], Chapter):
+                toc[-1].add_paragraph(token.value)
+
     def parse_tokens(self, tokenizer: Tokenizer) -> Tuple:
         """Parse the tokens and organize into book structure."""
-        toc: List[Union[Volume, Chapter]] = []
-        book_title = ""
-        authors = []
-        tags = []
-        index = []
-        translators = []
+        toc: List[Volume | Chapter] = []
+        book_data = {
+            "book_title": "",
+            "authors": [],
+            "tags": [],
+            "index": [],
+            "translators": [],
+        }
         current_volume = Volume("")
         current_chapter = Chapter("")
 
@@ -162,80 +264,48 @@ class Parser:
         ):
             logger.debug(repr(token))
 
-            if token.type == "TITLE":
-                book_title = token.value
-
-            if token.type == "AUTHOR":
-                authors.append(token.value)
-
-            if token.type == "TAG":
-                tags.append(token.value)
-
-            if token.type == "INDEX":
-                index = token.value.split(" ")
-
-            if token.type == "TRANSLATOR":
-                translators.append(token.value)
-
-            if token.type == "VOLUME_CHAPTER":
-                [volume, chapter] = token.value
-
-                volume_title = self.words_to_nums(volume.value, 2)
-                if current_volume.title != volume_title:
-                    current_volume = Volume(title=volume_title)
-                    toc.append(current_volume)
-
-                chapter_title = self.words_to_nums(
-                    chapter.value, len(str(stats.get("VOLUME_CHAPTER")))
+            if token.type in [
+                "TITLE",
+                "AUTHOR",
+                "TAG",
+                "INDEX",
+                "TRANSLATOR",
+            ]:
+                self._process_metadata_token(token, book_data)
+            elif token.type == "VOLUME_CHAPTER":
+                (current_volume, current_chapter) = (
+                    self._process_volume_chapter_token(
+                        token, toc, stats, current_volume, current_chapter
+                    )
                 )
-                if current_chapter.title != chapter_title:
-                    current_chapter = Chapter(title=chapter_title)
-                    if isinstance(toc[-1], Volume):
-                        toc[-1].add_chapter(current_chapter)
-
-            if token.type == "VOLUME":
-                volume_title = self.words_to_nums(
-                    token.value, len(str(stats.get("VOLUME")))
+            elif token.type == "VOLUME":
+                current_volume = self._process_volume_token(
+                    token, toc, stats, current_volume
                 )
-                if current_volume.title != volume_title:
-                    current_volume = Volume(title=volume_title)
-                    toc.append(current_volume)
-
-            if token.type == "CHAPTER":
-                chapter_title = self.words_to_nums(
-                    token.value, len(str(stats.get("CHAPTER")))
+            elif token.type == "CHAPTER":
+                current_chapter = self._process_chapter_token(
+                    token, toc, stats, current_chapter
                 )
-                if current_chapter.title != chapter_title:
-                    current_chapter = Chapter(title=chapter_title)
-
-                    if toc and isinstance(toc[-1], Volume):
-                        toc[-1].add_chapter(current_chapter)
-                    else:
-                        toc.append(current_chapter)
-
-            if token.type == "PARAGRAPH":
-                if toc:
-                    if isinstance(toc[-1], Volume):
-                        toc[-1].chapters[-1].add_paragraph(token.value)
-
-                    if isinstance(toc[-1], Chapter):
-                        toc[-1].add_paragraph(token.value)
+            elif token.type == "PARAGRAPH":
+                self._process_paragraph_token(token, toc)
 
         # Use authors if set explicitly from command line.
         if hasattr(self.config, "author") and self.config.author:
-            authors = self.config.author
+            book_data["authors"] = self.config.author
 
         if hasattr(self.config, "title") and self.config.title:
-            book_title = self.config.title
+            book_data["book_title"] = self.config.title
 
         if hasattr(self.config, "translator") and self.config.translator:
-            translators = self.config.translator
+            book_data["translators"] = self.config.translator
 
-        logger.info("Found or set book title: %s", book_title)
-        logger.info("Found or set authors: %s", repr(authors))
-        logger.info(
-            "Found or set translators: %s", repr(translators)
-        )
+        logger.info("Found or set book title: %s", book_data["book_title"])
+        logger.info("Found or set authors: %s", repr(book_data["authors"]))
+        logger.info(
+            "Found or set translators: %s", repr(book_data["translators"])
+        )
+        logger.info("Found or set tags: %s", repr(book_data["tags"]))
+        logger.info("Found or set index: %s", repr(book_data["index"]))
 
         if (
             hasattr(self.config, "sort_volume_and_chapter")
@@ -243,7 +313,14 @@ class Parser:
         ):
             self.sort_volume_and_chapter(toc)
 
-        return (book_title, authors, translators, tags, index, toc)
+        return (
+            book_data["book_title"],
+            book_data["authors"],
+            book_data["translators"],
+            book_data["tags"],
+            book_data["index"],
+            toc,
+        )
 
     def sort_volume_and_chapter(self, toc: List) -> None:
         """Sort by title of volumes and its chapters.
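
Net effect of the parser changes: the long chain of independent `if token.type == ...` blocks becomes a single `elif` ladder dispatching to one small handler per token kind, and five loose locals collapse into one `book_data` dict that is unpacked again at the return. A reduced, self-contained sketch of the dispatch shape, with a stand-in `Token`:

from typing import NamedTuple

class Token(NamedTuple):
    type: str
    value: str

def process_metadata_token(token: Token, book_data: dict) -> None:
    # Reduced version of Parser._process_metadata_token.
    if token.type == "TITLE":
        book_data["book_title"] = token.value
    elif token.type == "AUTHOR":
        book_data["authors"].append(token.value)

book_data = {"book_title": "", "authors": []}
for token in [Token("TITLE", "西游记"), Token("AUTHOR", "吴承恩")]:
    if token.type in ["TITLE", "AUTHOR"]:
        process_metadata_token(token, book_data)

print(book_data)  # {'book_title': '西游记', 'authors': ['吴承恩']}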

src/txt2ebook/subcommands/epub.py

@@ -19,6 +19,7 @@ import argparse
 import logging
 import sys
 
+from txt2ebook.exceptions import InputError
 from txt2ebook.formats import EPUB_TEMPLATES
 from txt2ebook.formats.epub import EpubWriter
 from txt2ebook.subcommands.parse import run as parse_txt
@@ -133,14 +134,15 @@ def run(args: argparse.Namespace) -> None:
         input_sources.append(sys.stdin)
     else:
         logger.error("No input files provided.")
-        return
+        raise InputError("No input files provided.")
 
     if len(input_sources) > 1 and args.output_file:
-        logger.error(
+        msg = (
             "Cannot specify a single output file when "
             "processing multiple input files."
         )
-        return
+        logger.error(msg)
+        raise InputError(msg)
 
     for i, current_input_stream in enumerate(input_sources):
         # ensures that `input_file` and `output_file` are correctly isolated
@@ -156,8 +158,8 @@ def run(args: argparse.Namespace) -> None:
         if i > 0 and args.output_file:
             current_file_args.output_file = None
 
-        book = parse_txt(current_file_args)
-        writer = EpubWriter(book, current_file_args)
+        book, langconf = parse_txt(current_file_args)
+        writer = EpubWriter(book, current_file_args, langconf)
         writer.write()
 
         # close the file stream if it was opened by argparse.FileType and is
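
Error handling for bad input changes from log-and-return to log-and-raise, using the new `InputError` added in `src/txt2ebook/exceptions.py` (its four-line hunk is not shown in this diff view). A self-contained sketch of the new guard; the stand-in exception class is an assumption about that unseen hunk:

import argparse
import sys

class InputError(Exception):
    """Stand-in for txt2ebook.exceptions.InputError."""

def run(args: argparse.Namespace) -> None:
    # Reduced version of the guard now shared by the epub/gmi/md/pdf/tex/typ
    # subcommands.
    if not args.input_file and sys.stdin.isatty():
        raise InputError("No input files provided.")

try:
    run(argparse.Namespace(input_file=None, output_file=None))
except InputError as error:
    sys.exit(str(error))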

src/txt2ebook/subcommands/gmi.py

@@ -19,6 +19,7 @@ import argparse
 import logging
 import sys
 
+from txt2ebook.exceptions import InputError
 from txt2ebook.formats.gmi import GmiWriter
 from txt2ebook.subcommands.parse import run as parse_txt
 
@@ -114,6 +115,41 @@ def run(args: argparse.Namespace) -> None:
     Returns:
         None
     """
-    book = parse_txt(args)
-    writer = GmiWriter(book, args)
-    writer.write()
+    input_sources = []
+
+    if args.input_file:
+        # File path(s) were explicitly provided on the command line
+        input_sources.append(args.input_file)
+    elif not sys.stdin.isatty():
+        # No file path provided, check for piped input
+        input_sources.append(sys.stdin)
+    else:
+        logger.error("No input files provided.")
+        raise InputError("No input files provided.")
+
+    if len(input_sources) > 1 and args.output_file:
+        msg = (
+            "Cannot specify a single output file when "
+            "processing multiple input files."
+        )
+        logger.error(msg)
+        raise InputError(msg)
+
+    for i, current_input_stream in enumerate(input_sources):
+        # ensures that `input_file` and `output_file` are correctly isolated
+        current_file_args = argparse.Namespace(**vars(args))
+        current_file_args.input_file = current_input_stream
+
+        # if an explicit output_file was provided, it must apply to the first
+        # input
+        if i > 0 and args.output_file:
+            current_file_args.output_file = None
+
+        book, langconf = parse_txt(current_file_args)
+        writer = GmiWriter(book, current_file_args, langconf)
+        writer.write()
+
+        # close the file stream if it was opened by argparse.FileType and is
+        # not sys.stdin.
+        if current_input_stream is not sys.stdin:
+            current_input_stream.close()
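
The gmi, md, and pdf subcommands gain the same input-handling loop the epub subcommand already had: explicit file arguments win, piped stdin is the fallback, and a fresh copy of the argument namespace per input keeps `input_file` and `output_file` isolated across iterations. The selection and isolation logic, as a standalone sketch:

import argparse
import sys

def resolve_input_sources(args: argparse.Namespace) -> list:
    # Mirrors the order in the diff: explicit paths first, then piped
    # stdin, otherwise error (InputError in the real code).
    input_sources = []
    if args.input_file:
        input_sources.append(args.input_file)
    elif not sys.stdin.isatty():
        input_sources.append(sys.stdin)
    else:
        raise ValueError("No input files provided.")
    return input_sources

args = argparse.Namespace(input_file="book.txt", output_file=None)
for source in resolve_input_sources(args):
    # Copy the namespace so per-file mutation cannot leak between inputs.
    current_file_args = argparse.Namespace(**vars(args))
    current_file_args.input_file = source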

src/txt2ebook/subcommands/md.py

@@ -19,6 +19,7 @@ import argparse
 import logging
 import sys
 
+from txt2ebook.exceptions import InputError
 from txt2ebook.formats.md import MdWriter as MarkdownWriter
 from txt2ebook.subcommands.parse import run as parse_txt
 
@@ -114,6 +115,41 @@ def run(args: argparse.Namespace) -> None:
     Returns:
         None
     """
-    book = parse_txt(args)
-    writer = MarkdownWriter(book, args)
-    writer.write()
+    input_sources = []
+
+    if args.input_file:
+        # File path(s) were explicitly provided on the command line
+        input_sources.append(args.input_file)
+    elif not sys.stdin.isatty():
+        # No file path provided, check for piped input
+        input_sources.append(sys.stdin)
+    else:
+        logger.error("No input files provided.")
+        raise InputError("No input files provided.")
+
+    if len(input_sources) > 1 and args.output_file:
+        msg = (
+            "Cannot specify a single output file when "
+            "processing multiple input files."
+        )
+        logger.error(msg)
+        raise InputError(msg)
+
+    for i, current_input_stream in enumerate(input_sources):
+        # ensures that `input_file` and `output_file` are correctly isolated
+        current_file_args = argparse.Namespace(**vars(args))
+        current_file_args.input_file = current_input_stream
+
+        # if an explicit output_file was provided, it must apply to the first
+        # input
+        if i > 0 and args.output_file:
+            current_file_args.output_file = None
+
+        book, langconf = parse_txt(current_file_args)
+        writer = MarkdownWriter(book, current_file_args, langconf)
+        writer.write()
+
+        # close the file stream if it was opened by argparse.FileType and is
+        # not sys.stdin.
+        if current_input_stream is not sys.stdin:
+            current_input_stream.close()

src/txt2ebook/subcommands/parse.py

@@ -19,6 +19,8 @@ import argparse
 import logging
 import sys
 from importlib import import_module
+from types import ModuleType
+from typing import Tuple
 
 import jieba.analyse
 from bs4 import UnicodeDammit
@@ -59,14 +61,15 @@ def build_subparser(subparsers) -> None:
     parse_parser.set_defaults(func=run)
 
 
-def run(args: argparse.Namespace) -> Book:
+def run(args: argparse.Namespace) -> Tuple[Book, ModuleType]:
     """Run env subcommand.
 
     Args:
         args (argparse.Namespace): Config from command line arguments
 
     Returns:
-        Book: The Book model.
+        Tuple[Book, ModuleType]: The Book model and the language
+        configuration module.
     """
     logger.info("Parsing txt file: %s", args.input_file.name)
 
@@ -94,4 +97,4 @@ def run(args: argparse.Namespace) -> Book:
     if args.debug:
         book.debug(args.verbose)
 
-    return book
+    return book, langconf
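
`parse.run` now returns a `(book, langconf)` pair instead of only the `Book`, which is what lets every writer above take the language module as a constructor argument. A reduced, self-contained sketch of the new contract; the dict and the hand-built module are stand-ins for `txt2ebook.models.Book` and a `txt2ebook.languages` module:

import argparse
from types import ModuleType
from typing import Tuple

def parse_txt(args: argparse.Namespace) -> Tuple[dict, ModuleType]:
    # Resolve the language module once, return it with the parsed result.
    langconf = ModuleType("zh_cn")
    langconf.HALFWIDTH_NUMS = "0123456789"  # as referenced in parser.py
    book = {"title": args.title, "language": args.language}
    return book, langconf

args = argparse.Namespace(title="demo", language="zh-cn")
book, langconf = parse_txt(args)  # writers then receive langconf injected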

src/txt2ebook/subcommands/pdf.py

@@ -19,6 +19,7 @@ import argparse
 import logging
 import sys
 
+from txt2ebook.exceptions import InputError
 from txt2ebook.formats import PAGE_SIZES
 from txt2ebook.formats.pdf import PdfWriter
 from txt2ebook.subcommands.parse import run as parse_txt
@@ -104,6 +105,41 @@ def run(args: argparse.Namespace) -> None:
     Returns:
         None
     """
-    book = parse_txt(args)
-    writer = PdfWriter(book, args)
-    writer.write()
+    input_sources = []
+
+    if args.input_file:
+        # File path(s) were explicitly provided on the command line
+        input_sources.append(args.input_file)
+    elif not sys.stdin.isatty():
+        # No file path provided, check for piped input
+        input_sources.append(sys.stdin)
+    else:
+        logger.error("No input files provided.")
+        raise InputError("No input files provided.")
+
+    if len(input_sources) > 1 and args.output_file:
+        msg = (
+            "Cannot specify a single output file when "
+            "processing multiple input files."
+        )
+        logger.error(msg)
+        raise InputError(msg)
+
+    for i, current_input_stream in enumerate(input_sources):
+        # ensures that `input_file` and `output_file` are correctly isolated
+        current_file_args = argparse.Namespace(**vars(args))
+        current_file_args.input_file = current_input_stream
+
+        # if an explicit output_file was provided, it must apply to the first
+        # input
+        if i > 0 and args.output_file:
+            current_file_args.output_file = None
+
+        book, langconf = parse_txt(current_file_args)
+        writer = PdfWriter(book, current_file_args, langconf)
+        writer.write()
+
+        # close the file stream if it was opened by argparse.FileType and is
+        # not sys.stdin.
+        if current_input_stream is not sys.stdin:
+            current_input_stream.close()

src/txt2ebook/subcommands/tex.py

@@ -19,6 +19,7 @@ import argparse
 import logging
 import sys
 
+from txt2ebook.exceptions import InputError
 from txt2ebook.formats.tex import TexWriter
 from txt2ebook.subcommands.parse import run as parse_txt
 
@@ -122,14 +123,15 @@ def run(args: argparse.Namespace) -> None:
         input_sources.extend(args.input_file)
     else:
         logger.error("No input files provided.")
-        return
+        raise InputError("No input files provided.")
 
     if len(input_sources) > 1 and args.output_file:
-        logger.error(
+        msg = (
            "Cannot specify a single output file when "
            "processing multiple input files."
         )
-        return
+        logger.error(msg)
+        raise InputError(msg)
 
     for i, current_input_stream in enumerate(input_sources):
         # ensures that `input_file` and `output_file` are correctly isolated
@@ -141,8 +143,8 @@ def run(args: argparse.Namespace) -> None:
         if i > 0 and args.output_file:
             current_file_args.output_file = None
 
-        book = parse_txt(current_file_args)
-        writer = TexWriter(book, current_file_args)
+        book, langconf = parse_txt(current_file_args)
+        writer = TexWriter(book, current_file_args, langconf)
         writer.write()
 
         # close the file stream if it was opened by argparse.FileType and is

src/txt2ebook/subcommands/typ.py

@@ -13,16 +13,22 @@
 # You should have received a copy of the GNU Affero General Public License
 # along with this program. If not, see <https://www.gnu.org/licenses/>.
 
-"""typ subcommand."""
-
 import argparse
+
 import logging
+
 import sys
 
+
+from txt2ebook.exceptions import InputError
+
 from txt2ebook.formats import PAGE_SIZES
+
 from txt2ebook.formats.typ import TypWriter
+
 from txt2ebook.subcommands.parse import run as parse_txt
 
+
 logger = logging.getLogger(__name__)
 
 
@@ -124,46 +130,70 @@ def build_subparser(subparsers) -> None:
 def run(args: argparse.Namespace) -> None:
     """Run typ subcommand.
 
+
     Args:
+
         args (argparse.Namespace): Config from command line arguments
 
+
     Returns:
+
         None
+
     """
+
     input_sources = []
 
     if not sys.stdin.isatty():
         # piped input, use stdin as the single input source
+
         input_sources.append(sys.stdin)
+
     elif args.input_file:
         # multiple file(s)
+
         input_sources.extend(args.input_file)
+
     else:
         logger.error("No input files provided.")
-        return
+
+        raise InputError("No input files provided.")
 
     if len(input_sources) > 1 and args.output_file:
-        logger.error(
+        msg = (
            "Cannot specify a single output file when "
            "processing multiple input files."
         )
-        return
+
+        logger.error(msg)
+
+        raise InputError(msg)
 
     for i, current_input_stream in enumerate(input_sources):
         # ensures that `input_file` and `output_file` are correctly isolated
+
         current_file_args = argparse.Namespace(**vars(args))
+
         current_file_args.input_file = current_input_stream
 
         # if an explicit output_file was provided, it must apply to the first
+
         # input
+
         if i > 0 and args.output_file:
             current_file_args.output_file = None
 
-        book = parse_txt(current_file_args)
-        writer = TypWriter(book, current_file_args)
+        book, langconf = parse_txt(current_file_args)
+
+        writer = TypWriter(book, current_file_args, langconf)
+
         writer.write()
 
         # close the file stream if it was opened by argparse.FileType and is
+
         # not sys.stdin.
+
         if current_input_stream is not sys.stdin:
             current_input_stream.close()

src/txt2ebook/tokenizer.py

@@ -20,7 +20,7 @@ import logging
 import re
 from collections import Counter
 from dataclasses import dataclass, field
-from importlib import import_module
+from types import ModuleType
 from typing import Any, Dict, List
 
 from txt2ebook import log_or_raise_on_warning
@@ -55,17 +55,21 @@ class Tokenizer:
     raw_content: str = field(repr=False)
     metadata_marker: str = field(repr=False)
     config: argparse.Namespace = field(repr=False)
+    langconf: ModuleType = field(repr=False)
     tokens: List[Token] = field(default_factory=List, repr=False)
     lineno_lookup: Dict = field(default_factory=Dict, repr=False)
 
-    def __init__(self, raw_content: str, config: argparse.Namespace) -> None:
+    def __init__(
+        self,
+        raw_content: str,
+        config: argparse.Namespace,
+        langconf: ModuleType,
+    ) -> None:
         """Set the constructor for the Tokenizer."""
         self.raw_content = raw_content
         self.config = config
         self.metadata_marker = "---"
-
-        config_lang = config.language.replace("-", "_")
-        self.langconf = import_module(f"txt2ebook.languages.{config_lang}")
+        self.langconf = langconf
 
         lookupcontent = raw_content[:]
         lineno_lookup = {}
@@ -184,7 +188,8 @@ class Tokenizer:
         else:
             # No metadata block found according to the pattern,
             # so assume all raw_content is the actual content.
-            # _extract_metadata would have already logged/warned if metadata was expected.
+            # _extract_metadata would have already logged/warned if metadata
+            # was expected.
             content_str = self.raw_content
 
         content_str = content_str.strip(self.config.paragraph_separator)

{txt2ebook-0.1.159 → txt2ebook-0.1.161/src/txt2ebook.egg-info}/PKG-INFO

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: txt2ebook
-Version: 0.1.159
+Version: 0.1.161
 Summary: CLI tool to convert txt file to ebook format
 Author-email: Kian-Meng Ang <kianmeng@cpan.org>
 License-Expression: AGPL-3.0-or-later
@@ -13,17 +13,17 @@ Classifier: Natural Language :: Chinese (Simplified)
 Classifier: Natural Language :: Chinese (Traditional)
 Classifier: Programming Language :: Python
 Classifier: Programming Language :: Python :: 3 :: Only
-Classifier: Programming Language :: Python :: 3.9
 Classifier: Programming Language :: Python :: 3.10
 Classifier: Programming Language :: Python :: 3.11
 Classifier: Programming Language :: Python :: 3.12
 Classifier: Programming Language :: Python :: 3.13
+Classifier: Programming Language :: Python :: 3.14
 Classifier: Topic :: Text Processing
 Classifier: Topic :: Text Processing :: Filters
 Classifier: Topic :: Text Processing :: General
 Classifier: Topic :: Text Processing :: Markup :: HTML
 Classifier: Topic :: Text Processing :: Markup :: Markdown
-Requires-Python: >=3.9
+Requires-Python: >=3.10
 Description-Content-Type: text/markdown
 License-File: LICENSE.md
 Requires-Dist: CJKwrap~=2.2