PyPI - novel-downloader - Versions diffs - 1.5.0__py3-none-any.whl → 2.0.1__py3-none-any.whl - Mend

novel-downloader 1.5.0__py3-none-any.whl → 2.0.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (248)

novel_downloader/__init__.py +1 -1
novel_downloader/cli/__init__.py +1 -3
novel_downloader/cli/clean.py +21 -88
novel_downloader/cli/config.py +26 -21
novel_downloader/cli/download.py +79 -66
novel_downloader/cli/export.py +17 -21
novel_downloader/cli/main.py +1 -1
novel_downloader/cli/search.py +62 -65
novel_downloader/cli/ui.py +156 -0
novel_downloader/config/__init__.py +8 -5
novel_downloader/config/adapter.py +206 -209
novel_downloader/config/{loader.py → file_io.py} +53 -26
novel_downloader/core/__init__.py +5 -5
novel_downloader/core/archived/deqixs/fetcher.py +115 -0
novel_downloader/core/archived/deqixs/parser.py +132 -0
novel_downloader/core/archived/deqixs/searcher.py +89 -0
novel_downloader/core/{searchers/qidian.py → archived/qidian/searcher.py} +12 -20
novel_downloader/core/archived/wanbengo/searcher.py +98 -0
novel_downloader/core/archived/xshbook/searcher.py +93 -0
novel_downloader/core/downloaders/__init__.py +3 -24
novel_downloader/core/downloaders/base.py +49 -23
novel_downloader/core/downloaders/common.py +191 -137
novel_downloader/core/downloaders/qianbi.py +187 -146
novel_downloader/core/downloaders/qidian.py +187 -141
novel_downloader/core/downloaders/registry.py +4 -2
novel_downloader/core/downloaders/signals.py +46 -0
novel_downloader/core/exporters/__init__.py +3 -20
novel_downloader/core/exporters/base.py +33 -37
novel_downloader/core/exporters/common/__init__.py +1 -2
novel_downloader/core/exporters/common/epub.py +15 -10
novel_downloader/core/exporters/common/main_exporter.py +19 -12
novel_downloader/core/exporters/common/txt.py +17 -12
novel_downloader/core/exporters/epub_util.py +59 -29
novel_downloader/core/exporters/linovelib/__init__.py +1 -0
novel_downloader/core/exporters/linovelib/epub.py +23 -25
novel_downloader/core/exporters/linovelib/main_exporter.py +8 -12
novel_downloader/core/exporters/linovelib/txt.py +20 -14
novel_downloader/core/exporters/qidian.py +2 -8
novel_downloader/core/exporters/registry.py +4 -2
novel_downloader/core/exporters/txt_util.py +7 -7
novel_downloader/core/fetchers/__init__.py +54 -48
novel_downloader/core/fetchers/aaatxt.py +83 -0
novel_downloader/core/fetchers/{biquge/session.py → b520.py} +6 -11
novel_downloader/core/fetchers/{base/session.py → base.py} +37 -46
novel_downloader/core/fetchers/{biquge/browser.py → biquyuedu.py} +12 -17
novel_downloader/core/fetchers/dxmwx.py +110 -0
novel_downloader/core/fetchers/eightnovel.py +139 -0
novel_downloader/core/fetchers/{esjzone/session.py → esjzone.py} +19 -12
novel_downloader/core/fetchers/guidaye.py +85 -0
novel_downloader/core/fetchers/hetushu.py +92 -0
novel_downloader/core/fetchers/{qianbi/browser.py → i25zw.py} +19 -28
novel_downloader/core/fetchers/ixdzs8.py +113 -0
novel_downloader/core/fetchers/jpxs123.py +101 -0
novel_downloader/core/fetchers/lewenn.py +83 -0
novel_downloader/core/fetchers/{linovelib/session.py → linovelib.py} +12 -13
novel_downloader/core/fetchers/piaotia.py +105 -0
novel_downloader/core/fetchers/qbtr.py +101 -0
novel_downloader/core/fetchers/{qianbi/session.py → qianbi.py} +5 -10
novel_downloader/core/fetchers/{qidian/session.py → qidian.py} +56 -64
novel_downloader/core/fetchers/quanben5.py +92 -0
novel_downloader/core/fetchers/{base/rate_limiter.py → rate_limiter.py} +2 -2
novel_downloader/core/fetchers/registry.py +5 -16
novel_downloader/core/fetchers/{sfacg/session.py → sfacg.py} +7 -10
novel_downloader/core/fetchers/shencou.py +106 -0
novel_downloader/core/fetchers/shuhaige.py +84 -0
novel_downloader/core/fetchers/tongrenquan.py +84 -0
novel_downloader/core/fetchers/ttkan.py +95 -0
novel_downloader/core/fetchers/wanbengo.py +83 -0
novel_downloader/core/fetchers/xiaoshuowu.py +106 -0
novel_downloader/core/fetchers/xiguashuwu.py +177 -0
novel_downloader/core/fetchers/xs63b.py +171 -0
novel_downloader/core/fetchers/xshbook.py +85 -0
novel_downloader/core/fetchers/{yamibo/session.py → yamibo.py} +19 -12
novel_downloader/core/fetchers/yibige.py +114 -0
novel_downloader/core/interfaces/__init__.py +1 -9
novel_downloader/core/interfaces/downloader.py +6 -2
novel_downloader/core/interfaces/exporter.py +7 -7
novel_downloader/core/interfaces/fetcher.py +6 -19
novel_downloader/core/interfaces/parser.py +7 -8
novel_downloader/core/interfaces/searcher.py +9 -1
novel_downloader/core/parsers/__init__.py +49 -12
novel_downloader/core/parsers/aaatxt.py +132 -0
novel_downloader/core/parsers/b520.py +116 -0
novel_downloader/core/parsers/base.py +64 -12
novel_downloader/core/parsers/biquyuedu.py +133 -0
novel_downloader/core/parsers/dxmwx.py +162 -0
novel_downloader/core/parsers/eightnovel.py +224 -0
novel_downloader/core/parsers/esjzone.py +64 -69
novel_downloader/core/parsers/guidaye.py +128 -0
novel_downloader/core/parsers/hetushu.py +139 -0
novel_downloader/core/parsers/i25zw.py +137 -0
novel_downloader/core/parsers/ixdzs8.py +186 -0
novel_downloader/core/parsers/jpxs123.py +137 -0
novel_downloader/core/parsers/lewenn.py +142 -0
novel_downloader/core/parsers/linovelib.py +48 -64
novel_downloader/core/parsers/piaotia.py +189 -0
novel_downloader/core/parsers/qbtr.py +136 -0
novel_downloader/core/parsers/qianbi.py +48 -50
novel_downloader/core/parsers/qidian/main_parser.py +756 -48
novel_downloader/core/parsers/qidian/utils/__init__.py +3 -21
novel_downloader/core/parsers/qidian/utils/decryptor_fetcher.py +1 -1
novel_downloader/core/parsers/qidian/utils/node_decryptor.py +4 -4
novel_downloader/core/parsers/quanben5.py +103 -0
novel_downloader/core/parsers/registry.py +5 -16
novel_downloader/core/parsers/sfacg.py +38 -45
novel_downloader/core/parsers/shencou.py +215 -0
novel_downloader/core/parsers/shuhaige.py +111 -0
novel_downloader/core/parsers/tongrenquan.py +116 -0
novel_downloader/core/parsers/ttkan.py +132 -0
novel_downloader/core/parsers/wanbengo.py +191 -0
novel_downloader/core/parsers/xiaoshuowu.py +173 -0
novel_downloader/core/parsers/xiguashuwu.py +429 -0
novel_downloader/core/parsers/xs63b.py +161 -0
novel_downloader/core/parsers/xshbook.py +134 -0
novel_downloader/core/parsers/yamibo.py +87 -131
novel_downloader/core/parsers/yibige.py +166 -0
novel_downloader/core/searchers/__init__.py +34 -3
novel_downloader/core/searchers/aaatxt.py +107 -0
novel_downloader/core/searchers/{biquge.py → b520.py} +29 -28
novel_downloader/core/searchers/base.py +112 -36
novel_downloader/core/searchers/dxmwx.py +105 -0
novel_downloader/core/searchers/eightnovel.py +84 -0
novel_downloader/core/searchers/esjzone.py +43 -25
novel_downloader/core/searchers/hetushu.py +92 -0
novel_downloader/core/searchers/i25zw.py +93 -0
novel_downloader/core/searchers/ixdzs8.py +107 -0
novel_downloader/core/searchers/jpxs123.py +107 -0
novel_downloader/core/searchers/piaotia.py +100 -0
novel_downloader/core/searchers/qbtr.py +106 -0
novel_downloader/core/searchers/qianbi.py +74 -40
novel_downloader/core/searchers/quanben5.py +144 -0
novel_downloader/core/searchers/registry.py +24 -8
novel_downloader/core/searchers/shuhaige.py +124 -0
novel_downloader/core/searchers/tongrenquan.py +110 -0
novel_downloader/core/searchers/ttkan.py +92 -0
novel_downloader/core/searchers/xiaoshuowu.py +122 -0
novel_downloader/core/searchers/xiguashuwu.py +95 -0
novel_downloader/core/searchers/xs63b.py +104 -0
novel_downloader/locales/en.json +34 -85
novel_downloader/locales/zh.json +35 -86
novel_downloader/models/__init__.py +21 -22
novel_downloader/models/book.py +44 -0
novel_downloader/models/config.py +4 -37
novel_downloader/models/login.py +1 -1
novel_downloader/models/search.py +5 -0
novel_downloader/resources/config/settings.toml +8 -70
novel_downloader/resources/json/xiguashuwu.json +718 -0
novel_downloader/utils/__init__.py +13 -24
novel_downloader/utils/chapter_storage.py +5 -5
novel_downloader/utils/constants.py +4 -31
novel_downloader/utils/cookies.py +38 -35
novel_downloader/utils/crypto_utils/__init__.py +7 -0
novel_downloader/utils/crypto_utils/aes_util.py +90 -0
novel_downloader/utils/crypto_utils/aes_v1.py +619 -0
novel_downloader/utils/crypto_utils/aes_v2.py +1143 -0
novel_downloader/utils/crypto_utils/rc4.py +54 -0
novel_downloader/utils/epub/__init__.py +3 -4
novel_downloader/utils/epub/builder.py +6 -6
novel_downloader/utils/epub/constants.py +62 -21
novel_downloader/utils/epub/documents.py +95 -201
novel_downloader/utils/epub/models.py +8 -22
novel_downloader/utils/epub/utils.py +73 -106
novel_downloader/utils/file_utils/__init__.py +2 -23
novel_downloader/utils/file_utils/io.py +53 -188
novel_downloader/utils/file_utils/normalize.py +1 -7
novel_downloader/utils/file_utils/sanitize.py +4 -15
novel_downloader/utils/fontocr/__init__.py +5 -14
novel_downloader/utils/fontocr/core.py +216 -0
novel_downloader/utils/fontocr/loader.py +50 -0
novel_downloader/utils/logger.py +81 -65
novel_downloader/utils/network.py +17 -41
novel_downloader/utils/state.py +4 -90
novel_downloader/utils/text_utils/__init__.py +1 -7
novel_downloader/utils/text_utils/diff_display.py +5 -7
novel_downloader/utils/text_utils/text_cleaner.py +39 -30
novel_downloader/utils/text_utils/truncate_utils.py +3 -14
novel_downloader/utils/time_utils/__init__.py +5 -11
novel_downloader/utils/time_utils/datetime_utils.py +20 -29
novel_downloader/utils/time_utils/sleep_utils.py +55 -49
novel_downloader/web/__init__.py +13 -0
novel_downloader/web/components/__init__.py +11 -0
novel_downloader/web/components/navigation.py +35 -0
novel_downloader/web/main.py +66 -0
novel_downloader/web/pages/__init__.py +17 -0
novel_downloader/web/pages/download.py +78 -0
novel_downloader/web/pages/progress.py +147 -0
novel_downloader/web/pages/search.py +329 -0
novel_downloader/web/services/__init__.py +17 -0
novel_downloader/web/services/client_dialog.py +164 -0
novel_downloader/web/services/cred_broker.py +113 -0
novel_downloader/web/services/cred_models.py +35 -0
novel_downloader/web/services/task_manager.py +264 -0
novel_downloader-2.0.1.dist-info/METADATA +172 -0
novel_downloader-2.0.1.dist-info/RECORD +206 -0
{novel_downloader-1.5.0.dist-info → novel_downloader-2.0.1.dist-info}/entry_points.txt +1 -1
novel_downloader/core/downloaders/biquge.py +0 -29
novel_downloader/core/downloaders/esjzone.py +0 -29
novel_downloader/core/downloaders/linovelib.py +0 -29
novel_downloader/core/downloaders/sfacg.py +0 -29
novel_downloader/core/downloaders/yamibo.py +0 -29
novel_downloader/core/exporters/biquge.py +0 -22
novel_downloader/core/exporters/esjzone.py +0 -22
novel_downloader/core/exporters/qianbi.py +0 -22
novel_downloader/core/exporters/sfacg.py +0 -22
novel_downloader/core/exporters/yamibo.py +0 -22
novel_downloader/core/fetchers/base/__init__.py +0 -14
novel_downloader/core/fetchers/base/browser.py +0 -422
novel_downloader/core/fetchers/biquge/__init__.py +0 -14
novel_downloader/core/fetchers/esjzone/__init__.py +0 -14
novel_downloader/core/fetchers/esjzone/browser.py +0 -209
novel_downloader/core/fetchers/linovelib/__init__.py +0 -14
novel_downloader/core/fetchers/linovelib/browser.py +0 -198
novel_downloader/core/fetchers/qianbi/__init__.py +0 -14
novel_downloader/core/fetchers/qidian/__init__.py +0 -14
novel_downloader/core/fetchers/qidian/browser.py +0 -326
novel_downloader/core/fetchers/sfacg/__init__.py +0 -14
novel_downloader/core/fetchers/sfacg/browser.py +0 -194
novel_downloader/core/fetchers/yamibo/__init__.py +0 -14
novel_downloader/core/fetchers/yamibo/browser.py +0 -234
novel_downloader/core/parsers/biquge.py +0 -139
novel_downloader/core/parsers/qidian/book_info_parser.py +0 -90
novel_downloader/core/parsers/qidian/chapter_encrypted.py +0 -528
novel_downloader/core/parsers/qidian/chapter_normal.py +0 -157
novel_downloader/core/parsers/qidian/chapter_router.py +0 -68
novel_downloader/core/parsers/qidian/utils/helpers.py +0 -114
novel_downloader/models/chapter.py +0 -25
novel_downloader/models/types.py +0 -13
novel_downloader/tui/__init__.py +0 -7
novel_downloader/tui/app.py +0 -32
novel_downloader/tui/main.py +0 -17
novel_downloader/tui/screens/__init__.py +0 -14
novel_downloader/tui/screens/home.py +0 -198
novel_downloader/tui/screens/login.py +0 -74
novel_downloader/tui/styles/home_layout.tcss +0 -79
novel_downloader/tui/widgets/richlog_handler.py +0 -24
novel_downloader/utils/cache.py +0 -24
novel_downloader/utils/crypto_utils.py +0 -71
novel_downloader/utils/fontocr/hash_store.py +0 -280
novel_downloader/utils/fontocr/hash_utils.py +0 -103
novel_downloader/utils/fontocr/model_loader.py +0 -69
novel_downloader/utils/fontocr/ocr_v1.py +0 -315
novel_downloader/utils/fontocr/ocr_v2.py +0 -764
novel_downloader/utils/fontocr/ocr_v3.py +0 -744
novel_downloader-1.5.0.dist-info/METADATA +0 -196
novel_downloader-1.5.0.dist-info/RECORD +0 -164
{novel_downloader-1.5.0.dist-info → novel_downloader-2.0.1.dist-info}/WHEEL +0 -0
{novel_downloader-1.5.0.dist-info → novel_downloader-2.0.1.dist-info}/licenses/LICENSE +0 -0
{novel_downloader-1.5.0.dist-info → novel_downloader-2.0.1.dist-info}/top_level.txt +0 -0

novel_downloader/utils/epub/utils.py CHANGED Viewed

@@ -4,20 +4,18 @@ novel_downloader.utils.epub.utils
 ---------------------------------
 Pure utility functions for EPUB assembly, including:
-- Computing file hashes
-- Generating META-INF/container.xml
-- Constructing HTML snippets for the book intro and volume intro
+  * Computing file hashes
+  * Generating META-INF/container.xml
+  * Constructing HTML snippets for the book intro and volume intro
 """
 import hashlib
+from html import escape
 from pathlib import Path
-from lxml import etree, html
 from .constants import (
     CONTAINER_TEMPLATE,
     IMAGE_FOLDER,
-    PRETTY_PRINT_FLAG,
     ROOT_PATH,
 )
@@ -61,48 +59,49 @@ def build_book_intro(
     Build the HTML snippet for the overall book introduction.
     This includes:
-      - A main heading ("Book Introduction")
-      - A list of metadata items (title, author, categories, word count, status)
-      - A "Summary" subheading and one or more paragraphs of summary text
+      * A main heading ("Book Introduction")
+      * A list of metadata items (title, author, categories, word count, status)
+      * A "Summary" subheading and one or more paragraphs of summary text
     :return: A HTML string for inclusion in `intro.xhtml`
     """
-    root = html.Element("div")
-    # Main heading
-    h1 = etree.SubElement(root, "h1")
-    h1.text = "书籍简介"
-    # Metadata list
-    info_div = etree.SubElement(root, "div", {"class": "intro-info"})
-    ul = etree.SubElement(info_div, "ul")
-    _add_li(ul, "书名", f"《{book_name}》" if book_name else "")
-    _add_li(ul, "作者", author)
-    _add_li(ul, "分类", ", ".join(subject) if subject else "")
-    _add_li(ul, "字数", word_count)
-    _add_li(ul, "状态", serial_status)
-    # Summary section
-    if summary:
-        # force page break before summary
-        etree.SubElement(root, "p", {"class": "new-page-after"})
-        h2 = etree.SubElement(root, "h2")
-        h2.text = "简介"
+    lines = []
+    lines.append("<div>")
+    lines.append("<h1>书籍简介</h1>")
+    lines.append('<div class="intro-info">')
+    lines.append("<ul>")
+    name_val = f"《{book_name}》" if book_name else ""
+    subj_val = ", ".join(subject) if subject else ""
+    li_lines = [
+        _li_line("书名", name_val),
+        _li_line("作者", author),
+        _li_line("分类", subj_val),
+        _li_line("字数", word_count),
+        _li_line("状态", serial_status),
+    ]
+    for li in li_lines:
+        if li:
+            lines.append(li)
+    lines.append("</ul>")
+    lines.append("</div>")
-        summary_div = etree.SubElement(root, "div", {"class": "intro-summary"})
+    if summary:
+        lines.append('<p class="new-page-after"></p>')
+        lines.append("<h2>简介</h2>")
+        lines.append('<div class="intro-summary">')
         for line in summary.splitlines():
-            line = line.strip()
-            if not line:
+            s = line.strip()
+            if not s:
                 continue
-            p = etree.SubElement(summary_div, "p")
-            p.text = line
+            lines.append(f"<p>{escape(s, quote=True)}</p>")
+        lines.append("</div>")
-    html_string: str = html.tostring(
-        root,
-        pretty_print=PRETTY_PRINT_FLAG,
-        encoding="unicode",
-    )
-    return html_string
+    lines.append("</div>")
+    return "\n".join(lines)
 def build_volume_intro(
@@ -113,86 +112,54 @@ def build_volume_intro(
     Build the HTML snippet for a single-volume introduction.
     This includes:
-      - A decorative border image (top and bottom)
-      - A primary heading (volume main title)
-      - An optional secondary line (subtitle)
-      - One or more paragraphs of intro text
+      * A decorative border image (top and bottom)
+      * A primary heading (volume main title)
+      * An optional secondary line (subtitle)
+      * One or more paragraphs of intro text
     :param volume_title: e.g. "Volume 1 - The Beginning"
     :param volume_intro_text: multiline intro text for this volume
     :return: A HTML string for inclusion in `vol_<n>.xhtml`
     """
-    root = html.Element("div")
-    # Break the title into two lines if possible
     line1, line2 = _split_volume_title(volume_title)
-    header = etree.SubElement(root, "div", {"class": "vol-header"})
-    # Top decorative border
-    header.append(_make_vol_border_img(flip=False))
-    # Main title
-    h1 = etree.SubElement(header, "h1", {"class": "vol-title-main"})
-    h1.text = line1
-    # Bottom decorative border (flipped)
-    header.append(_make_vol_border_img(flip=True))
-    # Subtitle (if any)
+    lines = []
+    lines.append("<div>")
+    lines.append('<div class="vol-header">')
+    lines.append(_vol_border_div_str(flip=False))
+    lines.append(f'<h1 class="vol-title-main">{escape(line1, quote=True)}</h1>')
+    lines.append(_vol_border_div_str(flip=True))
     if line2:
-        h2 = etree.SubElement(header, "h2", {"class": "vol-title-sub"})
-        h2.text = line2
+        lines.append(f'<h2 class="vol-title-sub">{escape(line2, quote=True)}</h2>')
+    lines.append("</div>")
-    # Intro text paragraphs
     if volume_intro_text:
-        etree.SubElement(root, "p", {"class": "new-page-after"})
-        vol_div = etree.SubElement(root, "div", {"class": "vol-intro-text"})
+        lines.append('<p class="new-page-after"></p>')
+        lines.append('<div class="vol-intro-text">')
         for line in volume_intro_text.splitlines():
-            line = line.strip()
-            if not line:
+            s = line.strip()
+            if not s:
                 continue
-            p = etree.SubElement(vol_div, "p")
-            p.text = line
+            lines.append(f"<p>{escape(s, quote=True)}</p>")
+        lines.append("</div>")
-    html_string: str = html.tostring(
-        root,
-        pretty_print=PRETTY_PRINT_FLAG,
-        encoding="unicode",
-    )
-    return html_string
+    lines.append("</div>")
+    return "\n".join(lines)
-def _add_li(ul: etree._Element, label: str, value: str) -> None:
-    """
-    Append a `<li>` with 'label: value' if value is nonempty.
-    """
-    if value:
-        li = etree.SubElement(ul, "li")
-        li.text = f"{label}: {value}"
+def _li_line(label: str, value: str) -> str:
+    if not value:
+        return ""
+    return f"<li>{escape(label, quote=True)}: {escape(value, quote=True)}</li>"
-def _make_vol_border_img(flip: bool = False) -> html.HtmlElement:
-    """
-    Return a `<div>` containing the `volume_border.png` image,
-    styled by the given class name.
-    """
-    classes = ["vol-border"]
-    if flip:
-        classes.append("flip")
-    cls = " ".join(classes)
-    div = html.Element("div", {"class": cls})
-    etree.SubElement(
-        div,
-        "img",
-        {
-            "src": f"../{IMAGE_FOLDER}/volume_border.png",
-            "alt": "",
-        },
+def _vol_border_div_str(flip: bool = False) -> str:
+    classes = "vol-border" + (" flip" if flip else "")
+    return (
+        f'<div class="{classes}">'
+        f'<img src="../{IMAGE_FOLDER}/volume_border.png" alt="">'
+        f"</div>"
     )
-    return div
 def _split_volume_title(volume_title: str) -> tuple[str, str]:
@@ -202,10 +169,10 @@ def _split_volume_title(volume_title: str) -> tuple[str, str]:
     :param volume_title: Original volume title string.
     :return: Tuple of (line1, line2)
     """
-    if " " in volume_title:
-        parts = volume_title.split(" ", 1)
-    elif "-" in volume_title:
+    if "-" in volume_title:
         parts = volume_title.split("-", 1)
+    elif " " in volume_title:
+        parts = volume_title.split(" ", 1)
     else:
         return volume_title, ""

novel_downloader/utils/file_utils/__init__.py CHANGED Viewed

@@ -4,35 +4,14 @@ novel_downloader.utils.file_utils
 ---------------------------------
 High-level file I/O utility re-exports for convenience.
-This module aggregates commonly used low-level file utilities such as:
-- Path sanitization (for safe filenames)
-- Text normalization (e.g. Windows/Linux line endings)
-- JSON, plain text, and binary file reading/writing
-Included utilities:
-- sanitize_filename: remove invalid characters from filenames
-- normalize_txt_line_endings: standardize line endings in text files
-- save_as_json / save_as_txt: write dict or text to file
-- read_text_file / read_json_file / read_binary_file: load content from file
 """
 __all__ = [
     "sanitize_filename",
-    "save_as_json",
-    "save_as_txt",
-    "read_text_file",
-    "read_json_file",
-    "read_binary_file",
+    "write_file",
     "normalize_txt_line_endings",
 ]
-from .io import (
-    read_binary_file,
-    read_json_file,
-    read_text_file,
-    save_as_json,
-    save_as_txt,
-)
+from .io import write_file
 from .normalize import normalize_txt_line_endings
 from .sanitize import sanitize_filename

novel_downloader/utils/file_utils/io.py CHANGED Viewed

@@ -3,214 +3,79 @@
 novel_downloader.utils.file_utils.io
 ------------------------------------
-File I/O utilities for reading and writing text, JSON, and binary data.
-Includes:
-- Safe, atomic file saving with optional overwrite and auto-renaming
-- JSON pretty-printing with size-aware formatting
-- Simple helpers for reading files with fallback and logging
+File I/O utilities for reading and writing data.
 """
-__all__ = [
-    "save_as_txt",
-    "save_as_json",
-    "read_text_file",
-    "read_json_file",
-    "read_binary_file",
-]
+__all__ = ["write_file"]
-import json
-import logging
 import tempfile
 from pathlib import Path
-from typing import Any, Literal
+from typing import Literal
 from .sanitize import sanitize_filename
-logger = logging.getLogger(__name__)
-_JSON_INDENT_THRESHOLD = 50 * 1024  # bytes
-def _get_non_conflicting_path(path: Path) -> Path:
-    """
-    If the path exists, generate a new one by appending _1, _2, etc.
-    """
-    counter = 1
-    new_path = path
-    while new_path.exists():
-        stem = path.stem
-        suffix = path.suffix
-        new_path = path.with_name(f"{stem}_{counter}{suffix}")
-        counter += 1
-    return new_path
-def _write_file(
-    content: str | bytes | dict[Any, Any] | list[Any] | Any,
-    filepath: str | Path,
-    write_mode: str = "w",
-    *,
-    on_exist: Literal["overwrite", "skip", "rename"] = "overwrite",
-    dump_json: bool = False,
-    encoding: str = "utf-8",
-) -> Path | None:
-    """
-    Write content to a file safely with optional atomic behavior
-    and JSON serialization.
-    :param content: The content to write; can be text, bytes, or a
-        JSON-serializable object.
-    :param filepath: Destination path (str or Path).
-    :param mode: File mode ('w', 'wb'). Auto-determined if None.
-    :param on_exist: Behavior if file exists: 'overwrite', 'skip',
-        or 'rename'.
-    :param dump_json: If True, serialize content as JSON.
-    :param encoding: Text encoding for writing.
-    :return: Path if writing succeeds, None otherwise.
-    """
-    path = Path(filepath)
-    path = path.with_name(sanitize_filename(path.name))
-    path.parent.mkdir(parents=True, exist_ok=True)
-    if path.exists():
-        if on_exist == "skip":
-            logger.debug("[file] '%s' exists, skipping", path)
-            return path
-        if on_exist == "rename":
-            path = _get_non_conflicting_path(path)
-            logger.debug("[file] Renaming target to avoid conflict: %s", path)
-        else:
-            logger.debug("[file] '%s' exists, will overwrite", path)
-    # Prepare content and write mode
-    content_to_write: str | bytes
-    if dump_json:
-        # Serialize original object to JSON string
-        json_str = json.dumps(content, ensure_ascii=False, indent=2)
-        if len(json_str.encode(encoding)) > _JSON_INDENT_THRESHOLD:
-            json_str = json.dumps(content, ensure_ascii=False, separators=(",", ":"))
-        content_to_write = json_str
-        write_mode = "w"
-    else:
-        if isinstance(content, (str | bytes)):
-            content_to_write = content
-        else:
-            raise TypeError("Non-JSON content must be str or bytes.")
-        write_mode = "wb" if isinstance(content, bytes) else "w"
-    try:
-        with tempfile.NamedTemporaryFile(
-            mode=write_mode,
-            encoding=None if "b" in write_mode else encoding,
-            newline=None if "b" in write_mode else "\n",
-            delete=False,
-            dir=path.parent,
-        ) as tmp:
-            tmp.write(content_to_write)
-            tmp_path = Path(tmp.name)
-        tmp_path.replace(path)
-        logger.debug("[file] '%s' written successfully", path)
-        return path
-    except Exception as exc:
-        logger.warning("[file] Error writing %r: %s", path, exc)
-        return None
-def save_as_txt(
-    content: str,
-    filepath: str | Path,
-    *,
-    encoding: str = "utf-8",
-    on_exist: Literal["overwrite", "skip", "rename"] = "overwrite",
-) -> Path | None:
+def _unique_path(path: Path, max_tries: int = 100) -> Path:
     """
-    Save plain text content to the given file path.
+    Return a unique file path by appending _1, _2, ... if needed.
-    :param content: Text content to write.
-    :param filepath: Destination file path.
-    :param encoding: Text encoding to use (default: 'utf-8').
-    :param on_exist: How to handle existing files: 'overwrite', 'skip', or 'rename'.
-    :return: Path if writing succeeds, None otherwise.
+    Falls back to a UUID suffix if all attempts fail.
     """
-    return _write_file(
-        content=content,
-        filepath=filepath,
-        write_mode="w",
-        on_exist=on_exist,
-        dump_json=False,
-        encoding=encoding,
-    )
-def save_as_json(
-    content: Any,
-    filepath: str | Path,
-    *,
-    encoding: str = "utf-8",
-    on_exist: Literal["overwrite", "skip", "rename"] = "overwrite",
-) -> Path | None:
-    """
-    Save JSON-serializable content to the given file path.
+    if not path.exists():
+        return path
-    :param content: Data to write as JSON.
-    :param filepath: Destination file path.
-    :param encoding: Text encoding to use (default: 'utf-8').
-    :param on_exist: How to handle existing files: 'overwrite', 'skip', or 'rename'.
-    :return: Path if writing succeeds, None otherwise.
-    """
-    return _write_file(
-        content=content,
-        filepath=filepath,
-        write_mode="w",
-        on_exist=on_exist,
-        dump_json=True,
-        encoding=encoding,
-    )
+    stem = path.stem
+    suffix = path.suffix
+    for counter in range(1, max_tries + 1):
+        candidate = path.with_name(f"{stem}_{counter}{suffix}")
+        if not candidate.exists():
+            return candidate
-def read_text_file(filepath: str | Path, encoding: str = "utf-8") -> str | None:
-    """
-    Read a UTF-8 text file.
+    # fallback: append a random/unique suffix
+    import uuid
-    :param filepath: Path to file.
-    :param encoding: Encoding to use.
-    :return: Text content or None on failure.
-    """
-    path = Path(filepath)
-    try:
-        return path.read_text(encoding=encoding)
-    except Exception as e:
-        logger.warning("[file] Failed to read %r: %s", path, e)
-        return None
+    return path.with_name(f"{stem}_{uuid.uuid4().hex}{suffix}")
-def read_json_file(filepath: str | Path, encoding: str = "utf-8") -> Any | None:
+def write_file(
+    content: str | bytes,
+    filepath: str | Path,
+    *,
+    on_exist: Literal["overwrite", "skip", "rename"] = "overwrite",
+    encoding: str = "utf-8",
+) -> Path:
     """
-    Read a JSON file and parse it into Python objects.
+    Write content to a file safely with atomic replacement.
-    :param filepath: Path to file.
-    :param encoding: Encoding to use.
-    :return: Python object or None on failure.
+    :param content: The content to write; can be text or bytes.
+    :param filepath: Destination path.
+    :param on_exist: Behavior if file exists.
+    :param encoding: Text encoding for writing.
+    :return: The final path where the content was written.
+    :raise: Any I/O error such as PermissionError or OSError
     """
     path = Path(filepath)
-    try:
-        return json.loads(path.read_text(encoding=encoding))
-    except Exception as e:
-        logger.warning("[file] Failed to read %r: %s", path, e)
-        return None
-def read_binary_file(filepath: str | Path) -> bytes | None:
-    """
-    Read a binary file and return its content as bytes.
+    path = path.with_name(sanitize_filename(path.name))
+    path.parent.mkdir(parents=True, exist_ok=True)
-    :param filepath: Path to file.
-    :return: Bytes or None on failure.
-    """
-    path = Path(filepath)
-    try:
-        return path.read_bytes()
-    except Exception as e:
-        logger.warning("[file] Failed to read %r: %s", path, e)
-        return None
+    if path.exists():
+        match on_exist:
+            case "skip":
+                return path
+            case "rename":
+                path = _unique_path(path)
+    write_mode = "wb" if isinstance(content, bytes) else "w"
+    with tempfile.NamedTemporaryFile(
+        mode=write_mode,
+        encoding=None if "b" in write_mode else encoding,
+        newline=None if "b" in write_mode else "\n",
+        delete=False,
+        dir=path.parent,
+    ) as tmp:
+        tmp.write(content)
+        tmp_path = Path(tmp.name)
+    tmp_path.replace(path)
+    return path

novel_downloader/utils/file_utils/normalize.py CHANGED Viewed

@@ -14,8 +14,6 @@ __all__ = ["normalize_txt_line_endings"]
 import logging
 from pathlib import Path
-logger = logging.getLogger(__name__)
 def normalize_txt_line_endings(folder_path: str | Path) -> None:
     """
@@ -28,7 +26,6 @@ def normalize_txt_line_endings(folder_path: str | Path) -> None:
     """
     path = Path(folder_path).resolve()
     if not path.exists() or not path.is_dir():
-        logger.warning("[file] Invalid folder: %s", path)
         return
     count_success, count_fail = 0, 0
@@ -38,13 +35,10 @@ def normalize_txt_line_endings(folder_path: str | Path) -> None:
             content = txt_file.read_text(encoding="utf-8")
             normalized = content.replace("\r\n", "\n").replace("\r", "\n")
             txt_file.write_text(normalized, encoding="utf-8", newline="\n")
-            logger.debug("[file] Normalized: %s", txt_file)
             count_success += 1
-        except (OSError, UnicodeDecodeError) as e:
-            logger.warning("[file] Failed: %s | %s", txt_file, e)
+        except (OSError, UnicodeDecodeError):
             count_fail += 1
-    logger.info("[file] Completed. Success: %s, Failed: %s", count_success, count_fail)
     return

novel_downloader/utils/file_utils/sanitize.py CHANGED Viewed

@@ -5,21 +5,13 @@ novel_downloader.utils.file_utils.sanitize
 Utility functions for cleaning and validating filenames for safe use
 on different operating systems.
-This module provides a cross-platform `sanitize_filename` function
-that replaces or removes illegal characters from filenames, trims
-lengths, and avoids reserved names on Windows systems.
 """
 __all__ = ["sanitize_filename"]
-import logging
 import os
 import re
-logger = logging.getLogger(__name__)
-# Windows 保留名称列表 (忽略大小写)
 _WIN_RESERVED_NAMES = {
     "CON",
     "PRN",
@@ -40,8 +32,8 @@ def sanitize_filename(filename: str, max_length: int | None = 255) -> str:
     This function checks the operating system environment and applies the appropriate
     filtering rules:
-      - On Windows, it replaces characters: <>:"/\\|?*
-      - On POSIX systems, it replaces the forward slash '/'
+      * On Windows, it replaces characters: <>:"/\\|?*
+      * On POSIX systems, it replaces the forward slash '/'
     :param filename: The input filename to sanitize.
     :param max_length: Optional maximum length of the output filename. Defaults to 255.
@@ -51,7 +43,7 @@ def sanitize_filename(filename: str, max_length: int | None = 255) -> str:
     name = pattern.sub("_", filename).strip(" .")
-    stem, dot, ext = name.partition(".")
+    stem, dot, ext = name.rpartition(".")
     if os.name == "nt" and stem.upper() in _WIN_RESERVED_NAMES:
         stem = f"_{stem}"
     cleaned = f"{stem}{dot}{ext}" if ext else stem
@@ -63,7 +55,4 @@ def sanitize_filename(filename: str, max_length: int | None = 255) -> str:
         else:
             cleaned = cleaned[:max_length]
-    if not cleaned:
-        cleaned = "_untitled"
-    logger.debug("[file] Sanitized filename: %r -> %r", filename, cleaned)
-    return cleaned
+    return cleaned or "_untitled"

novel_downloader/utils/fontocr/__init__.py CHANGED Viewed

@@ -3,20 +3,11 @@
 novel_downloader.utils.fontocr
 ------------------------------
-Utilities for font-based OCR, primarily used to decode custom font obfuscation
-Supports:
-- Font rendering and perceptual hash matching
-- PaddleOCR-based character recognition
-- Frequency-based scoring for ambiguous results
-- Debugging and font mapping persistence
-Exposes the selected OCR engine version via `FontOCR`.
+Lazy-loading interface for FontOCR. Provides a safe entry point
+to obtain an OCR utility instance if optional dependencies are available.
 """
-__all__ = ["FontOCR"]
-__version__ = "3.0"
+__all__ = ["get_font_ocr"]
+__version__ = "4.0"
-# from .ocr_v1 import FontOCRV1 as FontOCR
-# from .ocr_v2 import FontOCRV2 as FontOCR
-from .ocr_v3 import FontOCRV3 as FontOCR
+from .loader import get_font_ocr

novel-downloader 1.5.0__py3-none-any.whl → 2.0.1__py3-none-any.whl

novel-downloader 1.5.0__py3-none-any.whl → 2.0.1__py3-none-any.whl