PyPI - pdf2imgCrop - Versions diffs - 0.1.0__tar.gz - Mend

pdf2imgCrop 0.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (11) hide show

pdf2imgcrop-0.1.0/.github/workflows/pypi.yml +27 -0
pdf2imgcrop-0.1.0/.gitignore +4 -0
pdf2imgcrop-0.1.0/LICENSE.txt +7 -0
pdf2imgcrop-0.1.0/PKG-INFO +10 -0
pdf2imgcrop-0.1.0/README.md +58 -0
pdf2imgcrop-0.1.0/pdf2imgCrop/__init__.py +6 -0
pdf2imgcrop-0.1.0/pdf2imgCrop/__main__.py +41 -0
pdf2imgcrop-0.1.0/pdf2imgCrop/core.py +56 -0
pdf2imgcrop-0.1.0/pyproject.toml +23 -0
pdf2imgcrop-0.1.0/requirements.txt +3 -0
pdf2imgcrop-0.1.0/setup.py +34 -0

pdf2imgcrop-0.1.0/.github/workflows/pypi.yml ADDED Viewed

@@ -0,0 +1,27 @@
+name: Python Package Release
+on:
+  release:
+    types: [created]
+  workflow_dispatch:
+jobs:
+  deploy:
+    runs-on: ubuntu-latest
+    steps:
+    - uses: actions/checkout@v3
+    - name: Set up Python
+      uses: actions/setup-python@v4
+      with:
+        python-version: '3.x'
+    - name: Install dependencies
+      run: |
+        python -m pip install --upgrade pip
+        pip install build twine
+    - name: Build and publish
+      env:
+        TWINE_USERNAME: ${{ secrets.PYPI_USERNAME }}
+        TWINE_PASSWORD: ${{ secrets.PYPI_PASSWORD }}
+      run: |
+        python -m build
+        twine upload dist/*

pdf2imgcrop-0.1.0/.gitignore ADDED Viewed

@@ -0,0 +1,4 @@
+.vscode/
+*.pyc
+__pycache__/
+.venv/

pdf2imgcrop-0.1.0/LICENSE.txt ADDED Viewed

@@ -0,0 +1,7 @@
+Copyright © 2025 Muxkin
+Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the “Software”), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED “AS IS”, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.

pdf2imgcrop-0.1.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,10 @@
+Metadata-Version: 2.4
+Name: pdf2imgCrop
+Version: 0.1.0
+Summary: 将PDF文件转换为图片并自动裁剪空白边距
+Author-email: Your Name <your.email@example.com>
+License-File: LICENSE.txt
+Requires-Python: >=3.8
+Requires-Dist: pillow>=10.0.0
+Requires-Dist: pymupdf>=1.23.0
+Requires-Dist: tqdm>=4.65.0

pdf2imgcrop-0.1.0/README.md ADDED Viewed

@@ -0,0 +1,58 @@
+# pdf2imgCrop
+一个用于将PDF文件转换为图片并自动裁剪空白边距的Python工具。
+> 如果想从pptx转换为高清图片，可以先试用Adobe Acrobat的ppt插件。注意需要在插件的**首选项->高级设置->图像**中将分辨率调高到300dpi以上。（我自己用的dpi是2400）
+## 功能特点
+- 将PDF文件转换为JPG或PNG格式的图片
+- 自动裁剪图片周围的空白边距
+- 支持自定义DPI设置
+- 命令行界面，使用简单
+## 安装
+```bash
+pip install pdf2imgCrop
+```
+## 使用方法
+### 命令行使用
+基本用法：
+```bash
+pdf2imgcrop your_file.pdf
+```
+指定DPI和输出格式：
+```bash
+pdf2imgcrop your_file.pdf -d 600 -f png
+```
+查看帮助：
+```bash
+pdf2imgcrop --help
+```
+### 参数说明
+- `file`: PDF文件路径（必需）
+- `-d`, `--dpi`: 输出图片的DPI（默认：300）
+- `-f`, `--format`: 输出图片格式，可选 jpg 或 png（默认：jpg）
+## 代码示例
+```python
+from pdf2imgCrop.core import convert_pdf
+# 基本用法
+convert_pdf("your_file.pdf")
+# 自定义DPI和格式
+convert_pdf("your_file.pdf", dpi=600, file_format="png")
+```
+## 输出
+转换后的图片将保存在与输入PDF文件同名的目录中，后缀为"output"。例如，如果输入文件是"document.pdf"，输出目录将是"documentoutput"。

pdf2imgcrop-0.1.0/pdf2imgCrop/__init__.py ADDED Viewed

@@ -0,0 +1,6 @@
+"""
+PDF to Image Converter with Auto-Cropping
+将PDF文件转换为图片，并自动裁剪空白边距
+"""
+__version__ = "0.1.0"

pdf2imgcrop-0.1.0/pdf2imgCrop/__main__.py ADDED Viewed

@@ -0,0 +1,41 @@
+import argparse
+from .core import convert_pdf
+def main():
+    parser = argparse.ArgumentParser(
+        description="将PDF文件转换为图片并自动裁剪空白边距",
+        formatter_class=argparse.ArgumentDefaultsHelpFormatter
+    )
+    parser.add_argument(
+        "file",
+        help="PDF文件路径,(Path to the PDF file)",
+    )
+    parser.add_argument(
+        "-d", "--dpi",
+        type=int,
+        default=300,
+        help="输出图片的DPI, 默认为 300, (DPI for output images, default is 300)"
+    )
+    parser.add_argument(
+        "-f", "--format",
+        choices=["jpg", "png"],
+        default="jpg",
+        help="输出图片格式, 默认为 'jpg', (Format of output images, default is 'jpg')",
+    )
+    args = parser.parse_args()
+    try:
+        convert_pdf(args.file, args.dpi, args.format)
+        print(f"\n转换完成！输出目录: {args.file}output")
+    except Exception as e:
+        print(f"错误: {str(e)}")
+        return 1
+    return 0
+if __name__ == "__main__":
+    exit(main())

pdf2imgcrop-0.1.0/pdf2imgCrop/core.py ADDED Viewed

@@ -0,0 +1,56 @@
+import fitz
+from PIL import Image, ImageOps
+import os
+from tqdm import tqdm
+from fitz import Page
+def convert_pdf(file: str, dpi: int = 300, file_format: str = "jpg") -> None:
+    """
+    将PDF文件转换为图片并自动裁剪空白边距
+    Args:
+        file (str): PDF文件路径
+        dpi (int, optional): 输出图片的DPI. 默认为 300.
+        file_format (str, optional): 输出图片格式 ('jpg' 或 'png'). 默认为 'jpg'.
+    """
+    doc = fitz.open(file)
+    for pg in tqdm(doc, desc="正在转换页面", unit="页"):
+        # 获取页面的宽高
+        pg_width = pg.rect.width / 72  # in inch
+        pg_height = pg.rect.height / 72  # in inch
+        # 计算对应dpi对应的像素
+        pix_dpi_width = int(pg_width * dpi)
+        pix_dpi_height = int(pg_height * dpi)
+        zoom = 16
+        mat = fitz.Matrix(zoom, zoom).prerotate(0)
+        pix = pg.get_pixmap(matrix=mat, alpha=False)
+        # 准备输出目录
+        filename, _ = os.path.splitext(file)
+        output_dir = filename + "output"
+        if not os.path.exists(output_dir):
+            os.mkdir(output_dir)
+        # 裁剪空白区域
+        img = Image.frombytes("RGB", [pix.width, pix.height], pix.samples)
+        # 将图片大小转为目标DPI大小
+        img = img.resize((pix_dpi_width, pix_dpi_height), Image.LANCZOS)
+        img_inverse = ImageOps.invert(img)
+        bbox = img_inverse.getbbox()
+        cropped_img = img.crop(bbox)
+        # 保存处理后的图片
+        output_path = os.path.join(output_dir, f"{pg.number + 1}.{file_format}")
+        if file_format.lower() == "jpg":
+            cropped_img.save(
+                output_path,
+                quality=95,
+                dpi=(dpi, dpi),
+            )
+        else:
+            cropped_img.save(
+                output_path,
+                dpi=(dpi, dpi),
+            )
+    doc.close()

pdf2imgcrop-0.1.0/pyproject.toml ADDED Viewed

@@ -0,0 +1,23 @@
+[project]
+name = "pdf2imgCrop"
+version = "0.1.0"
+description = "将PDF文件转换为图片并自动裁剪空白边距"
+authors = [
+    {name = "Your Name", email = "your.email@example.com"},
+]
+dependencies = [
+    "PyMuPDF>=1.23.0",
+    "Pillow>=10.0.0",
+    "tqdm>=4.65.0",
+]
+requires-python = ">=3.8"
+[project.scripts]
+pdf2imgcrop = "pdf2imgCrop.__main__:main"
+[build-system]
+requires = ["hatchling"]
+build-backend = "hatchling.build"
+[tool.hatch.build.targets.wheel]
+packages = ["pdf2imgCrop"]

pdf2imgcrop-0.1.0/requirements.txt ADDED Viewed

@@ -0,0 +1,3 @@
+PyMuPDF>=1.23.0
+Pillow>=10.0.0
+tqdm>=4.65.0

pdf2imgcrop-0.1.0/setup.py ADDED Viewed

@@ -0,0 +1,34 @@
+from setuptools import setup, find_packages
+setup(
+    name="pdf2imgCrop",
+    version="0.1.0",
+    packages=find_packages(),
+    url="https://github.com/muxkin/pdf2imgCrop",
+    project_urls={
+        "Bug Tracker": "https://github.com/muxkin/pdf2imgCrop/issues",
+        "Source Code": "https://github.com/muxkin/pdf2imgCrop",
+    },
+    install_requires=[
+        "PyMuPDF",
+        "Pillow",
+        "tqdm",
+    ],
+    entry_points={
+        "console_scripts": [
+            "pdf2imgcrop=pdf2imgCrop.__main__:main",
+        ],
+    },
+    author="Muxkin",
+    description="将PDF文件转换为图片并自动裁剪空白边距",
+    long_description=open("README.md").read(),
+    long_description_content_type="text/markdown",
+    keywords="pdf, image, convert, crop",
+    classifiers=[
+        "Development Status :: 3 - Alpha",
+        "Intended Audience :: End Users/Desktop",
+        "Programming Language :: Python :: 3",
+        "License :: OSI Approved :: MIT License",
+    ],
+    python_requires=">=3.6",
+)