PyPI - ppt2video - Versions diffs - 0.1.0__tar.gz - Mend

ppt2video 0.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12) hide show

ppt2video-0.1.0/LICENSE +21 -0
ppt2video-0.1.0/PKG-INFO +86 -0
ppt2video-0.1.0/README.md +69 -0
ppt2video-0.1.0/ppt2video/__init__.py +0 -0
ppt2video-0.1.0/ppt2video/tools.py +208 -0
ppt2video-0.1.0/ppt2video.egg-info/PKG-INFO +86 -0
ppt2video-0.1.0/ppt2video.egg-info/SOURCES.txt +10 -0
ppt2video-0.1.0/ppt2video.egg-info/dependency_links.txt +1 -0
ppt2video-0.1.0/ppt2video.egg-info/requires.txt +3 -0
ppt2video-0.1.0/ppt2video.egg-info/top_level.txt +1 -0
ppt2video-0.1.0/setup.cfg +4 -0
ppt2video-0.1.0/setup.py +26 -0

ppt2video-0.1.0/LICENSE ADDED Viewed

@@ -0,0 +1,21 @@
+MIT License
+Copyright (c) 2024 Andy Kim
+Permission is hereby granted, free of charge, to any person obtaining a copy
+of this software and associated documentation files (the "Software"), to deal
+in the Software without restriction, including without limitation the rights
+to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
+copies of the Software, and to permit persons to whom the Software is
+furnished to do so, subject to the following conditions:
+The above copyright notice and this permission notice shall be included in all
+copies or substantial portions of the Software.
+THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+SOFTWARE.

ppt2video-0.1.0/PKG-INFO ADDED Viewed

@@ -0,0 +1,86 @@
+Metadata-Version: 2.1
+Name: ppt2video
+Version: 0.1.0
+Summary: A tool that converts a PowerPoint (PPT) to a video with voice narration (reading the notes from each slide)
+Home-page: https://github.com/iburn78/ppt2video
+Author: IssueTracker
+Author-email: issuetree.tracker@gmail.com
+Classifier: Programming Language :: Python :: 3
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Operating System :: OS Independent
+Requires-Python: >=3.6
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Requires-Dist: python-pptx
+Requires-Dist: moviepy
+Requires-Dist: google-cloud-texttospeech
+# ppt2video
+## A tool that converts a PowerPoint (PPT) to a video with voice narration (reading the notes from each slide)
+This tool reads the note contents from each slide using Google TTS and converts the PPT to an MP4 video.
+### Installation
+```
+pip install ppt2video
+```
+### Usage
++ Step 1: Place your PPT file (or `.pptx`) into a specific folder (e.g., `data/ppt/your_ppt_name.pptx`).
++ Step 2: Open your PowerPoint software and save the slides as images (e.g., PNG) to a specific folder (usually, `data/ppt/your_ppt_name/`).
++ Step 3: Set up Google Cloud authentication so the tool can call the Text-to-Speech API that narrates the notes in your slides:
+    - You need to set up authentication using your Google Cloud service account key. Follow these steps:
+        * Go to the Google Cloud Console ([https://console.cloud.google.com/](https://console.cloud.google.com/)).
+        * Create a new project (or use an existing project).
+        * Enable the Text-to-Speech API for that project.
+        * Create a Service Account and download the JSON key file.
++ Step 4: Run the code
+```python
+from ppt2video.tools import *
+meta = Meta(
+    ppt_file='your_ppt_slide.pptx',  # Name of your PPT file
+    image_prefix='slide',  # The prefix for image files (varies depending on the PowerPoint language version)
+    google_application_credentials='/config/google_cloud.json'  # Location and filename of your Google Cloud service account key
+)
+# Run the conversion
+ppt_to_video(meta)
+```
+### Additional settings
+You may adjust additional settings as follows:
+```python
+    # PPT settings
+    ppt_file: str
+    ppt_path: str = 'data/ppt/'  # Directory for the PPT and image files
+    image_prefix: str = 'slide'  # The prefix for image file names (used when saving slides as images)
+    image_extension: str = 'PNG'  # The image file format (default is PNG)
+    ppt_extension: str = '.pptx'  # The PowerPoint file extension
+    # Google TTS settings
+    voice_enabled: bool = True  # Enable or disable voice narration
+    google_application_credentials: str = None  # Location of the Google API key (downloaded as JSON)
+    voice_path: str = 'data/voice/'  # Directory to save the generated audio files
+    max_size: int = 4500  # Maximum size (in bytes) of the text sent in a single Google TTS API request (kept below the API's 5000-byte limit)
+    slide_break: float = 2  # Time delay (in seconds) between slides
+    line_break: float = 0.7  # Time delay (in seconds) when there's a line break in the text (e.g., '\n')
+    lang: str = 'E'  # Language setting: 'E' for English, 'K' for Korean
+    wave: bool = False  # Whether to use Wavenet voices (True or False)
+    # MoviePy video settings
+    fps: int = 24  # Frames per second for the video
+```

ppt2video-0.1.0/README.md ADDED Viewed

@@ -0,0 +1,69 @@
+# ppt2video
+## A tool that converts a PowerPoint (PPT) to a video with voice narration (reading the notes from each slide)
+This tool reads the note contents from each slide using Google TTS and converts the PPT to an MP4 video.
+### Installation
+```
+pip install ppt2video
+```
+### Usage
++ Step 1: Place your PPT file (or `.pptx`) into a specific folder (e.g., `data/ppt/your_ppt_name.pptx`).
++ Step 2: Open your PowerPoint software and save the slides as images (e.g., PNG) to a specific folder (usually, `data/ppt/your_ppt_name/`).
++ Step 3: Set up Google Cloud authentication so the tool can call the Text-to-Speech API that narrates the notes in your slides:
+    - You need to set up authentication using your Google Cloud service account key. Follow these steps:
+        * Go to the Google Cloud Console ([https://console.cloud.google.com/](https://console.cloud.google.com/)).
+        * Create a new project (or use an existing project).
+        * Enable the Text-to-Speech API for that project.
+        * Create a Service Account and download the JSON key file.
++ Step 4: Run the code
+```python
+from ppt2video.tools import *
+meta = Meta(
+    ppt_file='your_ppt_slide.pptx',  # Name of your PPT file
+    image_prefix='slide',  # The prefix for image files (varies depending on the PowerPoint language version)
+    google_application_credentials='/config/google_cloud.json'  # Location and filename of your Google Cloud service account key
+)
+# Run the conversion
+ppt_to_video(meta)
+```
+### Additional settings
+You may adjust additional settings as follows:
+```python
+    # PPT settings
+    ppt_file: str
+    ppt_path: str = 'data/ppt/'  # Directory for the PPT and image files
+    image_prefix: str = 'slide'  # The prefix for image file names (used when saving slides as images)
+    image_extension: str = 'PNG'  # The image file format (default is PNG)
+    ppt_extension: str = '.pptx'  # The PowerPoint file extension
+    # Google TTS settings
+    voice_enabled: bool = True  # Enable or disable voice narration
+    google_application_credentials: str = None  # Location of the Google API key (downloaded as JSON)
+    voice_path: str = 'data/voice/'  # Directory to save the generated audio files
+    max_size: int = 4500  # Maximum size (in bytes) of the text sent in a single Google TTS API request (kept below the API's 5000-byte limit)
+    slide_break: float = 2  # Time delay (in seconds) between slides
+    line_break: float = 0.7  # Time delay (in seconds) when there's a line break in the text (e.g., '\n')
+    lang: str = 'E'  # Language setting: 'E' for English, 'K' for Korean
+    wave: bool = False  # Whether to use Wavenet voices (True or False)
+    # MoviePy video settings
+    fps: int = 24  # Frames per second for the video
+```

ppt2video-0.1.0/ppt2video/__init__.py ADDED Viewed

File without changes

ppt2video-0.1.0/ppt2video/tools.py ADDED Viewed

@@ -0,0 +1,208 @@
+from dataclasses import dataclass
+from pptx import Presentation
+from google.cloud import texttospeech_v1beta1 as tts
+from moviepy.editor import ImageClip, concatenate_videoclips, AudioFileClip
+import os
+@dataclass
+class Meta:
+    """Settings for converting one PowerPoint file into an MP4 video.
+
+    Only ``ppt_file`` is required; every other field has a default.
+    """
+    # PPT settings
+    ppt_file: str  # File name of the presentation, looked up inside ppt_path
+    ppt_path: str = 'data/ppt/'  # Directory for the PPT and image files
+    image_prefix: str = 'slide'  # The prefix for image file names (used when saving slides as images)
+    image_extension: str = 'PNG'  # The image file extension, without the leading dot (default is PNG)
+    ppt_extension: str = '.pptx'  # The PowerPoint file extension, with the leading dot; stripped from ppt_file to derive output names
+    # Google TTS settings
+    voice_enabled: bool = True  # Enable or disable voice narration
+    google_application_credentials: str = None  # Location of the Google API key (downloaded as JSON); must be set when voice_enabled is True
+    voice_path: str = 'data/voice/'  # Directory to save the generated text and audio files
+    max_size: int = 4500  # Maximum size, in UTF-8 bytes, of one SSML text file (presumably kept below Google TTS's 5000-byte request limit -- confirm)
+    slide_break: float = 2  # Pause (in seconds) between slides; also the per-slide duration when voice is disabled
+    line_break: float = 0.7  # Pause (in seconds) inserted for each line break in the notes (e.g., '\n')
+    lang: str = 'E'  # Language setting: 'K' selects Korean (ko-KR); any other value selects English (en-US)
+    wave: bool = False  # Whether to request a named WaveNet voice (True or False)
+    # MoviePy video settings
+    fps: int = 24  # Frames per second for the video
+def ppt_to_video(meta: Meta):
+    """Convert the presentation described by ``meta`` into an MP4 video.
+
+    With ``meta.voice_enabled`` set, the slide notes are written out as SSML,
+    synthesized by ``ppt_tts`` and combined with the slide images by
+    ``video_from_ppt_and_voice``. Otherwise ``video_from_ppt`` builds a video
+    without narration.
+
+    Returns None in every case. When voice is enabled but
+    ``meta.google_application_credentials`` is None, a hint is printed and
+    nothing is generated.
+    """
+    # exist_ok avoids the check-then-create race of os.path.exists + makedirs.
+    os.makedirs(meta.ppt_path, exist_ok=True)
+    if not meta.voice_enabled:
+        num_slides = ppt_to_text(meta)
+        # Forward the configured frame rate so Meta.fps actually takes effect.
+        video_from_ppt(meta, num_slides, fps=meta.fps)
+        return None
+    if meta.google_application_credentials is None:
+        print('*****')
+        print('Need to set up Google Cloud Authentication')
+        print('Please refer to the README.md')
+        print('*****')
+        return None
+    os.makedirs(meta.voice_path, exist_ok=True)
+    txt_file_number = ppt_to_text(meta)
+    timepoints = ppt_tts(meta, txt_file_number)
+    # Forward the configured frame rate so Meta.fps actually takes effect.
+    video_from_ppt_and_voice(meta, timepoints, fps=meta.fps)
+    return None
+def ppt_to_text(meta: Meta):
+    """Write the speaker notes of every slide to SSML text files.
+
+    When ``meta.voice_enabled`` is False nothing is written and the number of
+    slides is returned instead.
+
+    Otherwise the notes are wrapped in ``<speak>`` documents named
+    ``<voice_path>/<ppt name>_<n>.txt``. Each slide contributes a
+    ``<mark name="slide<index>"/>`` tag (0-based index), its notes with a
+    ``<break>`` for every line break, and a trailing ``<break>`` of
+    ``meta.slide_break`` seconds. A new file is started whenever adding the
+    next slide would push the current file past ``meta.max_size`` UTF-8 bytes.
+
+    Returns:
+        The slide count (voice disabled) or the number of text files written.
+    """
+    # Function-scope import: only this function needs XML escaping.
+    from xml.sax.saxutils import escape
+    ppt = Presentation(os.path.join(meta.ppt_path, meta.ppt_file))
+    if not meta.voice_enabled:
+        return len(ppt.slides)
+    base_name = os.path.join(meta.voice_path, meta.ppt_file.replace(meta.ppt_extension, ''))
+    def _write_to_file(content, current_file_number, current_size):
+        """Write ``content`` to text file ``current_file_number``; return the new byte count."""
+        txt_file = f"{base_name}_{current_file_number}.txt"
+        # A size of 0 means nothing has been written to this file yet, so
+        # truncate it; otherwise append to what is already there.
+        mode = 'w' if current_size == 0 else 'a'
+        with open(txt_file, mode, encoding='utf-8') as notes_file:
+            notes_file.write(content)
+        return current_size + len(content.encode('utf-8'))
+    # Same bytes as before, spelled out so the trailing indentation is visible.
+    header = '<speak>\n    '
+    footer = '</speak>\n    '
+    file_number = 0
+    current_size = _write_to_file(header, file_number, 0)
+    for slide_number, slide in enumerate(ppt.slides):
+        mark = f'.<mark name="slide{slide_number}"/>.\n'
+        # NOTE(review): python-pptx documents notes_slide as creating a notes
+        # slide on first access, so the else branch may never run -- confirm.
+        if slide.notes_slide and slide.notes_slide.notes_text_frame:
+            # Escape &, < and > so free-form notes cannot break the SSML document.
+            notes = escape(slide.notes_slide.notes_text_frame.text)
+            slide_content = (
+                mark
+                + f'<break time="{round(meta.slide_break/2,1)}s"/>\n'
+                + notes.replace('\n', f'<break time="{meta.line_break}s"/>\n')
+                + f'<break time="{meta.slide_break}s"/>\n'
+            )
+        else:
+            slide_content = mark + f'<break time="{meta.slide_break}s"/>\n'
+        if current_size + len(slide_content.encode('utf-8')) > meta.max_size:
+            # Close the current document and start the next one with this slide.
+            _write_to_file(footer, file_number, current_size)
+            file_number += 1
+            current_size = 0
+            slide_content = header + slide_content
+        current_size = _write_to_file(slide_content, file_number, current_size)
+    _write_to_file(footer, file_number, current_size)
+    txt_file_number = file_number + 1
+    return txt_file_number
+def ppt_tts(meta: Meta, txt_file_number: int):
+    """Synthesize the SSML text files into MP3 audio with Google Text-to-Speech.
+
+    Reads ``<voice_path>/<ppt name>_<i>.txt`` for every ``i`` in
+    ``range(txt_file_number)`` and writes ``<voice_path>/<ppt name>_<i>.mp3``.
+    Side effect: sets the ``GOOGLE_APPLICATION_CREDENTIALS`` environment
+    variable to ``meta.google_application_credentials``.
+
+    Returns:
+        A dict mapping each MP3 path to a list of ``[slide_index, seconds]``
+        pairs built from the response timepoints (an empty list when the
+        response carries none).
+    """
+    os.environ["GOOGLE_APPLICATION_CREDENTIALS"] = meta.google_application_credentials
+    client = tts.TextToSpeechClient()
+    language_code = 'ko-KR' if meta.lang == 'K' else 'en-US'
+    tag = 'D' if meta.lang == 'K' else 'B'
+    voice_kwargs = {'language_code': language_code, 'ssml_gender': tts.SsmlVoiceGender.MALE}
+    if meta.wave:
+        # WaveNet voice (original author's note: smaller monthly quota than the basic voice -- verify).
+        voice_kwargs['name'] = language_code+'-Wavenet-'+tag
+    voice = tts.VoiceSelectionParams(**voice_kwargs)
+    audio_config = tts.AudioConfig(audio_encoding=tts.AudioEncoding.MP3)
+    # Strip the extension first and then append the suffix, exactly as
+    # ppt_to_text names its files, so both agree even when ppt_file does not
+    # contain ppt_extension.
+    base_name = os.path.join(meta.voice_path, meta.ppt_file.replace(meta.ppt_extension, ''))
+    timepoint_dict = {}
+    for i in range(txt_file_number):
+        txt_file = f'{base_name}_{i}.txt'
+        voice_file = f'{base_name}_{i}.mp3'
+        with open(txt_file, 'r', encoding='utf-8') as file:
+            text_content = file.read()
+        request = tts.SynthesizeSpeechRequest(
+            input=tts.SynthesisInput(ssml=text_content),
+            voice=voice,
+            audio_config=audio_config,
+            enable_time_pointing=[tts.SynthesizeSpeechRequest.TimepointType.SSML_MARK]
+        )
+        response = client.synthesize_speech(request=request)
+        with open(voice_file, "wb") as out:
+            out.write(response.audio_content)
+            print(voice_file + ' done')
+        timepoint_list = []
+        if response.timepoints:
+            for time_point in response.timepoints:
+                print(f'Mark name: {time_point.mark_name}, Time: {time_point.time_seconds} seconds')
+                # Mark names are written as "slide<index>"; drop the 5-character prefix.
+                timepoint_list.append([int(time_point.mark_name[5:]), time_point.time_seconds])
+        else:
+            print('No timepoints found.')
+        timepoint_dict[voice_file] = timepoint_list
+    return timepoint_dict
+def video_from_ppt_and_voice(meta: Meta, timepoints, fps=24):
+    """Build the narrated MP4 from slide images and synthesized audio files.
+
+    Args:
+        meta: Conversion settings; slide images are read from
+            ``<ppt_path>/<ppt name>/<image_prefix><index>.<image_extension>``.
+        timepoints: Dict mapping each audio file path to a list of
+            ``[slide_index, start_seconds]`` pairs, in playback order.
+        fps: Frame rate assigned to the final video.
+
+    The video is written to ``<ppt_path>/<ppt name>.mp4``.
+    """
+    images_path = os.path.join(meta.ppt_path, meta.ppt_file.replace(meta.ppt_extension, ''))
+    output_file = os.path.join(meta.ppt_path, meta.ppt_file.replace(meta.ppt_extension, '.mp4'))
+    video_with_audios = []
+    for audio_file, slide_times in timepoints.items():
+        audio_clip = AudioFileClip(audio_file)
+        video_clips = []
+        for index, (slide_number, start_time) in enumerate(slide_times):
+            # A slide stays on screen until the next mark, or until the audio
+            # ends for the last slide of this audio file.
+            if index < len(slide_times) - 1:
+                end_time = slide_times[index + 1][1]
+            else:
+                end_time = audio_clip.duration
+            # Honor the configured extension, as video_from_ppt does, instead
+            # of a hard-coded 'PNG'.
+            # NOTE(review): slide_number is 0-based here; confirm that the
+            # exported image files are numbered from 0 as well.
+            slide_image_filename = f'{meta.image_prefix}{slide_number}.{meta.image_extension}'
+            slide_image_path = os.path.join(images_path, slide_image_filename)
+            slide_clip = ImageClip(slide_image_path).set_duration(end_time - start_time).set_start(start_time)
+            video_clips.append(slide_clip)
+        # Concatenate the slide clips for this audio file and attach its audio
+        video_with_audio = concatenate_videoclips(video_clips)
+        video_with_audio = video_with_audio.set_audio(audio_clip).volumex(2)
+        video_with_audios.append(video_with_audio)
+    # Concatenate all per-audio segments into one final video
+    final_video = concatenate_videoclips(video_with_audios)
+    final_video.fps = fps
+    final_video.write_videofile(
+        output_file,
+        codec="libx264",
+    )
+    print('video with audio generated and saved')
+def video_from_ppt(meta: Meta, num_slides: int, fps=24):
+    """Build an MP4 without narration from the slide images.
+
+    Slide ``i`` (for ``i`` in ``range(num_slides)``) is read from
+    ``<ppt_path>/<ppt name>/<image_prefix><i>.<image_extension>`` and given a
+    duration of ``meta.slide_break`` seconds. The result is written to
+    ``<ppt_path>/<ppt name>.mp4`` with ``fps`` as its frame rate.
+    """
+    images_dir = os.path.join(meta.ppt_path, meta.ppt_file.replace(meta.ppt_extension,''))
+    target_file = os.path.join(meta.ppt_path, meta.ppt_file.replace(meta.ppt_extension, '.mp4'))
+    def _clip_for(index):
+        """Return the timed image clip for the slide at ``index``."""
+        begins_at = index*meta.slide_break
+        ends_at = begins_at+meta.slide_break
+        frame_name = f'{meta.image_prefix}{index}.{meta.image_extension}'
+        frame_path = os.path.join(images_dir, frame_name)
+        return ImageClip(frame_path).set_duration(ends_at - begins_at).set_start(begins_at)
+    movie = concatenate_videoclips([_clip_for(index) for index in range(num_slides)])
+    # The frame rate must be set on the clip before it is rendered
+    movie.fps = fps
+    movie.write_videofile(
+        target_file,
+        codec="libx264",
+    )
+    print('video generated and saved')

ppt2video-0.1.0/ppt2video.egg-info/PKG-INFO ADDED Viewed

@@ -0,0 +1,86 @@
+Metadata-Version: 2.1
+Name: ppt2video
+Version: 0.1.0
+Summary: A tool that converts a PowerPoint (PPT) to a video with voice narration (reading the notes from each slide)
+Home-page: https://github.com/iburn78/ppt2video
+Author: IssueTracker
+Author-email: issuetree.tracker@gmail.com
+Classifier: Programming Language :: Python :: 3
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Operating System :: OS Independent
+Requires-Python: >=3.6
+Description-Content-Type: text/markdown
+License-File: LICENSE
+Requires-Dist: python-pptx
+Requires-Dist: moviepy
+Requires-Dist: google-cloud-texttospeech
+# ppt2video
+## A tool that converts a PowerPoint (PPT) to a video with voice narration (reading the notes from each slide)
+This tool reads the note contents from each slide using Google TTS and converts the PPT to an MP4 video.
+### Installation
+```
+pip install ppt2video
+```
+### Usage
++ Step 1: Place your PPT file (or `.pptx`) into a specific folder (e.g., `data/ppt/your_ppt_name.pptx`).
++ Step 2: Open your PowerPoint software and save the slides as images (e.g., PNG) to a specific folder (usually, `data/ppt/your_ppt_name/`).
++ Step 3: Set up Google Cloud authentication so the tool can call the Text-to-Speech API that narrates the notes in your slides:
+    - You need to set up authentication using your Google Cloud service account key. Follow these steps:
+        * Go to the Google Cloud Console ([https://console.cloud.google.com/](https://console.cloud.google.com/)).
+        * Create a new project (or use an existing project).
+        * Enable the Text-to-Speech API for that project.
+        * Create a Service Account and download the JSON key file.
++ Step 4: Run the code
+```python
+from ppt2video.tools import *
+meta = Meta(
+    ppt_file='your_ppt_slide.pptx',  # Name of your PPT file
+    image_prefix='slide',  # The prefix for image files (varies depending on the PowerPoint language version)
+    google_application_credentials='/config/google_cloud.json'  # Location and filename of your Google Cloud service account key
+)
+# Run the conversion
+ppt_to_video(meta)
+```
+### Additional settings
+You may adjust additional settings as follows:
+```python
+    # PPT settings
+    ppt_file: str
+    ppt_path: str = 'data/ppt/'  # Directory for the PPT and image files
+    image_prefix: str = 'slide'  # The prefix for image file names (used when saving slides as images)
+    image_extension: str = 'PNG'  # The image file format (default is PNG)
+    ppt_extension: str = '.pptx'  # The PowerPoint file extension
+    # Google TTS settings
+    voice_enabled: bool = True  # Enable or disable voice narration
+    google_application_credentials: str = None  # Location of the Google API key (downloaded as JSON)
+    voice_path: str = 'data/voice/'  # Directory to save the generated audio files
+    max_size: int = 4500  # Maximum size (in bytes) of the text sent in a single Google TTS API request (kept below the API's 5000-byte limit)
+    slide_break: float = 2  # Time delay (in seconds) between slides
+    line_break: float = 0.7  # Time delay (in seconds) when there's a line break in the text (e.g., '\n')
+    lang: str = 'E'  # Language setting: 'E' for English, 'K' for Korean
+    wave: bool = False  # Whether to use Wavenet voices (True or False)
+    # MoviePy video settings
+    fps: int = 24  # Frames per second for the video
+```

ppt2video-0.1.0/ppt2video.egg-info/SOURCES.txt ADDED Viewed

@@ -0,0 +1,10 @@
+LICENSE
+README.md
+setup.py
+ppt2video/__init__.py
+ppt2video/tools.py
+ppt2video.egg-info/PKG-INFO
+ppt2video.egg-info/SOURCES.txt
+ppt2video.egg-info/dependency_links.txt
+ppt2video.egg-info/requires.txt
+ppt2video.egg-info/top_level.txt

ppt2video-0.1.0/ppt2video.egg-info/dependency_links.txt ADDED Viewed

	@@ -0,0 +1 @@
1	+

ppt2video-0.1.0/ppt2video.egg-info/requires.txt ADDED Viewed

@@ -0,0 +1,3 @@
+python-pptx
+moviepy
+google-cloud-texttospeech

ppt2video-0.1.0/ppt2video.egg-info/top_level.txt ADDED Viewed

	@@ -0,0 +1 @@
1	+ ppt2video

ppt2video-0.1.0/setup.cfg ADDED Viewed

@@ -0,0 +1,4 @@
+[egg_info]
+tag_build =
+tag_date = 0

ppt2video-0.1.0/setup.py ADDED Viewed

@@ -0,0 +1,26 @@
+from setuptools import setup, find_packages
+# Read the long description explicitly as UTF-8 and close the file afterwards;
+# a bare open().read() depends on the platform's default encoding and leaves
+# the handle open.
+with open('README.md', encoding='utf-8') as readme_file:
+    long_description = readme_file.read()
+setup(
+    name='ppt2video',  # Name of the package
+    version='0.1.0',  # Version number
+    packages=find_packages(),  # Automatically finds all packages in the directory
+    install_requires=[         # List dependencies here
+        'python-pptx',
+        'moviepy',
+        'google-cloud-texttospeech'
+    ],
+    entry_points={             # If your package has entry points (CLI tools)
+    },
+    author='IssueTracker',
+    author_email='issuetree.tracker@gmail.com',
+    description='A tool that converts a PowerPoint (PPT) to a video with voice narration (reading the notes from each slide)',
+    long_description=long_description,  # Detailed description, taken from README.md
+    long_description_content_type='text/markdown',  # Format of README
+    url='https://github.com/iburn78/ppt2video',  # URL for your package (GitHub link, etc.)
+    classifiers=[              # Optional metadata classifiers
+        'Programming Language :: Python :: 3',
+        'License :: OSI Approved :: MIT License',
+        'Operating System :: OS Independent',
+    ],
+    python_requires='>=3.6',   # Python version requirement
+)