yta-video-opengl 0.0.11__py3-none-any.whl → 0.0.13__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
```diff
@@ -1,11 +1,21 @@
+"""
+When we are reading from a source, the reader
+has its own time base and properties. When we
+are writing, the writer has a different time
+base and properties. We need to adjust our
+writer to be able to write, because the videos
+we read can all be different, while the video
+we are writing is defined by us. The 'time_base'
+is an important property: if it is wrong, ffmpeg
+will go crazy and deny the packets (which means
+no video gets written).
+"""
 from yta_video_opengl.complete.track import Track
 from yta_video_opengl.video import Video
+from yta_video_opengl.t import get_ts, fps_to_time_base, T
 from yta_validation.parameter import ParameterValidator
+from quicktions import Fraction
 from typing import Union
-from fractions import Fraction
-
-import numpy as np
-import av
 
 
 class Timeline:
```
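The new module docstring is the heart of this release: in ffmpeg (and PyAV, which this package drives), a frame's `pts` is counted in ticks of its stream's `time_base`, so a frame decoded from an arbitrary source must be re-stamped against the writer's time base before muxing, or the muxer rejects the packets. A minimal sketch of that re-stamping idea, assuming PyAV; the helper name `restamp` is hypothetical, not part of the package:

```python
from quicktions import Fraction  # drop-in, faster fractions.Fraction

import av

# Hypothetical helper illustrating the docstring: a decoded frame is only
# valid for the output stream once its pts is expressed in ticks of the
# writer's time base.
def restamp(frame: av.VideoFrame, t: Fraction, out_time_base: Fraction) -> av.VideoFrame:
    frame.time_base = out_time_base
    # 't' seconds divided by the tick size gives the tick count (pts)
    frame.pts = int(t / out_time_base)

    return frame
```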
```diff
@@ -18,38 +28,63 @@ class Timeline:
     @property
     def end(
         self
-    ) -> float:
+    ) -> Fraction:
         """
         The end of the last video of the track
         that lasts longer. This is the last time
         moment that has to be rendered.
         """
-        return max(track.end for track in self.tracks)
+        return max(
+            track.end
+            for track in self.tracks
+        )
 
     def __init__(
         self,
-        size: tuple[int, int] = (1920, 1080),
-        fps: float = 60.0
+        size: tuple[int, int] = (1_920, 1_080),
+        fps: Union[int, float, Fraction] = 60.0,
+        audio_fps: Union[int, Fraction] = 44_100, # 48_000 for aac
+        # TODO: I don't like this name
+        # TODO: Where does this come from (?)
+        audio_samples_per_frame: int = 1024
     ):
         # TODO: By now we are using just two video
         # tracks to test the composition
         # TODO: We need to be careful with the
         # priority, by now it's defined by its
         # position in the array
-        self.tracks: list[Track] = [Track(), Track()]
+        self.tracks: list[Track] = [
+            Track(
+                size = size,
+                fps = fps,
+                audio_fps = audio_fps,
+                # TODO: I need more info about the audio
+                # I think
+                audio_samples_per_frame = audio_samples_per_frame
+            ),
+            Track(
+                size = size,
+                fps = fps,
+                audio_fps = audio_fps,
+                # TODO: I need more info about the audio
+                # I think
+                audio_samples_per_frame = audio_samples_per_frame
+            )
+        ]
         """
         All the video tracks we are handling.
         """
-        # TODO: Handle size and fps
+        # TODO: Handle the other properties
         self.size = size
         self.fps = fps
+        self.audio_fps = audio_fps
 
     # TODO: Create 'add_track' method, but by now
     # we are handling only one
     def add_video(
         self,
         video: Video,
-        t: float,
+        t: Union[int, float, Fraction],
         # TODO: This is for testing, it has to
         # disappear
         do_use_second_track: bool = False
```
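Note the swapped import: `quicktions` is a Cython drop-in replacement for the standard library's `fractions.Fraction`, and `fps` may now itself be a `Fraction`. Exact rationals keep the pts math lossless for rates like NTSC 30000/1001, which floats cannot represent. `fps_to_time_base` comes from `yta_video_opengl.t` and its body is not part of this diff; presumably it does something like this hypothetical sketch:

```python
from quicktions import Fraction

# Hypothetical sketch of 'fps_to_time_base'; the real implementation lives
# in 'yta_video_opengl.t' and may differ.
def fps_to_time_base(fps) -> Fraction:
    # One tick per frame: the time base is the inverse of the frame rate.
    # Fraction(30000, 1001) -> Fraction(1001, 30000), exactly.
    return 1 / Fraction(fps)
```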
```diff
@@ -61,19 +96,23 @@ class Timeline:
         TODO: The 'do_use_second_track' parameter
         is temporary.
         """
+        # TODO: This is temporary logic by now
+        # just to be able to test mixing frames
+        # from 2 different tracks at the same
+        # time
         index = 1 * do_use_second_track
 
         self.tracks[index].add_video(video, t)
 
         return self
-
+
     # TODO: This method is not for the Track but
     # for the timeline, as one track can only
     # have consecutive elements
     def get_frame_at(
         self,
-        t: float
-    ) -> Union['VideoFrame', None]:
+        t: Union[int, float, Fraction]
+    ) -> 'VideoFrame':
         """
         Get all the frames that are played at the
         't' time provided, but combined in one.
```
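A side note on `index = 1 * do_use_second_track`: it leans on `bool` being an `int` subclass in Python, so the flag picks between the two hard-coded tracks:

```python
# bool is an int subclass, so multiplying selects the track index:
assert 1 * False == 0  # first track
assert 1 * True == 1   # second track
# int(do_use_second_track) would be an equivalent, more explicit spelling.
```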
```diff
@@ -82,29 +121,43 @@ class Timeline:
             track.get_frame_at(t)
             for track in self.tracks
         )
+        # TODO: Here I receive black frames because
+        # the track was empty, but I don't have a way
+        # to detect those black empty frames because
+        # they are just VideoFrame instances... I
+        # need a way to know, so I can skip them when
+        # another track has a frame, or to know if
+        # I want them as transparent or something
 
-        frames = [
-            frame
-            for frame in frames
-            if frame is not None
-        ]
-
-        return (
-            # TODO: Combinate them, I send first by now
-            frames[0]
-            if len(frames) > 0 else
-            # TODO: Should I send None or a full
-            # black (or transparent) frame? I think
-            # None is better because I don't know
-            # the size here (?)
-            None
-        )
+        # TODO: Combine them, I send the first one by now
+        return next(frames)
 
+    def get_audio_frames_at(
+        self,
+        t: float
+    ):
+        # TODO: What if the different audio streams
+        # also have different fps (?)
+        frames = []
+        for track in self.tracks:
+            # TODO: Make this work properly
+            audio_frames = track.get_audio_frames_at(t)
+
+            # TODO: Combine them
+            if audio_frames is not None:
+                frames = audio_frames
+                break
+
+        #from yta_video_opengl.utils import get_silent_audio_frame
+        #make_silent_audio_frame()
+        for frame in frames:
+            yield frame
+
     def render(
         self,
         filename: str,
-        start: float = 0.0,
-        end: Union[float, None] = None
+        start: Union[int, float, Fraction] = 0.0,
+        end: Union[int, float, Fraction, None] = None
     ) -> 'Timeline':
         """
         Render the time range in between the given
```
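`get_frame_at` now assumes every track always returns a frame (possibly a black filler), so it simply takes the first one; the "combine them" TODO is still open. One possible direction, sketched here as a plain mean blend over PyAV frames; the function and the blending rule are assumptions, not the package's actual compositor:

```python
import av
import numpy as np

# Hypothetical compositor for the "combine them" TODO: blend the per-track
# frames into one. A real timeline would respect track priority and
# transparency instead of a plain average.
def combine_frames(frames: list[av.VideoFrame]) -> av.VideoFrame:
    arrays = [
        frame.to_ndarray(format = 'rgb24')
        for frame in frames
    ]

    blended = np.mean(arrays, axis = 0).astype(np.uint8)

    return av.VideoFrame.from_ndarray(blended, format = 'rgb24')
```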
```diff
@@ -115,8 +168,10 @@ class Timeline:
         project will be rendered.
         """
         ParameterValidator.validate_mandatory_string('filename', filename, do_accept_empty = False)
-        ParameterValidator.validate_mandatory_positive_number('start', start, do_include_zero = True)
-        ParameterValidator.validate_positive_number('end', end, do_include_zero = False)
+        # TODO: We need to accept Fraction as number
+        #ParameterValidator.validate_mandatory_positive_number('start', start, do_include_zero = True)
+        # TODO: We need to accept Fraction as number
+        #ParameterValidator.validate_positive_number('end', end, do_include_zero = False)
 
         # TODO: Limit 'end' a bit...
         end = (
```
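The start/end validations are disabled because `ParameterValidator` does not accept `Fraction` values as numbers yet. Until it does, an interim guard could look like this hypothetical stand-in; `numbers.Rational` covers both `fractions.Fraction` and `quicktions.Fraction`:

```python
from numbers import Rational

# Hypothetical stand-in for the disabled validations: accept any int,
# float or rational number and reject negatives.
def validate_positive_time(name: str, value) -> None:
    if not isinstance(value, (int, float, Rational)):
        raise TypeError(f'The "{name}" parameter must be a number.')

    if value < 0:
        raise ValueError(f'The "{name}" parameter must be positive.')
```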
```diff
@@ -127,20 +182,6 @@ class Timeline:
 
         if start >= end:
             raise Exception('The provided "start" cannot be greater than or equal to the "end" provided.')
-        # TODO: Obtain all the 't', based on 'fps'
-        # that we need to render from 'start' to
-        # 'end'
-        # TODO: I don't want to have this here
-        def generate_times(start: float, end: float, fps: int):
-            dt = 1.0 / fps
-            times = []
-
-            t = start
-            while t <= end:
-                times.append(t + 0.000001)
-                t += dt
-
-            return times
 
         from yta_video_opengl.writer import VideoWriter
 
```
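The removed `generate_times` was the float version of this iteration: accumulating `t += dt` drifts, hence the `+ 0.000001` nudge it needed. Its replacement, `get_ts` from `yta_video_opengl.t`, is not shown in this diff, but an exact, Fraction-based equivalent would look roughly like this hypothetical sketch:

```python
from quicktions import Fraction

# Hypothetical sketch of 'get_ts': yield one exact timestamp per frame
# between 'start' and 'end'. Rational arithmetic never drifts, so no
# epsilon nudge is needed.
def get_ts(start, end, fps):
    frame_duration = 1 / Fraction(fps)

    t = Fraction(start)
    while t < Fraction(end):
        yield t
        t += frame_duration
```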
```diff
@@ -149,31 +190,78 @@ class Timeline:
         # video we are writing
         writer.set_video_stream(
             codec_name = 'h264',
-            fps = 60,
-            size = (1920, 1080),
+            fps = self.fps,
+            size = self.size,
             pixel_format = 'yuv420p'
         )
 
-        for t in generate_times(start, end, self.fps):
+        writer.set_audio_stream(
+            codec_name = 'aac',
+            fps = self.audio_fps
+        )
+
+        time_base = fps_to_time_base(self.fps)
+        audio_time_base = fps_to_time_base(self.audio_fps)
+
+        """
+        We are trying to render this:
+        -----------------------------
+        [0 to 0.5)     => black frames
+        [0.5 to 1.25)  => [0.25 to 1.0) of Video1
+        [1.25 to 1.75) => black frames
+        [1.75 to 2.25) => [0.25 to 0.75) of Video1
+        [2.25 to 3.0)  => black frames
+        [3.0 to 3.75)  => [2.25 to 3.0) of Video2
+        """
+
+        audio_pts = 0
+        for t in get_ts(start, end, self.fps):
             frame = self.get_frame_at(t)
 
-            if frame is None:
-                # Replace with black background if no frame
-                frame = av.VideoFrame.from_ndarray(
-                    array = np.zeros((1920, 1080, 3), dtype = np.uint8),
-                    format = 'rgb24'
-                )
+            #print(frame)
 
             # We need to adjust our output elements to be
             # consecutive and with the right values
             # TODO: We are using int() for fps but it's float...
-            frame.time_base = Fraction(1, int(self.fps))
-            frame.pts = int(t / frame.time_base)
+            frame.time_base = time_base
+            #frame.pts = int(video_frame_index / frame.time_base)
+            frame.pts = T(t, time_base).truncated_pts
 
             # TODO: We need to handle the audio
             writer.mux_video_frame(
                 frame = frame
             )
 
+            #print(f' [VIDEO] Here in t:{str(t)} -> pts:{str(frame.pts)} - dts:{str(frame.dts)}')
+
+            # TODO: Uncomment all this below for the audio
+            num_of_audio_frames = 0
+            for audio_frame in self.get_audio_frames_at(t):
+                # TODO: The track gives us empty (black)
+                # frames by default, but maybe we need a
+                # @dataclass in the middle to handle if
+                # we want transparent frames or not and/or
+                # to detect them here because, if not,
+                # they are just simple VideoFrames and we
+                # don't know they are 'empty' frames
+
+                # We need to adjust our output elements to be
+                # consecutive and with the right values
+                # TODO: We are using int() for fps but it's float...
+                audio_frame.time_base = audio_time_base
+                #audio_frame.pts = int(audio_frame_index / audio_frame.time_base)
+                audio_frame.pts = audio_pts
+                # We increment it for the next iteration
+                audio_pts += audio_frame.samples
+                #audio_frame.pts = int(t + (audio_frame_index * audio_frame.time_base) / audio_frame.time_base)
+
+                #print(f'[AUDIO] Here in t:{str(t)} -> pts:{str(audio_frame.pts)} - dts:{str(audio_frame.dts)}')
+
+                #num_of_audio_frames += 1
+                #print(audio_frame)
+                writer.mux_audio_frame(audio_frame)
+            #print(f'Num of audio frames: {str(num_of_audio_frames)}')
+
         writer.mux_video_frame(None)
+        writer.mux_audio_frame(None)
         writer.output.close()
```
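Finally, the audio pts bookkeeping: with an audio time base of 1/sample_rate, pts is measured in samples, so advancing `audio_pts` by `audio_frame.samples` makes each frame start exactly where the previous one ended. (The trailing `mux_video_frame(None)` / `mux_audio_frame(None)` calls presumably follow PyAV's encode-None convention of flushing the encoders.) A worked example of the arithmetic:

```python
from quicktions import Fraction

# With time_base = 1 / sample_rate, pts counts samples: frame N of 1024
# samples must start at pts N * 1024 to be gapless.
time_base = Fraction(1, 44_100)
samples_per_frame = 1024

for index in range(3):
    pts = index * samples_per_frame
    print(f'frame {index}: pts={pts} -> {float(pts * time_base):.6f}s')

# frame 0: pts=0 -> 0.000000s
# frame 1: pts=1024 -> 0.023220s
# frame 2: pts=2048 -> 0.046440s
```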