PyPI - yta-video-opengl - Versions diffs - 0.0.6__tar.gz → 0.0.8__tar.gz - Mend

yta-video-opengl 0.0.6tar.gz → 0.0.8tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (13) hide show

{yta_video_opengl-0.0.6 → yta_video_opengl-0.0.8}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.3
 Name: yta-video-opengl
-Version: 0.0.6
+Version: 0.0.8
 Summary: Youtube Autonomous Video OpenGL Module
 Author: danialcala94
 Author-email: danielalcalavalera@gmail.com

{yta_video_opengl-0.0.6 → yta_video_opengl-0.0.8}/pyproject.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [project]
 name = "yta-video-opengl"
-version = "0.0.6"
+version = "0.0.8"
 description = "Youtube Autonomous Video OpenGL Module"
 authors = [
     {name = "danialcala94",email = "danielalcalavalera@gmail.com"}

{yta_video_opengl-0.0.6 → yta_video_opengl-0.0.8}/src/yta_video_opengl/classes.py RENAMED Viewed

@@ -8,7 +8,8 @@ so we use different triangles to build
 our shapes (quad normally).
 """
 from yta_validation.parameter import ParameterValidator
-from yta_video_opengl.utils import frame_to_texture
+from yta_validation import PythonValidator
+from yta_video_opengl.utils import frame_to_texture, get_fullscreen_quad_vao
 from abc import ABC, abstractmethod
 from typing import Union
@@ -24,29 +25,48 @@ class _Uniforms:
     """
     @property
-    def program(
+    def uniforms(
         self
-    ):
+    ) -> dict:
         """
-        Shortcut to the FrameShader program.
+        The uniforms in the program, as a dict, in
+        the format `{key, value}`.
         """
-        return self._shader_instance.program
+        return {
+            key: self.program[key].value
+            for key in self.program
+            if PythonValidator.is_instance_of(self.program[key], moderngl.Uniform)
+        }
     def __init__(
         self,
-        shader_instance: 'FrameShaderBase'
+        program: moderngl.Program
     ):
-        self._shader_instance: 'FrameShaderBase' = shader_instance
+        self.program: moderngl.Program = program
+        """
+        The program instance this handler class
+        belongs to.
+        """
+    def get(
+        self,
+        name: str
+    ) -> Union[any, None]:
         """
-        The instance of the FrameShader class these
-        uniforms belong to.
+        Get the value of the uniform with the
+        given 'name'.
         """
+        return self.uniforms.get(name, None)
+    # TODO: I need to refactor these methods to
+    # accept **kwargs maybe, or to auto-detect
+    # the type of the value and set the uniform
+    # the way it must be done
     def set(
         self,
         name: str,
         value
-    ) -> 'FrameShaderBase':
+    ) -> '_Uniforms':
         """
         Set the provided 'value' to the normal type
         uniform with the given 'name'. Here you have
@@ -59,13 +79,13 @@ class _Uniforms:
         if name in self.program:
             self.program[name].value = value
-        return self._shader_instance
+        return self
     def set_vec(
         self,
         name: str,
         values
-    ) -> 'FrameShaderBase':
+    ) -> '_Uniforms':
         """
         Set the provided 'value' to the normal type
         uniform with the given 'name'. Here you have
@@ -78,11 +98,13 @@ class _Uniforms:
         if name in self.program:
             self.program[name].write(np.array(values, dtype = 'f4').tobytes())
+        return self
     def set_mat(
         self,
         name: str,
         value
-    ) -> 'FrameShaderBase':
+    ) -> '_Uniforms':
         """
         Set the provided 'value' to a `matN` type
         uniform with the given 'name'. The 'value'
@@ -99,16 +121,26 @@ class _Uniforms:
         if name in self.program:
             self.program[name].write(value)
-        return self._shader_instance
+        return self
+    def print(
+        self
+    ) -> '_Uniforms':
+        """
+        Print the defined uniforms in console.
+        """
+        for key, value in self.uniforms.items():
+            print(f'"{key}": {str(value)}')
-class FrameShaderBase(ABC):
+class BaseNode:
     """
-    Class to be inherited by any of our own
-    custom opengl program classes.
+    The basic class of a node to manipulate frames
+    as opengl textures. This node will process the
+    frame as an input texture and will generate
+    also a texture as the output.
-    This shader base class must be used by all
-    the classes that are modifying the frames
-    one by one.
+    Nodes can be chained and the result from one
+    node can be applied on another node.
     """
     @property
@@ -117,7 +149,7 @@ class FrameShaderBase(ABC):
         self
     ) -> str:
         """
-        Source code of the vertex shader.
+        The code of the vertex shader.
         """
         pass
@@ -127,47 +159,211 @@ class FrameShaderBase(ABC):
         self
     ) -> str:
         """
-        Source code of the fragment shader.
+        The code of the fragment shader.
         """
         pass
+    def __init__(
+        self,
+        context: moderngl.Context,
+        size: tuple[int, int],
+        **kwargs
+    ):
+        ParameterValidator.validate_mandatory_instance_of('context', context, moderngl.Context)
+        # TODO: Validate size
+        self.context: moderngl.Context = context
+        """
+        The context of the program.
+        """
+        self.size: tuple[int, int] = size
+        """
+        The size we want to use for the frame buffer
+        in a (width, height) format.
+        """
+        # Compile shaders within the program
+        self.program: moderngl.Program = self.context.program(
+            vertex_shader = self.vertex_shader,
+            fragment_shader = self.fragment_shader
+        )
+        # Create the fullscreen quad
+        self.quad = get_fullscreen_quad_vao(
+            context = self.context,
+            program = self.program
+        )
+        # Create the output fbo
+        self.output_tex = self.context.texture(self.size, 4)
+        self.output_tex.filter = (moderngl.LINEAR, moderngl.LINEAR)
+        self.fbo = self.context.framebuffer(color_attachments = [self.output_tex])
+        self.uniforms: _Uniforms = _Uniforms(self.program)
+        """
+        Shortcut to the uniforms functionality.
+        """
+        # Auto set uniforms dynamically if existing
+        for key, value in kwargs.items():
+            self.uniforms.set(key, value)
+    def process(
+        self,
+        input: Union[moderngl.Texture, 'VideoFrame', 'np.ndarray']
+    ) -> moderngl.Texture:
+        """
+        Apply the shader to the 'input' and return
+        the resulting texture.
+        The 'input' can be a texture, a pyav
+        VideoFrame or a numpy array. The frames and
+        the arrays are uploaded to a temporary
+        texture that is released as soon as it has
+        been rendered.
+        We use and return textures to maintain
+        the process in GPU and optimize it. The
+        texture returned is the output texture of
+        this node, so it is overwritten the next
+        time this method is called.
+        """
+        # Only the textures created here are released
+        # here, the ones received belong to the caller
+        is_temporary = PythonValidator.is_instance_of(input, ['VideoFrame', 'ndarray'])
+        if is_temporary:
+            # TODO: What about the numpy format (?)
+            input = frame_to_texture(input, self.context)
+        self.fbo.use()
+        self.context.clear(0.0, 0.0, 0.0, 0.0)
+        input.use(location = 0)
+        # Point the sampler to the texture unit 0. The
+        # WavingNode shader names it 'tex', and the
+        # 'texture' name is kept for compatibility
+        for sampler_name in ('tex', 'texture'):
+            if sampler_name in self.program:
+                self.program[sampler_name] = 0
+        self.quad.render()
+        if is_temporary:
+            # Avoid leaking one GPU texture per frame
+            input.release()
+        return self.output_tex
+class WavingNode(BaseNode):
+    """
+    Just an example, without the shaders code
+    actually, to indicate that we can use
+    custom parameters to make it work.
+    """
     @property
-    def vertices(
+    def vertex_shader(
         self
-    ) -> 'np.ndarray':
+    ) -> str:
+        return (
+            '''
+            #version 330
+            in vec2 in_vert;
+            in vec2 in_texcoord;
+            out vec2 v_uv;
+            void main() {
+                v_uv = in_texcoord;
+                gl_Position = vec4(in_vert, 0.0, 1.0);
+            }
+            '''
+        )
+    @property
+    def fragment_shader(
+        self
+    ) -> str:
+        return (
+            '''
+            #version 330
+            uniform sampler2D tex;
+            uniform float time;
+            uniform float amplitude;
+            uniform float frequency;
+            uniform float speed;
+            in vec2 v_uv;
+            out vec4 f_color;
+            void main() {
+                float wave = sin(v_uv.x * frequency + time * speed) * amplitude;
+                vec2 uv = vec2(v_uv.x, v_uv.y + wave);
+                f_color = texture(tex, uv);
+            }
+            '''
+        )
+    def __init__(
+        self,
+        context: moderngl.Context,
+        size: tuple[int, int],
+        amplitude: float = 0.05,
+        frequency: float = 10.0,
+        speed: float = 2.0
+    ):
+        super().__init__(
+            context = context,
+            size = size,
+            amplitude = amplitude,
+            frequency = frequency,
+            speed = speed
+        )
+    # This is just an example and we are not
+    # using the parameters actually, but we
+    # could set those specific uniforms to be
+    # processed by the code
+    def process(
+        self,
+        input: Union[moderngl.Texture, 'VideoFrame', 'np.ndarray'],
+        t: float = 0.0,
+    ) -> moderngl.Texture:
+        """
+        Apply the shader to the 'input', that
+        must be a frame or a texture, and return
+        the new resulting texture.
+        We use and return textures to maintain
+        the process in GPU and optimize it.
+        """
+        self.uniforms.set('time', t)
+        return super().process(input)
+"""
+TODO: I should try to use the Node classes
+to manipulate the frames because this is how
+Davinci Resolve and other editors work.
+"""
+class FrameShaderBase(ABC):
+    """
+    Class to be inherited by any of our own
+    custom opengl program classes.
+    This shader base class must be used by all
+    the classes that are modifying the frames
+    one by one.
+    """
+    @property
+    @abstractmethod
+    def vertex_shader(
+        self
+    ) -> str:
         """
-        The UV coordinates to build the quad we
-        will use to represent the frame by
-        applying it as a texture.
+        Source code of the vertex shader.
         """
-        return np.array([
-            # vertex 0 - bottom left
-            -1.0, -1.0,  0.0, 0.0,
-            # vertex 1 - bottom right
-            1.0, -1.0,  1.0, 0.0,
-            # vertex 2 - top left
-            -1.0,  1.0,  0.0, 1.0,
-            # vertex 3 - top right
-            1.0,  1.0,  1.0, 1.0
-        ], dtype = 'f4')
+        pass
     @property
-    def indexes(
+    @abstractmethod
+    def fragment_shader(
         self
-    ) -> 'np.ndarray':
+    ) -> str:
         """
-        The indexes of the vertices (see 'vertices'
-        property) to build the 2 opengl triangles
-        that will represent the quad we need for
-        the frame.
+        Source code of the fragment shader.
         """
-        return np.array(
-            [
-                0, 1, 2,
-                2, 1, 3
-            ],
-            dtype = 'i4'
-        )
+        pass
     def __init__(
         self,
@@ -203,14 +399,6 @@ class FrameShaderBase(ABC):
         """
         The frame buffer object.
         """
-        self.vbo: moderngl.Buffer = None
-        """
-        The vertices buffer object.
-        """
-        self.ibo: moderngl.Buffer = None
-        """
-        The indexes buffer object.
-        """
         self.uniforms: _Uniforms = None
         """
         Shortcut to the uniforms functionality.
@@ -221,6 +409,12 @@ class FrameShaderBase(ABC):
     def _initialize_program(
         self
     ):
+        """
+        This method is to allow the effects to
+        change their '__init__' method to be able
+        to provide parameters that will be set as
+        uniforms.
+        """
         # Compile shaders within the program
         self.program: moderngl.Program = self.context.program(
             vertex_shader = self.vertex_shader,
@@ -229,18 +423,9 @@ class FrameShaderBase(ABC):
         # Create frame buffer
         self.fbo = self.context.simple_framebuffer(self.size)
-        # Create buffers
-        # TODO: I could have more than 1 vertices,
-        # so more than 1 vbo and more than 1 vao...
-        self.vbo: moderngl.Buffer = self.context.buffer(self.vertices.tobytes())
-        self.ibo: moderngl.Buffer = self.context.buffer(self.indexes.tobytes())
-        vao_content = [
-            (self.vbo, "2f 2f", "in_vert", "in_texcoord")
-        ]
-        self.vao: moderngl.VertexArray = self.context.vertex_array(self.program, vao_content, self.ibo)
-        self.uniforms: _Uniforms = _Uniforms(self)
+        # Create quad vertex array
+        self.vao: moderngl.VertexArray = get_fullscreen_quad_vao(self.context, self.program)
+        self.uniforms: _Uniforms = _Uniforms(self.program)
         # TODO: How do I manage these textures (?)
         self.textures = {}
@@ -270,8 +455,7 @@ class FrameShaderBase(ABC):
         tex = self.context.texture((image.shape[1], image.shape[0]), 4, image.tobytes())
         tex.use(texture_unit)
         self.textures[uniform_name] = tex
-        if uniform_name in self.program:
-            self.program[uniform_name].value = texture_unit
+        self.uniforms.set(uniform_name, texture_unit)
     @abstractmethod
     def _prepare_frame(

{yta_video_opengl-0.0.6 → yta_video_opengl-0.0.8}/src/yta_video_opengl/reader/__init__.py RENAMED Viewed

@@ -3,6 +3,7 @@ A video reader using the PyAv (av) library
 that, using ffmpeg, detects the video.
 """
 from yta_video_opengl.reader.cache import VideoFrameCache
+from yta_video_opengl.utils import iterate_stream_frames_demuxing
 from yta_validation import PythonValidator
 from av.video.frame import VideoFrame
 from av.audio.frame import AudioFrame
@@ -32,7 +33,7 @@ class VideoReaderFrame:
         Flag to indicate if the instance is a video
         frame.
         """
-        return PythonValidator.is_instance_of(self.data, VideoFrame)
+        return PythonValidator.is_instance_of(self.value, VideoFrame)
     @property
     def is_audio(
@@ -42,18 +43,37 @@ class VideoReaderFrame:
         Flag to indicate if the instance is an audio
         frame.
         """
-        return PythonValidator.is_instance_of(self.data, AudioFrame)
+        return PythonValidator.is_instance_of(self.value, AudioFrame)
+    @property
+    def as_numpy(
+        self
+    ):
+        """
+        The frame as a numpy array.
+        """
+        return self.value.to_ndarray(format = self.pixel_format)
     def __init__(
         self,
         # TODO: Add the type, please
-        data: any
+        frame: any,
+        t: float = None,
+        pixel_format: str = 'rgb24'
     ):
-        self.data: Union[AudioFrame, VideoFrame] = data
+        self.value: Union[AudioFrame, VideoFrame] = frame
         """
         The frame content, that can be audio or video
         frame.
         """
+        self.t: float = t
+        """
+        The 't' time moment of the frame.
+        """
+        self.pixel_format: str = pixel_format
+        """
+        The pixel format of the frame.
+        """
 @dataclass
 class VideoReaderPacket:
@@ -71,7 +91,7 @@ class VideoReaderPacket:
         Flag to indicate if the packet includes video
         frames or not.
         """
-        return self.data.stream.type == 'video'
+        return self.value.stream.type == 'video'
     @property
     def is_audio(
@@ -81,13 +101,13 @@ class VideoReaderPacket:
         Flag to indicate if the packet includes audio
         frames or not.
         """
-        return self.data.stream.type == 'audio'
+        return self.value.stream.type == 'audio'
     def __init__(
         self,
-        data: Packet
+        packet: Packet
     ):
-        self.data: Packet = data
+        self.value: Packet = packet
         """
         The packet, that can include video or audio
         frames and can be decoded.
@@ -100,7 +120,7 @@ class VideoReaderPacket:
         Get the frames but decoded, perfect to make
         modifications and encode to save them again.
         """
-        return self.data.decode()
+        return self.value.decode()
 class VideoReader:
@@ -266,7 +286,55 @@ class VideoReader:
         The fps of the audio.
         """
         # TODO: What if no audio (?)
-        return self.audio_stream.average_rate
+        return self.audio_stream.rate
+    @property
+    def time_base(
+        self
+    ) -> Fraction:
+        """
+        The time base of the video.
+        """
+        return self.video_stream.time_base
+    @property
+    def audio_time_base(
+        self
+    ) -> Fraction:
+        """
+        The time base of the audio.
+        """
+        # TODO: What if no audio (?)
+        return self.audio_stream.time_base
+    @property
+    def duration(
+        self
+    ) -> Union[float, None]:
+        """
+        The duration of the video.
+        """
+        return (
+            float(self.video_stream.duration * self.video_stream.time_base)
+            if self.video_stream.duration else
+            # TODO: What to do in this case (?)
+            None
+        )
+    @property
+    def audio_duration(
+        self
+    ) -> Union[float, None]:
+        """
+        The duration of the audio.
+        """
+        # TODO: What if no audio (?)
+        return (
+            float(self.audio_stream.duration * self.audio_stream.time_base)
+            if self.audio_stream.duration else
+            # TODO: What to do in this case (?)
+            None
+        )
     @property
     def size(
@@ -303,12 +371,18 @@ class VideoReader:
     def __init__(
         self,
-        filename: str
+        filename: str,
+        # Use 'rgba' if alpha channel
+        pixel_format: str = 'rgb24'
     ):
         self.filename: str = filename
         """
         The filename of the video source.
         """
+        self.pixel_format: str = pixel_format
+        """
+        The pixel format.
+        """
         self.container: InputContainer = None
         """
         The av input general container of the
@@ -362,6 +436,26 @@ class VideoReader:
             self.audio_stream.thread_type = 'AUTO'
             self.cache = VideoFrameCache(self)
+    def seek(
+        self,
+        pts,
+        stream = None
+    ) -> 'VideoReader':
+        """
+        Call the container '.seek()' method with
+        the given 'pts' packet time stamp.
+        The video stream is used if no 'stream'
+        is provided.
+        This instance is returned, so the calls
+        can be chained.
+        """
+        # Seek on the video stream by default
+        stream = (
+            self.video_stream
+            if stream is None else
+            stream
+        )
+        # TODO: Is 'offset' actually a 'pts' (?)
+        # NOTE(review): the pyav documentation seems
+        # to describe the offset as expressed in the
+        # 'time_base' of the given stream, which is
+        # what a 'pts' is - confirm
+        self.container.seek(pts, stream = stream)
+        return self
     def iterate(
         self
     ) -> 'Iterator[Union[VideoFrame, AudioFrame]]':
@@ -370,7 +464,11 @@ class VideoReader:
         (already decoded).
         """
         for frame in self.frame_iterator:
-            yield VideoReaderFrame(frame)
+            yield VideoReaderFrame(
+                frame = frame,
+                t = float(frame.pts * self.time_base),
+                pixel_format = self.pixel_format
+            )
     def iterate_with_audio(
         self,
@@ -407,7 +505,58 @@ class VideoReader:
                     yield VideoReaderFrame(frame)
             else:
                 # Return the packet as it is
-                yield VideoReaderPacket(packet)
+                yield VideoReaderPacket(packet)
+    # These methods below are using the demux
+    def iterate_video_frames(
+        self,
+        start_pts: int = 0,
+        end_pts: Union[int, None] = None
+    ):
+        """
+        Iterate over the video stream packets and
+        yield only the frames in the expected
+        range, from 'start_pts' to 'end_pts' (or
+        to the end if 'end_pts' is None).
+        This method yields tuples of 3 elements:
+        - `frame` as a `VideoFrame` instance
+        - `t` as the frame time moment
+        - `index` as the frame index
+        """
+        # The range is the video one, so it has to
+        # be sent with the 'video_' parameter names
+        # the function accepts
+        yield from iterate_stream_frames_demuxing(
+            container = self.container,
+            video_stream = self.video_stream,
+            audio_stream = None,
+            video_start_pts = start_pts,
+            video_end_pts = end_pts
+        )
+    def iterate_audio_frames(
+        self,
+        start_pts: int = 0,
+        end_pts: Union[int, None] = None
+    ):
+        """
+        Iterate over the audio stream packets and
+        yield only the frames in the expected
+        range, from 'start_pts' to 'end_pts' (or
+        to the end if 'end_pts' is None).
+        This method yields tuples of 3 elements:
+        - `frame` as a `AudioFrame` instance
+        - `t` as the frame time moment
+        - `index` as the frame index
+        """
+        # The range is the audio one, so it has to
+        # be sent with the 'audio_' parameter names
+        # the function accepts
+        yield from iterate_stream_frames_demuxing(
+            container = self.container,
+            video_stream = None,
+            audio_stream = self.audio_stream,
+            audio_start_pts = start_pts,
+            audio_end_pts = end_pts
+        )
     # TODO: Will we use this (?)
     def get_frame(
@@ -419,6 +568,14 @@ class VideoReader:
         the cache system.
         """
         return self.cache.get_frame(index)
+    def close(
+        self
+    ) -> None:
+        """
+        Close the container to free it.
+        """
+        self.container.close()

{yta_video_opengl-0.0.6 → yta_video_opengl-0.0.8}/src/yta_video_opengl/tests.py RENAMED Viewed

@@ -579,7 +579,13 @@ def video_modified_stored():
     # TODO: Where do we obtain this from (?)
     PIXEL_FORMAT = 'yuv420p'
-    from yta_video_opengl.classes import WavingFrame, BreathingFrame, HandheldFrame, OrbitingFrame, RotatingInCenterFrame, StrangeTvFrame, GlitchRgbFrame
+    from yta_video_opengl.classes import WavingFrame, BreathingFrame, HandheldFrame, OrbitingFrame, RotatingInCenterFrame, StrangeTvFrame, GlitchRgbFrame, WavingNode
+    from yta_video_opengl.utils import texture_to_frame, frame_to_texture
+    from yta_video_opengl.video import Video
+    Video(VIDEO_PATH, 0, 0.5).save_as(OUTPUT_PATH)
+    return
     video = VideoReader(VIDEO_PATH)
     video_writer = (
@@ -604,6 +610,10 @@ def video_modified_stored():
         size = video.size,
         first_frame = video.next_frame
     )
+    context = moderngl.create_context(standalone = True)
+    # New way, with nodes
+    node = WavingNode(context, video.size, amplitude = 0.2, frequency = 9, speed = 3)
     # We need to reset it to being again pointing
     # to the first frame...
     # TODO: Improve this by, maybe, storing the first
@@ -624,21 +634,32 @@ def video_modified_stored():
         # To simplify the process
         if frame_or_packet is not None:
-            frame_or_packet = frame_or_packet.data
+            frame_or_packet = frame_or_packet.value
         if is_audio_packet:
             video_writer.mux(frame_or_packet)
         elif is_video_frame:
             with Timer(is_silent_as_context = True) as timer:
                 t = T.video_frame_index_to_video_frame_time(frame_index, float(video.fps))
+                # This is another way of getting 't'
+                #t = float(frame_or_packet.pts * video.time_base)
                 video_writer.mux_video_frame(
-                    effect.process_frame(
-                        frame = frame_or_packet,
-                        t = t,
-                        numpy_format = NUMPY_FORMAT
+                    frame = texture_to_frame(
+                        texture = node.process(
+                            input = frame_or_packet,
+                            t = t
+                        )
                     )
                 )
+                # video_writer.mux_video_frame(
+                #     effect.process_frame(
+                #         frame = frame_or_packet,
+                #         t = t,
+                #         numpy_format = NUMPY_FORMAT
+                #     )
+                # )
                 frame_index += 1

yta_video_opengl-0.0.8/src/yta_video_opengl/utils.py ADDED Viewed

@@ -0,0 +1,343 @@
+from yta_validation import PythonValidator
+from av.container import InputContainer
+from av.video.stream import VideoStream
+from av.audio.stream import AudioStream
+from av.video.frame import VideoFrame
+from typing import Union
+import av
+import numpy as np
+import moderngl
+def frame_to_texture(
+    frame: Union['VideoFrame', 'np.ndarray'],
+    context: moderngl.Context,
+    numpy_format: str = 'rgb24'
+) -> moderngl.Texture:
+    """
+    Transform the given 'frame' to an opengl
+    texture. The frame can be a VideoFrame
+    instance (from pyav library) or a numpy
+    array.
+    The 'numpy_format' is only used to turn a
+    VideoFrame into a numpy array, so it is
+    ignored when a numpy array is provided.
+    The array must have 3 dimensions, as the
+    third one is used as the number of
+    components of the texture.
+    """
+    # To numpy RGB inverted for opengl
+    frame: np.ndarray = (
+        np.flipud(frame.to_ndarray(format = numpy_format))
+        if PythonValidator.is_instance_of(frame, 'VideoFrame') else
+        np.flipud(frame)
+    )
+    # The array is read as (rows, columns, components)
+    # and the texture size is built as (columns, rows)
+    return context.texture(
+        size = (frame.shape[1], frame.shape[0]),
+        components = frame.shape[2],
+        data = frame.tobytes()
+    )
+# TODO: I should make different methods to
+# obtain a VideoFrame or a numpy array frame
+def texture_to_frame(
+    texture: moderngl.Texture
+) -> 'VideoFrame':
+    """
+    Transform an opengl texture into a pyav
+    VideoFrame instance.
+    The texture content is read as 4 components
+    of 1 byte each per pixel, and the frame
+    returned is always reformatted to 'yuv420p'.
+    """
+    # RGBA8
+    data = texture.read(alignment = 1)
+    # The 4 components are hard-coded here, so a
+    # texture with a different layout will not fit
+    frame = np.frombuffer(data, dtype = np.uint8).reshape((texture.size[1], texture.size[0], 4))
+    # Opengl gives it with the y inverted
+    frame = np.flipud(frame)
+    # TODO: This can be returned as a numpy frame
+    # This is if we need an 'av' VideoFrame (to
+    # export through the demuxer, for example)
+    frame = av.VideoFrame.from_ndarray(frame, format = 'rgba')
+    # TODO: Make this customizable
+    frame = frame.reformat(format = 'yuv420p')
+    return frame
+def get_fullscreen_quad_vao(
+    context: moderngl.Context,
+    program: moderngl.Program
+) -> moderngl.VertexArray:
+    """
+    Build the vertex array object of the quad
+    we use to draw a frame as a texture, made
+    of 4 vertices and 2 triangles, and bound
+    to the 'in_vert' and 'in_texcoord' inputs
+    of the given 'program'.
+    """
+    # One row per vertex: the position in NDC
+    # (-1..1) and the texture coords (0..1) as
+    # 'pos.x, pos.y, tex.u, tex.v'
+    quad_vertices = np.array([
+        [-1.0, -1.0, 0.0, 0.0],  # vertex 0 - bottom left
+        [1.0, -1.0, 1.0, 0.0],  # vertex 1 - bottom right
+        [-1.0, 1.0, 0.0, 1.0],  # vertex 2 - top left
+        [1.0, 1.0, 1.0, 1.0],  # vertex 3 - top right
+    ], dtype = 'f4')
+    # One row per triangle: the indexes of the
+    # vertices above that build each of the 2
+    # opengl triangles of the quad
+    triangle_indexes = np.array([
+        [0, 1, 2],
+        [2, 1, 3],
+    ], dtype = 'i4')
+    return context.vertex_array(
+        program,
+        [
+            # 2 floats position, 2 floats texcoords
+            (context.buffer(quad_vertices.tobytes()), '2f 2f', 'in_vert', 'in_texcoord'),
+        ],
+        context.buffer(triangle_indexes.tobytes())
+    )
+def iterate_streams_packets(
+    container: 'InputContainer',
+    video_stream: 'VideoStream',
+    audio_stream: 'AudioStream',
+    video_start_pts: int = 0,
+    video_end_pts: Union[int, None] = None,
+    audio_start_pts: int = 0,
+    audio_end_pts: Union[int, None] = None
+):
+    """
+    Seek the 'container' to the start of the
+    provided streams and yield their packets,
+    in the order they are demuxed, ignoring the
+    ones that have no 'pts'.
+    At least one of 'video_stream' and
+    'audio_stream' must be provided, or an
+    Exception is raised.
+    The 'video_end_pts' and 'audio_end_pts' are
+    accepted but not used by now: no packet is
+    discarded by its 'pts', so the range must
+    be applied by the caller on the decoded
+    frames.
+    This is nice when trying to copy a stream
+    without modifications.
+    """
+    # 'video_start_pts' and 'audio_start_pts' must
+    # be 0 or a positive pts
+    if (
+        video_stream is None and
+        audio_stream is None
+    ):
+        raise Exception('No streams provided.')
+    # NOTE(review): both seeks act on the same
+    # container, so when the 2 streams are given
+    # the audio one is presumably the one that
+    # decides the position - confirm if seeking
+    # only on video is what we want
+    if video_stream is not None:
+        container.seek(video_start_pts, stream = video_stream)
+    if audio_stream is not None:
+        container.seek(audio_start_pts, stream = audio_stream)
+    streams = [
+        stream
+        for stream in (video_stream, audio_stream)
+        if stream
+    ]
+    # Apparently, if we ignore some packets based
+    # on the 'pts', we can be ignoring information
+    # that is needed for the next frames to be
+    # decoded, so we need to decode them all...
+    # If we can find some strategy to seek not for
+    # the immediate one but for some before, and
+    # read from that one to avoid reading all of
+    # the packets, we could save some time, but at
+    # what cost? We cannot skip any crucial frame,
+    # so we need to know how many we can skip, and
+    # that sounds a bit difficult depending on the
+    # codec.
+    for packet in container.demux(streams):
+        if packet.pts is None:
+            continue
+        # TODO: We cannot skip packets by comparing
+        # their 'pts' with the start and end of their
+        # stream, we need to look for the nearest
+        # keyframe to be able to decode the frames
+        # later. Take a look at the VideoFrameCache
+        # class and use it.
+        yield packet
+def iterate_stream_frames_demuxing(
+    container: 'InputContainer',
+    video_stream: 'VideoStream',
+    audio_stream: 'AudioStream',
+    video_start_pts : int = 0,
+    video_end_pts: Union[int, None] = None,
+    audio_start_pts: int = 0,
+    audio_end_pts: Union[int, None] = None
+):
+    """
+    Iterate over the packets of the provided
+    streams, decode them and yield only the
+    frames in the expected range of their
+    stream. The iteration stops when all the
+    provided streams have gone beyond their
+    end.
+    This method yields tuples of 3 elements:
+    - `frame` as a `VideoFrame` or `AudioFrame` instance
+    - `t` as the frame time moment
+    - `index` as the frame index
+    You can easily transform a video frame
+    received to a numpy array by using this:
+    - `frame.to_ndarray(format = format)`
+    """
+    # 'start_pts' must be 0 or a positive pts
+    # 'end_pts' must be None or a positive pts
+    # The amount of streams that must go beyond
+    # their end to consider that we have finished
+    number_of_streams = sum(
+        stream is not None
+        for stream in (video_stream, audio_stream)
+    )
+    # This must be outside of the packets loop or
+    # it would be forgotten with each new packet
+    streams_finished = set()
+    # We cannot skip packets or we will lose
+    # information needed to build the video
+    for packet in iterate_streams_packets(
+        container = container,
+        video_stream = video_stream,
+        audio_stream = audio_stream,
+        video_start_pts = video_start_pts,
+        video_end_pts = video_end_pts,
+        audio_start_pts = audio_start_pts,
+        audio_end_pts = audio_end_pts
+    ):
+        stream_type = packet.stream.type
+        if stream_type in streams_finished:
+            # No more frames needed from this stream,
+            # so we avoid the expensive decoding
+            continue
+        is_video = stream_type == 'video'
+        stream = (
+            video_stream
+            if is_video else
+            audio_stream
+        )
+        start_pts = (
+            video_start_pts
+            if is_video else
+            audio_start_pts
+        )
+        end_pts = (
+            video_end_pts
+            if is_video else
+            audio_end_pts
+        )
+        time_base = stream.time_base
+        average_rate = (
+            stream.average_rate
+            if is_video else
+            stream.rate
+        )
+        for frame in packet.decode():
+            if (
+                frame.pts is None or
+                frame.pts < start_pts
+            ):
+                continue
+            if (
+                end_pts is not None and
+                frame.pts > end_pts
+            ):
+                streams_finished.add(stream_type)
+                if len(streams_finished) >= number_of_streams:
+                    # We have yielded all the frames in the
+                    # expected range, no more needed
+                    return
+                continue
+            # TODO: Maybe send a @dataclass instead (?)
+            yield (
+                frame,
+                pts_to_t(frame.pts, time_base),
+                pts_to_index(frame.pts, time_base, average_rate)
+            )
+def t_to_pts(
+    t: float,
+    stream_time_base: 'Fraction'
+) -> int:
+    """
+    Get the packet timestamp (pts), the one the
+    pyav library understands, that corresponds
+    to the 't' time moment (in seconds) for the
+    'stream_time_base' given.
+    """
+    # NOTE(review): the small amount added is
+    # presumably to avoid that a float error makes
+    # the truncation fall into the previous tick
+    ticks = (t + 0.000001) / stream_time_base
+    return int(ticks)
+def pts_to_index(
+    pts: int,
+    stream_time_base: 'Fraction',
+    fps: float
+) -> int:
+    """
+    Get the index of the frame that corresponds
+    to the 'pts' packet timestamp, by turning it
+    into a time moment first and rounding the
+    amount of frames that fit until that moment.
+    """
+    t = pts_to_t(pts, stream_time_base)
+    number_of_frames = round(t * fps)
+    return int(number_of_frames)
+def pts_to_t(
+    pts: int,
+    stream_time_base: 'Fraction'
+) -> float:
+    """
+    Transform a 'pts' packet timestamp to a 't'
+    time moment, as a float, by multiplying it
+    by the 'stream_time_base' given.
+    """
+    # The product with a Fraction time base is a
+    # Fraction, so we turn it into the float we
+    # say we return
+    return float(pts * stream_time_base)

yta_video_opengl-0.0.8/src/yta_video_opengl/video.py ADDED Viewed

@@ -0,0 +1,164 @@
+from yta_video_opengl.reader import VideoReader
+from yta_video_opengl.writer import VideoWriter
+from yta_video_opengl.utils import iterate_stream_frames_demuxing
+from yta_validation import PythonValidator
+from typing import Union
+# TODO: Where can I obtain this dynamically (?)
+# Hard-coded pixel format name; presumably the
+# one to use for the written video stream
+# (TODO confirm)
+PIXEL_FORMAT = 'yuv420p'
+# TODO: Maybe rename to 'Media' (?)
+class Video:
+    """
+    Class to wrap the functionality related to
+    handling and modifying a video.
+    """
+    @property
+    def start_pts(
+        self
+    ) -> int:
+        """
+        The start packet time stamp (pts) of the
+        video stream, obtained from 'start' and
+        the reader video time base, needed to
+        optimize the packet iteration process.
+        """
+        return int(self.start / self.reader.time_base)
+    @property
+    def end_pts(
+        self
+    ) -> Union[int, None]:
+        """
+        The end packet time stamp (pts) of the
+        video stream, needed to optimize the
+        packet iteration process, or None if the
+        'end' is unknown.
+        """
+        return (
+            int(self.end / self.reader.time_base)
+            # TODO: What do we do if no duration (?)
+            if self.end is not None else
+            None
+        )
+    @property
+    def audio_start_pts(
+        self
+    ) -> int:
+        """
+        The start packet time stamp (pts) of the
+        audio stream, obtained from 'start' and
+        the reader audio time base, needed to
+        optimize the packet iteration process.
+        """
+        return int(self.start / self.reader.audio_time_base)
+    @property
+    def audio_end_pts(
+        self
+    ) -> Union[int, None]:
+        """
+        The end packet time stamp (pts) of the
+        audio stream, needed to optimize the
+        packet iteration process, or None if the
+        'end' is unknown.
+        """
+        return (
+            int(self.end / self.reader.audio_time_base)
+            # TODO: What do we do if no duration (?)
+            if self.end is not None else
+            None
+        )
+    @property
+    def duration(
+        self
+    ) -> Union[float, None]:
+        """
+        The duration of the video, which is the
+        difference between 'end' and 'start', or
+        None if the 'end' is unknown.
+        """
+        # The 'end' can be None when it was not
+        # provided and the reader has no duration,
+        # so we cannot subtract in that case
+        return (
+            self.end - self.start
+            if self.end is not None else
+            None
+        )
+    @property
+    def frames(
+        self
+    ):
+        """
+        Iterator to yield all the frames, one by
+        one, within the range defined by the
+        'start' and 'end' parameters provided when
+        instantiating it.
+        This method returns a tuple of 3 elements:
+        - `frame` as the frame instance (it can be
+        a video frame or an audio frame, as both
+        streams are demuxed)
+        - `t` as the frame time moment
+        - `index` as the frame index
+        """
+        yield from iterate_stream_frames_demuxing(
+            container = self.reader.container,
+            video_stream = self.reader.video_stream,
+            audio_stream = self.reader.audio_stream,
+            video_start_pts = self.start_pts,
+            video_end_pts = self.end_pts,
+            audio_start_pts = self.audio_start_pts,
+            audio_end_pts = self.audio_end_pts
+        )
+    def __init__(
+        self,
+        filename: str,
+        start: float = 0.0,
+        end: Union[float, None] = None
+    ):
+        self.filename: str = filename
+        """
+        The filename of the original video.
+        """
+        # TODO: Detect the 'pixel_format' from the
+        # extension (?)
+        self.reader: VideoReader = VideoReader(self.filename)
+        """
+        The pyav video reader.
+        """
+        self.start: float = start
+        """
+        The time moment 't' in which the video
+        should start.
+        """
+        self.end: Union[float, None] = (
+            # TODO: Is this 'end' ok (?)
+            self.reader.duration
+            if end is None else
+            end
+        )
+        """
+        The time moment 't' in which the video
+        should end. When not provided, the duration
+        given by the reader is used.
+        """
+    def save_as(
+        self,
+        filename: str
+    ) -> 'Video':
+        """
+        Write the frames in the range defined by
+        'start' and 'end' to the 'filename' given,
+        using the reader streams as templates for
+        the output streams.
+        The output and the reader container are
+        closed when finished, even if something
+        fails while writing, and the instance is
+        returned.
+        """
+        writer = VideoWriter(filename)
+        try:
+            #writer.set_video_stream(self.reader.video_stream.codec.name, self.reader.fps, self.reader.size, PIXEL_FORMAT)
+            writer.set_video_stream_from_template(self.reader.video_stream)
+            writer.set_audio_stream_from_template(self.reader.audio_stream)
+            # TODO: I need to process the audio also, so
+            # build a method that do the same but for
+            # both streams at the same time
+            for frame, t, index in self.frames:
+                if PythonValidator.is_instance_of(frame, 'VideoFrame'):
+                    print(f'Saving video frame {str(index)}, with t = {str(t)}')
+                    writer.mux_video_frame(
+                        frame = frame
+                    )
+                else:
+                    print(f'Saving audio frame {str(index)} ({str(round(float(t * self.reader.fps), 2))}), with t = {str(t)}')
+                    writer.mux_audio_frame(
+                        frame = frame
+                    )
+            # Passing None is what the original flow
+            # does once all the frames are written;
+            # presumably it flushes the encoders
+            # (TODO confirm)
+            writer.mux_audio_frame(None)
+            writer.mux_video_frame(None)
+        finally:
+            # TODO: Maybe move this to the '__del__' (?)
+            # Close both containers even on failure so
+            # the file handles are not leaked
+            try:
+                writer.output.close()
+            finally:
+                self.reader.container.close()
+        return self

{yta_video_opengl-0.0.6 → yta_video_opengl-0.0.8}/src/yta_video_opengl/writer.py RENAMED Viewed

@@ -1,4 +1,3 @@
-from yta_validation import PythonValidator
 from yta_validation.parameter import ParameterValidator
 from av.stream import Stream
 from av.packet import Packet
@@ -115,9 +114,23 @@ class VideoWriter:
         You can pass the audio stream as it was
         obtained from the reader.
         """
+        self.audio_stream: AudioStream = self.output.add_stream(
+            codec_name = template.codec_context.name,
+            rate = template.codec_context.rate
+        )
+        self.audio_stream.codec_context.format = template.codec_context.format
+        self.audio_stream.codec_context.layout = template.codec_context.layout
+        self.audio_stream.time_base = Fraction(1, template.codec_context.rate)
+        return self
+        # This below is not working
         self.audio_stream: AudioStream = self.output.add_stream_from_template(
             template
         )
+        # TODO: Is this actually needed (?)
+        # Force this 'rate'
+        self.audio_stream.time_base = Fraction(1, template.codec_context.rate)
         return self

yta_video_opengl-0.0.6/src/yta_video_opengl/utils.py DELETED Viewed

@@ -1,24 +0,0 @@
-from yta_validation import PythonValidator
-from typing import Union
-import numpy as np
-import moderngl
-def frame_to_texture(
-    frame: Union['VideoFrame', 'np.ndarray'],
-    context: moderngl.Context,
-    numpy_format: str = 'rgb24'
-):
-    """
-    Build an opengl texture, in the 'context'
-    given, from the 'frame' provided, which can
-    be a VideoFrame or a numpy array.
-    """
-    # A VideoFrame is turned into a numpy array
-    # first, using the 'numpy_format' given
-    pixels = (
-        frame.to_ndarray(format = numpy_format)
-        if PythonValidator.is_instance_of(frame, 'VideoFrame') else
-        frame
-    )
-    # Rows are flipped vertically for opengl
-    pixels = np.flipud(pixels)
-    height, width = pixels.shape[0], pixels.shape[1]
-    return context.texture((width, height), 3, pixels.tobytes())

{yta_video_opengl-0.0.6 → yta_video_opengl-0.0.8}/LICENSE RENAMED Viewed

File without changes

{yta_video_opengl-0.0.6 → yta_video_opengl-0.0.8}/README.md RENAMED Viewed

File without changes

{yta_video_opengl-0.0.6 → yta_video_opengl-0.0.8}/src/yta_video_opengl/__init__.py RENAMED Viewed

File without changes

{yta_video_opengl-0.0.6 → yta_video_opengl-0.0.8}/src/yta_video_opengl/reader/cache.py RENAMED Viewed

File without changes

yta-video-opengl 0.0.6__tar.gz → 0.0.8__tar.gz

yta-video-opengl 0.0.6__tar.gz → 0.0.8__tar.gz