PyPI - cutted - Versions diffs - 0.3.3__py3-none-any.whl → 0.4.0__py3-none-any.whl - Mend

cutted-0.3.3-py3-none-any.whl → cutted-0.4.0-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (10)

cutted/__init__.py +1 -1
cutted/app.py +29 -14
cutted/core/audio_processor.py +22 -0
cutted/core/gemini.py +75 -16
{cutted-0.3.3.dist-info → cutted-0.4.0.dist-info}/METADATA +1 -1
cutted-0.4.0.dist-info/RECORD +12 -0
cutted-0.3.3.dist-info/RECORD +0 -12
{cutted-0.3.3.dist-info → cutted-0.4.0.dist-info}/WHEEL +0 -0
{cutted-0.3.3.dist-info → cutted-0.4.0.dist-info}/licenses/LICENSE +0 -0
{cutted-0.3.3.dist-info → cutted-0.4.0.dist-info}/top_level.txt +0 -0

cutted/__init__.py CHANGED Viewed

@@ -1,2 +1,2 @@
-__version__ = "0.3.3"
+__version__ = "0.4.0"
 __author__ = "simon0302010"

cutted/app.py CHANGED Viewed

@@ -109,45 +109,54 @@ class CuttedApp:
     def update_plot(self):
         if self.canvas:
             self.canvas.get_tk_widget().destroy()
+        if hasattr(self, "slider") and self.slider is not None:
+            self.slider.destroy()
         fig = self.AudioProcessor.plot_audio()
         self.ax = fig.axes[0]
         self.canvas = FigureCanvasTkAgg(fig, master=self.plot_frame)
         self.canvas.draw()
-        self.audio_lenght = int(round(self.AudioProcessor.get_length()))
+        self.audio_length = float(self.AudioProcessor.get_length())
         slider_width = self.root.winfo_width() - 40
+        if self.slider_value > self.audio_length:
+            self.slider_value = self.audio_length
+        if self.slider_value < 0:
+            self.slider_value = 0
         self.slider = customtkinter.CTkSlider(
-            self.root, from_=0, to=self.audio_lenght, command=self.set_cursor, width=slider_width
+            self.root, from_=0, to=self.audio_length, command=self.set_cursor, width=slider_width
         )
-        self.slider.set(0)
+        self.slider.set(self.slider_value)
         self.slider.place(relx=0.5, rely=1.0, anchor="s", y=-130)
+        self.set_cursor(self.slider_value)
         self.canvas.get_tk_widget().pack(
             fill=customtkinter.BOTH,
             expand=True,
             padx=10,
             pady=10,
         )
-        self.cursor_line = self.ax.axvline(x=0, color="red", linewidth=2)
+        self.cursor_line = self.ax.axvline(x=self.slider_value, color="red", linewidth=2)
         self.canvas.draw_idle()
     def set_cursor(self, value):
         now = time.time()
-        if now - self.last_slider_update < 0.1:  # 100ms
+        if now - self.last_slider_update < 0.05:  # 100ms
             return
         self.last_slider_update = now
-        self.slider_value = round(value)
+        self.slider_value = round(value, 2)
         if self.cursor_line:
             self.cursor_line.set_xdata([self.slider_value, self.slider_value])
             self.canvas.draw_idle()
+            self.slider.set(self.slider_value)
+            self.set_cursor(self.slider_value)
-        print(f"Slider Value: {self.slider_value}")
+        print_info(f"Slider Value: {self.slider_value}")
     def play_audio(self):
         if not hasattr(self.AudioProcessor, "audio") or self.AudioProcessor.audio is None:
@@ -200,7 +209,7 @@ class CuttedApp:
         text = self.entry.get()
         if text.strip():
-            full_prompt = f"You are a audio editing AI. You are controllable via natural language and editing a audio file. The audio file is {round(self.AudioProcessor.get_length())}s long. The cursor of the user is currently at {self.slider_value}s."
+            full_prompt = f"You are a audio editing AI. You are controllable via natural language and editing a audio file. The audio file is {round(self.AudioProcessor.get_length(), 2)}s long. The cursor of the user is currently at {self.slider_value}s."
             full_prompt += "\nHere is a the waveform samples of the audio. You can use them to determine silent parts, loud parts, silences, beats and much more.\nYou are forced to used these if the user requires you to cut out silent of quiet parts for example."
             full_prompt += "\nAll of your tools should be enough to fullfill almost every task.\nNEVER ASK FOR CONFIRMATION FROM THE USER. DO EVERYTHING!"
             full_prompt += f"\n{self.AudioProcessor.get_waveform_summary()}\n"
@@ -228,6 +237,12 @@ class CuttedApp:
                     result = self.AudioProcessor.cut(args["start"], args["end"])
                     if not result:
                         messagebox.showerror("Error", "Please try again.")
+                if function_call.name == "change_volume":
+                    print_info("Change Volume function called")
+                    args = function_call.args
+                    result = self.AudioProcessor.change_volume(args["start"], args["end"], args["volume"])
+                    if not result:
+                        messagebox.showerror("Error", "Please try again.")
                 self.update_plot()
             elif text_result:
                 messagebox.showerror("Error", text_result.strip())

cutted/core/audio_processor.py CHANGED Viewed

@@ -112,6 +112,28 @@ class AudioProcessor:
         else:
             return False
+    def change_volume(self, start, end, volume):
+        if len(start) == len(end) == len(volume):
+            time_sets = list(zip(start, end, volume))
+            for single_start, single_end, single_volume in time_sets:
+                if single_end <= single_start:
+                    print_fail("End time must be greater than start time.")
+                    continue
+                print_info(f"Changing volume of {single_start} - {single_end} to {str(single_volume)}")
+                start_ms = round(single_start * 1000)
+                end_ms = round(single_end * 1000)
+                part1 = self.audio[:start_ms]
+                part2 = self.audio[start_ms:end_ms]
+                part3 = self.audio[end_ms:]
+                part2 = part2.apply_gain(ratio_to_db(single_volume))
+                self.audio = part1 + part2 + part3
+            return True
+        else:
+            return False
     def play_audio(self, start_time=0):
         if self.audio is None:
             print_fail("No audio loaded.")

cutted/core/gemini.py CHANGED Viewed

@@ -15,6 +15,7 @@ class GeminiClient:
         self.client = genai.Client(
             api_key=GEMINI_API_KEY,
         )
+        self.contents = []
     def generate(self, prompt: str, model: str = "gemini-2.0-flash", audio_base64 = None):
         parts=[
@@ -27,38 +28,76 @@ class GeminiClient:
                 data=base64.b64decode(audio_base64)
             ))
-        contents = [
+        self.contents.append(
             types.Content(
                 role="user",
                 parts=parts
-            ),
-        ]
+            )
+        )
         tools = [
             types.Tool(
                 function_declarations=[
                     types.FunctionDeclaration(
                         name="cut_audio",
-                        description="Cuts specified parts out of audio. Multiple parts can be cut if a list of both start and end values is used as property.",
+                        description=(
+                            "Remove one or more segments from the audio by specifying start and end times in seconds. "
+                            "You can cut multiple segments at once by providing lists of start and end values. "
+                            "Each segment defined by a start and end pair will be removed from the audio."
+                        ),
+                        parameters=genai.types.Schema(
+                            type=genai.types.Type.OBJECT,
+                            required=["start", "end"],
+                            properties={
+                                "start": genai.types.Schema(
+                                    type=genai.types.Type.ARRAY,
+                                    items=genai.types.Schema(
+                                        type=genai.types.Type.NUMBER,
+                                    ),
+                                ),
+                                "end": genai.types.Schema(
+                                    type=genai.types.Type.ARRAY,
+                                    items=genai.types.Schema(
+                                        type=genai.types.Type.NUMBER,
+                                    ),
+                                ),
+                            },
+                        ),
+                    ),
+                    types.FunctionDeclaration(
+                        name="change_volume",
+                        description=(
+                            "Adjust the volume of specific segments in the audio by specifying lists of start times, end times, "
+                            "and volume factors. Each segment between a start and end time will have its volume changed by the "
+                            "corresponding factor (e.g., 0.5 for half volume, 2.0 for double volume). Multiple segments can be "
+                            "adjusted at once by providing lists of values."
+                        ),
                         parameters=genai.types.Schema(
-                            type = genai.types.Type.OBJECT,
-                            required = ["start", "end"],
-                            properties = {
+                            type=genai.types.Type.OBJECT,
+                            required=["start", "end", "volume"],
+                            properties={
                                 "start": genai.types.Schema(
-                                    type = genai.types.Type.ARRAY,
-                                    items = genai.types.Schema(
-                                        type = genai.types.Type.NUMBER,
+                                    type=genai.types.Type.ARRAY,
+                                    items=genai.types.Schema(
+                                        type=genai.types.Type.NUMBER,
                                     ),
                                 ),
                                 "end": genai.types.Schema(
-                                    type = genai.types.Type.ARRAY,
-                                    items = genai.types.Schema(
-                                        type = genai.types.Type.NUMBER,
+                                    type=genai.types.Type.ARRAY,
+                                    items=genai.types.Schema(
+                                        type=genai.types.Type.NUMBER,
                                     ),
+                                ),
+                                "volume": genai.types.Schema(
+                                    type=genai.types.Type.ARRAY,
+                                    items=genai.types.Schema(
+                                        type=genai.types.Type.NUMBER,
                                     ),
+                                ),
                             },
                         ),
                     ),
-                ])
+                ]
+            )
         ]
         generate_content_config = types.GenerateContentConfig(
             tools=tools,
@@ -67,7 +106,7 @@ class GeminiClient:
         response = self.client.models.generate_content(
             model=model,
-            contents=contents,
+            contents=self.contents,
             config=generate_content_config,
         )
@@ -81,7 +120,27 @@ class GeminiClient:
                     if part.text:
                         text_response = part.text
         except TypeError:
-            return None, None
+            pass
+        model_parts = []
+        if text_response:
+            model_parts.append(
+                types.Part.from_text(text=text_response)
+            )
+        if function_call:
+            model_parts.append(
+                types.Part.from_function_call(
+                    name=function_call.name,
+                    args=function_call.args
+                )
+            )
+        self.contents.append(
+            types.Content(
+                role="model",
+                parts=model_parts
+            )
+        )
         return function_call, text_response

{cutted-0.3.3.dist-info → cutted-0.4.0.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: cutted
-Version: 0.3.3
+Version: 0.4.0
 Summary: AI-powered audio editor controllable via natural language.
 Author-email: simon0302010 <simon0302010@gmail.com>
 License-Expression: GPL-3.0

cutted-0.4.0.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,12 @@
+cutted/__init__.py,sha256=7eWSPFhMOE6u-f5s_QomBlTjCze86s3xKt-v0bLJAAs,49
+cutted/__main__.py,sha256=lYGLgtIZ_vGZIJmWG6ZQoqOdyOJnaWEA4NBn5Rc7Q8E,61
+cutted/app.py,sha256=LyVv3RHiAemtcEgLiZCcyenAD_QliaFIZ08JfCNwxq4,11543
+cutted/core/audio_processor.py,sha256=OBxNAKs67zqIfnJIsSgaMDa0UbB0R0mccyWcgNs5Bk0,7663
+cutted/core/gemini.py,sha256=0ATm5gHZWmu4k_9SZOsOx5XYY7nEer5LOzt1SMfQlIk,5836
+cutted/core/logger.py,sha256=AjqrgW2LV9HdPkPQ8oOmyd9lWzVSIg46r74ILR7mVHo,585
+cutted/core/transcribe.py,sha256=0e7aCva4y6D-gKe1xw5HT9VoFgbvHGgV6utn12r8wXA,986
+cutted-0.4.0.dist-info/licenses/LICENSE,sha256=OXLcl0T2SZ8Pmy2_dmlvKuetivmyPd5m1q-Gyd-zaYY,35149
+cutted-0.4.0.dist-info/METADATA,sha256=wEeg-ive3z6zwUmLvZ_3Lh8W0xhsj12mMgSMASxWdUg,1503
+cutted-0.4.0.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+cutted-0.4.0.dist-info/top_level.txt,sha256=PL6glZvzRyKWCDn5aoYI9uH8HlEA5Qd_XFJowJKARYI,7
+cutted-0.4.0.dist-info/RECORD,,

cutted-0.3.3.dist-info/RECORD DELETED Viewed

@@ -1,12 +0,0 @@
-cutted/__init__.py,sha256=F1mzO6qI2gD6d_DQsjZItLuIfNfa1Te5KwCMThWDQT4,49
-cutted/__main__.py,sha256=lYGLgtIZ_vGZIJmWG6ZQoqOdyOJnaWEA4NBn5Rc7Q8E,61
-cutted/app.py,sha256=HaJ3yu8-WVDGKZmFcTVG4CK8q13eHyUQaIyOWMZWV68,10764
-cutted/core/audio_processor.py,sha256=gKBJ1wpdrX2IozmXDzW7MoFVp9uq0Pb3ezz9R3Ahmnw,6691
-cutted/core/gemini.py,sha256=yHsQXk4tDHcW5qJBuL2LpPvdChimxlmEbu76BvsoeY4,3108
-cutted/core/logger.py,sha256=AjqrgW2LV9HdPkPQ8oOmyd9lWzVSIg46r74ILR7mVHo,585
-cutted/core/transcribe.py,sha256=0e7aCva4y6D-gKe1xw5HT9VoFgbvHGgV6utn12r8wXA,986
-cutted-0.3.3.dist-info/licenses/LICENSE,sha256=OXLcl0T2SZ8Pmy2_dmlvKuetivmyPd5m1q-Gyd-zaYY,35149
-cutted-0.3.3.dist-info/METADATA,sha256=ehEIEm5qz3wVqBY74Itpwooe4SYOFpXISXUMZO7LVh4,1503
-cutted-0.3.3.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-cutted-0.3.3.dist-info/top_level.txt,sha256=PL6glZvzRyKWCDn5aoYI9uH8HlEA5Qd_XFJowJKARYI,7
-cutted-0.3.3.dist-info/RECORD,,

{cutted-0.3.3.dist-info → cutted-0.4.0.dist-info}/WHEEL RENAMED Viewed

File without changes

{cutted-0.3.3.dist-info → cutted-0.4.0.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{cutted-0.3.3.dist-info → cutted-0.4.0.dist-info}/top_level.txt RENAMED Viewed

File without changes

cutted 0.3.3__py3-none-any.whl → 0.4.0__py3-none-any.whl

cutted-0.3.3-py3-none-any.whl → cutted-0.4.0-py3-none-any.whl