PyPI - cutted - Versions diffs - 0.3.2__py3-none-any.whl → 0.3.3__py3-none-any.whl - Mend

cutted 0.3.2__py3-none-any.whl → 0.3.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (9) hide show

cutted/__init__.py +1 -1
cutted/app.py +17 -4
cutted/core/audio_processor.py +34 -8
{cutted-0.3.2.dist-info → cutted-0.3.3.dist-info}/METADATA +1 -1
cutted-0.3.3.dist-info/RECORD +12 -0
cutted-0.3.2.dist-info/RECORD +0 -12
{cutted-0.3.2.dist-info → cutted-0.3.3.dist-info}/WHEEL +0 -0
{cutted-0.3.2.dist-info → cutted-0.3.3.dist-info}/licenses/LICENSE +0 -0
{cutted-0.3.2.dist-info → cutted-0.3.3.dist-info}/top_level.txt +0 -0

cutted/__init__.py CHANGED Viewed

@@ -1,2 +1,2 @@
-__version__ = "0.3.2"
+__version__ = "0.3.3"
 __author__ = "simon0302010"

cutted/app.py CHANGED Viewed

@@ -25,6 +25,8 @@ class CuttedApp:
         self.canvas = None
         self.cursor_line = None
         self.last_slider_update = 0
+        self.slider_value = 0
+        self.playback_start_time = 0
         self.is_playing = False
         self.last_states = []
         self.setup_ui()
@@ -113,7 +115,7 @@ class CuttedApp:
         self.canvas = FigureCanvasTkAgg(fig, master=self.plot_frame)
         self.canvas.draw()
-        self.audio_lenght = int(round(self.AudioProcessor.get_lenght()))
+        self.audio_lenght = int(round(self.AudioProcessor.get_length()))
         slider_width = self.root.winfo_width() - 40
         self.slider = customtkinter.CTkSlider(
@@ -153,11 +155,16 @@ class CuttedApp:
             return
         start_time = self.slider.get() if hasattr(self, 'slider') else 0
+        self.playback_start_time = start_time
         self.AudioProcessor.play_audio(start_time)
     def stop_audio(self):
-        self.AudioProcessor.stop_audio()
+        rel_pos = self.AudioProcessor.stop_audio()
         self.is_playing = False
+        abs_pos = self.playback_start_time + rel_pos
+        self.slider.set(abs_pos)
+        self.set_cursor(abs_pos)
+        print_info(f"Absolute position in audio: {abs_pos:.2f}s")
     def export_audio(self):
         if not hasattr(self.AudioProcessor, "audio") or self.AudioProcessor.audio is None:
@@ -184,6 +191,7 @@ class CuttedApp:
             print_success(f"Audio exported to {save_path}")
     def send_prompt(self):
+        print(self.AudioProcessor.get_waveform_summary())
         self.save_state()
         if not hasattr(self.AudioProcessor, "audio") or self.AudioProcessor.audio is None:
@@ -192,14 +200,18 @@ class CuttedApp:
         text = self.entry.get()
         if text.strip():
-            full_prompt = f"You are a audio editing AI. You are controllable via natural language and editing a audio file. The audio file is {round(self.AudioProcessor.get_lenght())}s long."
+            full_prompt = f"You are a audio editing AI. You are controllable via natural language and editing a audio file. The audio file is {round(self.AudioProcessor.get_length())}s long. The cursor of the user is currently at {self.slider_value}s."
+            full_prompt += "\nHere is a the waveform samples of the audio. You can use them to determine silent parts, loud parts, silences, beats and much more.\nYou are forced to used these if the user requires you to cut out silent of quiet parts for example."
+            full_prompt += "\nAll of your tools should be enough to fullfill almost every task.\nNEVER ASK FOR CONFIRMATION FROM THE USER. DO EVERYTHING!"
+            full_prompt += f"\n{self.AudioProcessor.get_waveform_summary()}\n"
             if whisper_support:
                 if self.use_transcript_checkbox.get():
                     if not self.whisper:
-                        messagebox.showinfo("Info", "Loading Whisper model. This may take a few minutes depending on your internet connection. See the progress in your command line. If this window appears to be frozen, the transcription is running.")
+                        messagebox.showinfo("Info", "Loading Whisper model. This may take a few minutes depending on your internet connection. See the progress in your command line. If this window appears to be frozen, the transcription is running. Press OK to continue.")
                         self.whisper = transcribe.Whisper()
                     transcript = self.whisper.transcribe(self.AudioProcessor.audio_path)
                     full_prompt += f"\nThis is a transcript with per word timestamps of the audio:\n{transcript}"
+                    full_prompt += "\nThe transcript likely has issues. If you need infos about some words they might just be misspelled in the audio."
             full_prompt += f"\n\nUser Prompt: {text}"
             self.entry.delete(0, "end")
@@ -220,6 +232,7 @@ class CuttedApp:
             elif text_result:
                 messagebox.showerror("Error", text_result.strip())
             else:
+                messagebox.showerror("Error", "Gemini returned no data")
                 print_fail("Gemini returned no data")
     def save_state(self):

cutted/core/audio_processor.py CHANGED Viewed

@@ -62,7 +62,21 @@ class AudioProcessor:
         return fig
-    def get_lenght(self):
+    def get_waveform_summary(self):
+        num_samples = round(self.get_length())
+        if self.audio is None:
+            return "No audio loaded."
+        samples = np.array(self.audio.get_array_of_samples())
+        if self.audio.channels == 2:
+            samples = samples.reshape((-1, 2))
+            samples = samples.mean(axis=1)
+        samples = samples / np.max(np.abs(samples))
+        indices = np.linspace(0, len(samples)-1, num_samples).astype(int)
+        summary = samples[indices]
+        return f"Waveform samples (normalized, {num_samples} points):\n" + \
+            " ".join(f"{x:.2f}" for x in summary)
+    def get_length(self):
         self.duration = self.audio.duration_seconds
         self.duration = round(self.duration, 2)
         return self.duration
@@ -70,17 +84,25 @@ class AudioProcessor:
     def cut(self, start, end):
         if len(start) == len(end):
             if len(start) == 1:
-                print_info(f"Cutting from {start[0]} to {end[0]}")
-                start_ms = round(start[0] * 1000)
-                end_ms = round(end[0] * 1000)
+                single_start = max(0, start[0])
+                single_end = max(0, end[0])
+                if single_end <= single_start:
+                    print_fail("End time must be greater than start time.")
+                    return False
+                print_info(f"Cutting from {single_start} to {single_end}")
+                start_ms = round(single_start * 1000)
+                end_ms = round(single_end * 1000)
                 self.audio = self.audio[:start_ms] + self.audio[end_ms:]
                 return True
             else:
                 time_sets = list(zip(start, end))
                 subtract_time = 0
                 for single_start, single_end in time_sets:
-                    single_start = single_start - subtract_time
-                    single_end = single_end - subtract_time
+                    single_start = max(0, single_start - subtract_time)
+                    single_end = max(0, single_end - subtract_time)
+                    if single_end <= single_start:
+                        print_fail("End time must be greater than start time.")
+                        continue
                     print_info(f"Cutting from {single_start} to {single_end}")
                     start_ms = round(single_start * 1000)
                     end_ms = round(single_end * 1000)
@@ -123,11 +145,15 @@ class AudioProcessor:
     def stop_audio(self):
         try:
             if pygame.mixer.get_init():
+                pos_ms = pygame.mixer.music.get_pos()
+                pos_sec = pos_ms / 1000 if pos_ms >= 0 else 0
                 pygame.mixer.music.stop()
                 self.is_playing_var = False
-                print_info("Audio playback stopped")
+                print_info(f"Audio playback stopped at {pos_sec:.2f}s")
+                return pos_sec
         except Exception as e:
             print_warn(f"Error stopping audio: {e}")
+            return 0
     def is_playing(self):
         try:
@@ -142,7 +168,7 @@ class AudioProcessor:
             return None
         return {
-            "duration": self.get_lenght(),
+            "duration": self.get_length(),
             "channels": self.audio.channels,
             "frame_rate": self.audio.frame_rate,
             "sample_width": self.audio.sample_width

{cutted-0.3.2.dist-info → cutted-0.3.3.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: cutted
-Version: 0.3.2
+Version: 0.3.3
 Summary: AI-powered audio editor controllable via natural language.
 Author-email: simon0302010 <simon0302010@gmail.com>
 License-Expression: GPL-3.0

cutted-0.3.3.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,12 @@
+cutted/__init__.py,sha256=F1mzO6qI2gD6d_DQsjZItLuIfNfa1Te5KwCMThWDQT4,49
+cutted/__main__.py,sha256=lYGLgtIZ_vGZIJmWG6ZQoqOdyOJnaWEA4NBn5Rc7Q8E,61
+cutted/app.py,sha256=HaJ3yu8-WVDGKZmFcTVG4CK8q13eHyUQaIyOWMZWV68,10764
+cutted/core/audio_processor.py,sha256=gKBJ1wpdrX2IozmXDzW7MoFVp9uq0Pb3ezz9R3Ahmnw,6691
+cutted/core/gemini.py,sha256=yHsQXk4tDHcW5qJBuL2LpPvdChimxlmEbu76BvsoeY4,3108
+cutted/core/logger.py,sha256=AjqrgW2LV9HdPkPQ8oOmyd9lWzVSIg46r74ILR7mVHo,585
+cutted/core/transcribe.py,sha256=0e7aCva4y6D-gKe1xw5HT9VoFgbvHGgV6utn12r8wXA,986
+cutted-0.3.3.dist-info/licenses/LICENSE,sha256=OXLcl0T2SZ8Pmy2_dmlvKuetivmyPd5m1q-Gyd-zaYY,35149
+cutted-0.3.3.dist-info/METADATA,sha256=ehEIEm5qz3wVqBY74Itpwooe4SYOFpXISXUMZO7LVh4,1503
+cutted-0.3.3.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+cutted-0.3.3.dist-info/top_level.txt,sha256=PL6glZvzRyKWCDn5aoYI9uH8HlEA5Qd_XFJowJKARYI,7
+cutted-0.3.3.dist-info/RECORD,,

cutted-0.3.2.dist-info/RECORD DELETED Viewed

@@ -1,12 +0,0 @@
-cutted/__init__.py,sha256=ttFLenYuOpXQTaR9nB0dF-3zFB_PeksXf9R4r_TB8S8,49
-cutted/__main__.py,sha256=lYGLgtIZ_vGZIJmWG6ZQoqOdyOJnaWEA4NBn5Rc7Q8E,61
-cutted/app.py,sha256=Ay_yVrPt1TQAE3lqmrII88lFoGZb5Mh5cDwediM9ZG8,9592
-cutted/core/audio_processor.py,sha256=JdPeWO_jAIn_uZFeZYQJX3RC0Vy8GClKrX7xGk4pXR4,5426
-cutted/core/gemini.py,sha256=yHsQXk4tDHcW5qJBuL2LpPvdChimxlmEbu76BvsoeY4,3108
-cutted/core/logger.py,sha256=AjqrgW2LV9HdPkPQ8oOmyd9lWzVSIg46r74ILR7mVHo,585
-cutted/core/transcribe.py,sha256=0e7aCva4y6D-gKe1xw5HT9VoFgbvHGgV6utn12r8wXA,986
-cutted-0.3.2.dist-info/licenses/LICENSE,sha256=OXLcl0T2SZ8Pmy2_dmlvKuetivmyPd5m1q-Gyd-zaYY,35149
-cutted-0.3.2.dist-info/METADATA,sha256=MPuSW4_LjNch0PXeFrGtRW1C4CuJ7unNv1ZZhvFHmSM,1503
-cutted-0.3.2.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-cutted-0.3.2.dist-info/top_level.txt,sha256=PL6glZvzRyKWCDn5aoYI9uH8HlEA5Qd_XFJowJKARYI,7
-cutted-0.3.2.dist-info/RECORD,,

{cutted-0.3.2.dist-info → cutted-0.3.3.dist-info}/WHEEL RENAMED Viewed

File without changes

{cutted-0.3.2.dist-info → cutted-0.3.3.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{cutted-0.3.2.dist-info → cutted-0.3.3.dist-info}/top_level.txt RENAMED Viewed

File without changes

cutted 0.3.2__py3-none-any.whl → 0.3.3__py3-none-any.whl

cutted 0.3.2__py3-none-any.whl → 0.3.3__py3-none-any.whl