io4it 0.0.0.12.10__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- io4it-0.0.0.12.10-py3.11-nspkg.pth +1 -0
- io4it-0.0.0.12.10.dist-info/License.txt +6 -0
- io4it-0.0.0.12.10.dist-info/METADATA +23 -0
- io4it-0.0.0.12.10.dist-info/RECORD +30 -0
- io4it-0.0.0.12.10.dist-info/WHEEL +5 -0
- io4it-0.0.0.12.10.dist-info/entry_points.txt +2 -0
- io4it-0.0.0.12.10.dist-info/namespace_packages.txt +1 -0
- io4it-0.0.0.12.10.dist-info/top_level.txt +1 -0
- orangecontrib/IO4IT/__init__.py +0 -0
- orangecontrib/IO4IT/ocr_function/__init__.py +0 -0
- orangecontrib/IO4IT/ocr_function/word_converter.py +327 -0
- orangecontrib/IO4IT/widgets/OWMarkdownizer.py +202 -0
- orangecontrib/IO4IT/widgets/OWPathPropagator.py +123 -0
- orangecontrib/IO4IT/widgets/OWS3Uploader.py +92 -0
- orangecontrib/IO4IT/widgets/OWS3downloader.py +94 -0
- orangecontrib/IO4IT/widgets/OWS3list.py +107 -0
- orangecontrib/IO4IT/widgets/OWSpeechToText.py +362 -0
- orangecontrib/IO4IT/widgets/OWwordpdf2docx.py +129 -0
- orangecontrib/IO4IT/widgets/__init__.py +19 -0
- orangecontrib/IO4IT/widgets/designer/ow_in_or_out_path.ui +85 -0
- orangecontrib/IO4IT/widgets/designer/owspeechtotext.ui +104 -0
- orangecontrib/IO4IT/widgets/designer/wordpdf2docx.ui +57 -0
- orangecontrib/IO4IT/widgets/icons/category.svg +50 -0
- orangecontrib/IO4IT/widgets/icons/download.png +0 -0
- orangecontrib/IO4IT/widgets/icons/in_or_out.png +0 -0
- orangecontrib/IO4IT/widgets/icons/list_aws.png +0 -0
- orangecontrib/IO4IT/widgets/icons/md.png +0 -0
- orangecontrib/IO4IT/widgets/icons/speech_to_text.png +0 -0
- orangecontrib/IO4IT/widgets/icons/upload.png +0 -0
- orangecontrib/IO4IT/widgets/icons/wordpdf2docx.png +0 -0
|
@@ -0,0 +1,362 @@
|
|
|
1
|
+
import datetime
|
|
2
|
+
import ntpath
|
|
3
|
+
import os
|
|
4
|
+
import wave
|
|
5
|
+
import tempfile
|
|
6
|
+
import shutil
|
|
7
|
+
import os
|
|
8
|
+
from PyQt5.QtCore import QThread, pyqtSignal
|
|
9
|
+
from PyQt5.QtWidgets import QApplication, QTextEdit, QPushButton, QSpinBox
|
|
10
|
+
from pyannote.audio import Audio
|
|
11
|
+
from pyannote.core import Segment
|
|
12
|
+
|
|
13
|
+
import numpy as np
|
|
14
|
+
import torch
|
|
15
|
+
import whisper
|
|
16
|
+
from Orange.data import Table, Domain, StringVariable
|
|
17
|
+
from Orange.widgets import widget
|
|
18
|
+
from Orange.widgets.utils.signals import Output
|
|
19
|
+
from sklearn.cluster import KMeans
|
|
20
|
+
from speechbrain.inference.speaker import EncoderClassifier
|
|
21
|
+
|
|
22
|
+
if "site-packages/Orange/widgets" in os.path.dirname(os.path.abspath(__file__)).replace("\\", "/"):
|
|
23
|
+
from orangecontrib.AAIT.utils.import_uic import uic
|
|
24
|
+
from orangecontrib.AAIT.utils import SimpleDialogQt
|
|
25
|
+
from orangecontrib.AAIT.utils.MetManagement import get_local_store_path, GetFromRemote
|
|
26
|
+
else:
|
|
27
|
+
from orangecontrib.AAIT.utils.import_uic import uic
|
|
28
|
+
from orangecontrib.AAIT.utils import SimpleDialogQt
|
|
29
|
+
from orangecontrib.AAIT.utils.MetManagement import get_local_store_path, GetFromRemote
|
|
30
|
+
|
|
31
|
+
import subprocess
|
|
32
|
+
|
|
33
|
+
def convert_audio_to_pcm(file_path, ffmpeg_path):
    """Convert an audio file (.mp3 or .wav) to 16 kHz mono 16-bit PCM WAV via ffmpeg.

    Parameters
    ----------
    file_path : str
        Path to the source audio file. Only .mp3 and .wav are supported.
    ffmpeg_path : str
        Path to the ffmpeg executable to invoke.

    Returns
    -------
    str or None
        Path of the converted "<name>_pcm.wav" file, or None on any failure
        (unsupported extension, ffmpeg error, missing output, or exception).
    """
    try:
        import subprocess

        # Split once so we can both validate the extension and build the
        # output path safely.
        root, ext = os.path.splitext(file_path)
        ext = ext.lower()
        if ext not in [".mp3", ".wav"]:
            print(f"[ERREUR] Type de fichier non supporté : {ext}")
            return None

        # BUGFIX: the previous str.replace(ext, "_pcm.wav") rewrote every
        # occurrence of the extension substring in the path and, for
        # upper-case extensions (e.g. "FOO.MP3"), matched nothing at all —
        # leaving the output path equal to the input path, which ffmpeg -y
        # would then overwrite. Replacing only the final suffix is safe.
        pcm_wav_path = root + "_pcm.wav"

        ffmpeg_cmd = [
            ffmpeg_path, "-y",        # -y: overwrite output without prompting
            "-i", file_path,
            "-acodec", "pcm_s16le",   # 16-bit signed little-endian PCM
            "-ar", "16000",           # 16 kHz sample rate (Whisper's native rate)
            "-ac", "1",               # mono
            pcm_wav_path
        ]

        print(f"[INFO] Lancement de ffmpeg : {' '.join(ffmpeg_cmd)}")
        result = subprocess.run(ffmpeg_cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)

        if result.returncode != 0:
            print(f"[ERREUR] ffmpeg a échoué avec le code {result.returncode}")
            print("[STDERR]", result.stderr)
            return None

        if os.path.exists(pcm_wav_path):
            print(f"[INFO] Fichier converti : {pcm_wav_path}")
            return pcm_wav_path
        else:
            print("[ERREUR] Le fichier converti n’a pas été trouvé.")
            return None

    except Exception as e:
        print("❌ Exception pendant la conversion audio :", e)
        return None
|
|
71
|
+
|
|
72
|
+
|
|
73
|
+
def get_wav_duration(wav_path):
    """Return the duration of *wav_path* in seconds, or None if it cannot be read."""
    try:
        with wave.open(wav_path, "rb") as handle:
            return handle.getnframes() / float(handle.getframerate())
    except Exception as err:
        # Report the problem; callers test the result against None.
        print("An error occurred when getting the wav duration : ", err)
        return
|
|
83
|
+
|
|
84
|
+
|
|
85
|
+
class TranscriptionThread(QThread):
    """Background thread: Whisper transcription + speaker diarization.

    Transcribes ``file_path`` with the given Whisper ``model``, embeds each
    segment with ``embedding_model`` (speechbrain EncoderClassifier), clusters
    the embeddings into ``num_speakers`` groups with KMeans, and emits
    ``result_signal(text, table_rows, minutes_elapsed)``.
    """

    # (full transcription string, list of [speaker, timestamp, text] rows,
    #  transcription time in minutes)
    result_signal = pyqtSignal(str, list, float)

    def __init__(self, file_path, model, embedding_model, audio_helper, num_speakers=2):
        super().__init__()
        self.file_path = file_path                  # path to a PCM WAV file
        self.model = model                          # loaded Whisper model
        self.embedding_model = embedding_model      # speaker-embedding model
        self.audio_helper = audio_helper            # pyannote.audio.Audio, used to crop segments
        self.num_speakers = num_speakers            # target number of speakers for clustering

    def run(self):
        """Entry point executed in the worker thread; always emits or logs."""
        try:
            print("[THREAD] Démarrage du thread de transcription")
            print(f"[THREAD] Fichier à traiter : {self.file_path}")

            if not os.path.exists(self.file_path):
                print(f"[ERREUR] Le fichier n'existe pas : {self.file_path}")
                self.result_signal.emit("Erreur : fichier introuvable.", [], 0.0)
                return

            file_duration = get_wav_duration(self.file_path)
            print(f"[INFO] Durée du fichier : {file_duration:.2f} sec" if file_duration else "[ERREUR] Durée inconnue")

            if file_duration is None:
                self.result_signal.emit("Error: File duration unknown.", [], 0.0)
                return

            print("[INFO] Début de la transcription avec Whisper")
            start_time = datetime.datetime.now()

            result = self.model.transcribe(
                self.file_path,
                language="fr",
                without_timestamps=False,
                temperature=0
            )

            # Elapsed time in minutes, reported to the UI with the result.
            transcription_time = (datetime.datetime.now() - start_time).total_seconds() / 60
            print(f"[INFO] Transcription terminée en {transcription_time:.2f} min")

            if not result or "segments" not in result or not result["segments"]:
                print("[ERREUR] Aucun segment détecté")
                self.result_signal.emit("Error: No speech detected.", [], transcription_time)
                return

            segments = result["segments"]
            print(f"[INFO] Nombre de segments détectés : {len(segments)}")

            # One embedding row per segment; allocated lazily once the
            # embedding dimension is known. NOTE(review): segments skipped
            # below keep their all-zero row, which still participates in the
            # clustering — confirm this is acceptable.
            embeddings = None

            for i, segment in enumerate(segments):
                start, end = segment["start"], segment["end"]

                # Whisper can emit timestamps slightly past the file's end.
                if end > file_duration:
                    print(f"[AVERTISSEMENT] Segment {i} ignoré (fin hors durée)")
                    continue

                try:
                    waveform, _ = self.audio_helper.crop(self.file_path, Segment(start, end))
                    if waveform.ndim == 1:
                        # encode_batch expects a (batch, samples) tensor.
                        waveform = waveform.unsqueeze(0)
                    with torch.no_grad():
                        embedding = self.embedding_model.encode_batch(waveform).squeeze().cpu().numpy()
                    if embeddings is None:
                        embeddings = np.zeros((len(segments), embedding.shape[0]))
                    embeddings[i] = embedding
                except Exception as crop_err:
                    print(f"[ERREUR] Erreur lors du crop ou de l'embedding pour le segment {i} : {crop_err}")
                    continue

            print("[INFO] Clustering des embeddings avec KMeans")
            # Never request more clusters than there are segments.
            clustering = KMeans(n_clusters=min(self.num_speakers, len(segments)), random_state=42).fit(embeddings)
            labels = clustering.labels_

            speaker_map = {}            # cluster label -> "SPEAKER n" display name
            merged_segments = []        # formatted "SPEAKER n hh:mm:ss: text" lines
            current_speaker = None
            current_text = ""
            current_start = None
            table_output = []           # [speaker, timestamp, text] rows for the Table output

            print("[INFO] Regroupement par locuteur")
            # Merge consecutive segments spoken by the same speaker into one run.
            for i, segment in enumerate(segments):
                speaker_id = labels[i]
                if speaker_id not in speaker_map:
                    speaker_map[speaker_id] = f"SPEAKER {len(speaker_map) + 1}"
                speaker = speaker_map[speaker_id]

                if current_speaker == speaker:
                    current_text += f" {segment['text']}"
                else:
                    if current_speaker is not None:
                        timestamp = str(datetime.timedelta(seconds=round(current_start)))
                        merged_segments.append(f"{current_speaker} {timestamp}: {current_text}")
                        table_output.append([current_speaker, timestamp, current_text])
                    current_speaker = speaker
                    current_text = segment["text"]
                    current_start = segment["start"]

            # BUGFIX: the loop above only flushes a run when the speaker
            # changes, so the final speaker's run was silently dropped from
            # both outputs. Flush it here.
            if current_speaker is not None:
                timestamp = str(datetime.timedelta(seconds=round(current_start)))
                merged_segments.append(f"{current_speaker} {timestamp}: {current_text}")
                table_output.append([current_speaker, timestamp, current_text])

            print("[INFO] Finalisation des résultats")
            speaker_text_output = "\n".join(merged_segments)
            self.result_signal.emit(speaker_text_output, table_output, transcription_time)
            print("[THREAD] Transcription terminée et signal émis")

        except Exception as e:
            # Catch-all: log with traceback but never let the thread raise.
            # NOTE(review): no signal is emitted on this path, so the UI stays
            # on "Transcription in progress..." — confirm intended.
            print("❌ An error occurred during transcription:", e)
            import traceback
            traceback.print_exc()
            return
|
|
195
|
+
|
|
196
|
+
|
|
197
|
+
class OWSpeech_To_Text(widget.OWWidget):
    """Orange widget: transcribe an audio file to text with speaker labels.

    Lets the user pick a .wav/.mp3 file, converts it to PCM WAV with a
    locally stored ffmpeg, then runs a TranscriptionThread (Whisper +
    speaker clustering) and sends the result on two Table outputs.
    """
    name = "Speech To Text"
    description = "Convert audio to text with speaker recognition"
    priority = 1111
    category = "Advanced Artificial Intelligence Tools"
    icon = "icons/speech_to_text.png"
    # Use the dev icon set when running from inside an Orange install tree.
    if "site-packages/Orange/widgets" in os.path.dirname(os.path.abspath(__file__)).replace("\\", "/"):
        icon = "icons_dev/speech_to_text.png"
    # Path to the Qt Designer .ui file describing the widget layout.
    gui = os.path.join(os.path.dirname(os.path.abspath(__file__)), "designer/owspeechtotext.ui")

    class Outputs:
        # Per-speaker rows: Speaker / Timestamp / Transcription.
        data = Output("Data", Table)
        # One row: file name / full transcription / elapsed minutes.
        global_transcription = Output("Global Transcription", Table)

    def __init__(self):
        super().__init__()
        self.file_path = ""
        self.num_speakers = 4  # spin box defaults to 4

        # Models are resolved under the local AAIT store directory.
        self.local_store_path = get_local_store_path()
        model_name = "large-v3-turbo.pt"
        self.embedding_model_name = "spkrec-ecapa-voxceleb"
        self.model_path = os.path.join(self.local_store_path, "Models", "S2T", model_name)
        self.embedding_model_path = os.path.join(self.local_store_path, "Models", "S2T", self.embedding_model_name)

        self.ffmpeg_path = os.path.join(self.local_store_path, "Models", "S2T", "ffmpeg", "bin", "ffmpeg.exe")
        # Extract the directory that contains ffmpeg.exe.
        ffmpeg_bin_dir = os.path.dirname(self.ffmpeg_path)

        # Add ffmpeg to PATH so whisper/ffmpeg-python can find it.
        if ffmpeg_bin_dir not in os.environ["PATH"]:
            os.environ["PATH"] = ffmpeg_bin_dir + os.pathsep + os.environ["PATH"]
            print(f"[INFO] Dossier ffmpeg ajouté au PATH Python : {ffmpeg_bin_dir}")


        # Offer to download the Whisper model if missing; a non-zero return
        # from GetFromRemote is treated as failure and aborts initialization.
        if not os.path.exists(self.model_path):
            if not SimpleDialogQt.BoxYesNo("Whisper turbo Transcription Model isn't in your computer. Do you want to download it from AAIT store?"):
                return
            try:
                if 0 != GetFromRemote("Whisper turbo"):
                    return
            except Exception as e:
                print(e)
                SimpleDialogQt.BoxError("Unable to get the Whisper turbo.")
                return

        # Same download-on-demand flow for the speaker-embedding model.
        if not os.path.exists(self.embedding_model_path):
            if not SimpleDialogQt.BoxYesNo("Voxceleb Embedding Model isn't in your computer. Do you want to download it from AAIT store?"):
                return
            try:
                if 0 != GetFromRemote("Voxceleb"):
                    return
            except Exception as e:
                print(e)
                SimpleDialogQt.BoxError("Unable to get the Voxceleb.")
                return
        # And for the bundled ffmpeg binary.
        if not os.path.exists(self.ffmpeg_path):
            if not SimpleDialogQt.BoxYesNo("FFMPEG isn't in your computer. Do you want to download it from AAIT store?"):
                return
            try:
                if 0 != GetFromRemote("FFMPEG"):
                    return
            except Exception as e:
                print(e)
                SimpleDialogQt.BoxError("Unable to get the ffmpeg.")
                return

        # Load the transcription model and report the CUDA environment.
        self.model = whisper.load_model(self.model_path)
        print("Version of PyTorch :", torch.__version__)
        print("Used cuda version :", torch.version.cuda)
        print("CUDA available ? :", torch.cuda.is_available())
        if torch.cuda.is_available():
            print("Number of GPU :", torch.cuda.device_count())
            print("GPU's name :", torch.cuda.get_device_name(0))
        # Embedding model definition (hard-coded for now).

        self.embedding_model = EncoderClassifier.from_hparams(source=self.embedding_model_path)
        self.audio_helper = Audio()
        uic.loadUi(self.gui, self)

        # Wire up the widgets declared in the .ui file.
        self.file_button = self.findChild(QPushButton,
                                          'fileButton')
        self.file_button.clicked.connect(self.select_file)
        self.process_button = self.findChild(QPushButton,
                                             'processButton')
        self.process_button.clicked.connect(self.process_recording)
        self.text_area = self.findChild(QTextEdit, 'textArea')

        self.spinBox_nb_people=self.findChild(QSpinBox,'spinBox_nb_people')
        self.spinBox_nb_people.setValue(int(self.num_speakers))
        self.spinBox_nb_people.valueChanged.connect(self.spinbox_value_changed)
        # Disabled until a file has been selected and converted successfully.
        self.process_button.setEnabled(False)

    def spinbox_value_changed(self, value):
        """Keep the speaker count in sync with the spin box."""
        self.num_speakers = value

    def select_file(self):
        """Ask for a .wav/.mp3 file, copy it to a safe temp path, convert to PCM."""
        file_path = SimpleDialogQt.BoxSelectExistingFile(self, extention="Audio files (*.wav *.mp3)")

        if file_path:
            # Copy to a path without accents or special characters
            # (ffmpeg/whisper can choke on non-ASCII paths).
            temp_dir = tempfile.gettempdir()
            base_ext = os.path.splitext(file_path)[1]
            clean_copy = os.path.join(temp_dir, "input_audio" + base_ext)
            shutil.copy(file_path, clean_copy)
            print(f"[INFO] Copie vers fichier temporaire sans accents : {clean_copy}")

            # Convert inside that temporary directory.
            pcm_path = convert_audio_to_pcm(clean_copy, self.ffmpeg_path)
            print(f"[DEBUG] pcm_path: {pcm_path}")

            if pcm_path:
                self.file_path = pcm_path
                self.temp_pcm_path = pcm_path
                self.process_button.setEnabled(True)
            else:
                SimpleDialogQt.BoxError("Erreur : La conversion audio a échoué.")
        else:
            print("[ERREUR] Aucun fichier sélectionné.")


    def process_recording(self):
        """Launch the transcription thread on the previously converted file."""
        self.process_button.setEnabled(False)
        if not self.file_path:
            SimpleDialogQt.BoxError(
                "Aucun fichier sélectionné. Veuillez choisir un fichier audio avant de lancer la transcription.")
            return
        self.num_speakers = self.spinBox_nb_people.value()
        self.text_area.setText("Transcription in progress...")
        self.thread = TranscriptionThread(
            self.file_path, self.model, self.embedding_model, self.audio_helper, self.num_speakers
        )
        self.thread.result_signal.connect(self.display_text)
        self.thread.start()
        self.progressBarInit()  # start the progress bar

    def display_text(self, text, table_output, transcription_time):
        """Receive the thread's result, show it, and send both Table outputs."""
        self.text_area.setText(f"{text}\n\n⏳ Temps de transcription: {transcription_time:.2f} minutes")

        # Output 1: one row per speaker run (all columns are string metas).
        domain = Domain([],
                        metas=[StringVariable("Speaker"), StringVariable("Timestamp"), StringVariable("Transcription")])
        metas = [[row[0], row[1], row[2]] for row in table_output] if table_output else [["", "", ""]]
        out_data = Table(domain, [[] for _ in metas])
        for i, meta in enumerate(metas):
            out_data.metas[i] = meta
        self.Outputs.data.send(out_data)

        # Output 2: a single row with the file name, full text and timing.
        global_domain = Domain([],
                               metas=[StringVariable("Nom du fichier"),
                                      StringVariable("Transcription"),
                                      StringVariable("Temps de transcription (min)")])
        filename = ntpath.basename(self.file_path)  # keep only the file name
        global_metas = [[filename, text, f"{transcription_time:.2f}"]]
        global_table = Table(global_domain, [[]])
        global_table.metas[0] = global_metas[0]
        self.Outputs.global_transcription.send(global_table)
        self.progressBarFinished()
|
|
356
|
+
|
|
357
|
+
if __name__ == "__main__":
    # Standalone launch for manual testing outside of the Orange canvas.
    import sys
    app = QApplication(sys.argv)
    window = OWSpeech_To_Text()
    window.show()
    sys.exit(app.exec_())
|
|
@@ -0,0 +1,129 @@
|
|
|
1
|
+
import os
|
|
2
|
+
import sys
|
|
3
|
+
|
|
4
|
+
import Orange.data
|
|
5
|
+
from AnyQt.QtWidgets import QApplication,QCheckBox
|
|
6
|
+
|
|
7
|
+
from Orange.widgets import widget
|
|
8
|
+
from Orange.widgets.utils.signals import Input, Output
|
|
9
|
+
|
|
10
|
+
|
|
11
|
+
if "site-packages/Orange/widgets" in os.path.dirname(os.path.abspath(__file__)).replace("\\", "/"):
|
|
12
|
+
from Orange.widgets.orangecontrib.AAIT.utils import thread_management
|
|
13
|
+
from Orange.widgets.orangecontrib.AAIT.utils.import_uic import uic
|
|
14
|
+
from Orange.widgets.orangecontrib.IO4IT.ocr_function import word_converter
|
|
15
|
+
else:
|
|
16
|
+
from orangecontrib.AAIT.utils import thread_management
|
|
17
|
+
from orangecontrib.AAIT.utils.import_uic import uic
|
|
18
|
+
from orangecontrib.IO4IT.ocr_function import word_converter
|
|
19
|
+
|
|
20
|
+
class OWwordpdf2docx(widget.OWWidget):
    """Orange widget: batch-convert PDFs in a directory to .docx via Word.

    Expects the input Table to carry string columns "input_dir" and
    "output_dir"; delegates the actual conversion to
    word_converter.convert_pdf_structure on a worker thread.
    """
    name = "WordPdf2Docx"
    description = "Convert pdf from a directory to docx using word"
    icon = "icons/wordpdf2docx.png"
    # Use the dev icon set when running from inside an Orange install tree.
    if "site-packages/Orange/widgets" in os.path.dirname(os.path.abspath(__file__)).replace("\\", "/"):
        icon = "icons_dev/wordpdf2docx.png"
    # Path to the Qt Designer .ui file describing the widget layout.
    gui = os.path.join(os.path.dirname(os.path.abspath(__file__)), "designer/wordpdf2docx.ui")
    want_control_area = False
    priority = 3000

    class Inputs:
        data = Input("Data", Orange.data.Table)

    class Outputs:
        data = Output("Data", Orange.data.Table)

    @Inputs.data
    def set_data(self, in_data):
        """Store the incoming table and run immediately when autorun is set."""
        self.data = in_data
        if self.autorun:
            self.run()


    def __init__(self):
        super().__init__()
        # Qt Management
        self.setFixedWidth(470)
        self.setFixedHeight(300)
        uic.loadUi(self.gui, self)
        # Checkbox controlling whether existing .docx outputs are skipped.
        self.check_box= self.findChild(QCheckBox, 'checkBox')
        # Data Management
        self.data = None
        self.thread = None
        self.autorun = True
        self.result = None
        self.post_initialized()

    def run(self):
        """Validate the input table and start the conversion thread."""
        self.error("")
        # if thread is running quit
        if self.thread is not None:
            self.thread.safe_quit()

        if self.data is None:
            return


        # Verification of in_data: both columns must exist and be text.
        self.error("")
        try:
            self.data.domain["input_dir"]
        except KeyError:
            self.error('You need a "input_dir" column in input data')
            return

        if type(self.data.domain["input_dir"]).__name__ != 'StringVariable':
            self.error('"input_dir" column needs to be a Text')
            return
        try:
            self.data.domain["output_dir"]
        except KeyError:
            self.error('You need a "output_dir" column in input data')
            return

        if type(self.data.domain["output_dir"]).__name__ != 'StringVariable':
            self.error('"output_dir" column needs to be a Text')
            return
        input_dir = self.data.get_column("input_dir")
        output_dir = self.data.get_column("output_dir")

        # Start progress bar
        self.progressBarInit()
        # Connect and start thread : main function, progress, result and finish
        # --> progress is used in the main function to track progress (with a callback)
        # --> result is used to collect the result from main function
        # --> finish is just an empty signal to indicate that the thread is finished
        ignore_existing_docx=False
        if self.check_box.isChecked():
            ignore_existing_docx=True
        # NOTE: keyword spelled "ignore_exsting_out_put" [sic] — must match
        # the parameter name declared by word_converter.convert_pdf_structure.
        self.thread = thread_management.Thread(word_converter.convert_pdf_structure, input_dir, output_dir,ignore_exsting_out_put=ignore_existing_docx)
        self.thread.progress.connect(self.handle_progress)
        self.thread.result.connect(self.handle_result)
        self.thread.finish.connect(self.handle_finish)
        self.thread.start()

    def handle_progress(self, value: float) -> None:
        """Forward the worker's progress callback to the Orange progress bar."""
        self.progressBarSet(value)

    def handle_result(self, result):
        """Forward the worker's result and re-emit the input table.

        NOTE(review): self.error(result) displays the worker's result string
        as the widget error — presumably an empty string on success clears
        it; confirm against thread_management.Thread's result semantics.
        """
        try:
            self.result = result
            self.error(result)
            self.Outputs.data.send(self.data)
        except Exception as e:
            print("An error occurred when sending out_data:", e)
            self.Outputs.data.send(None)
            return

    def handle_finish(self):
        """Called when the worker thread finishes; close the progress bar."""
        print("conversion finished")
        self.progressBarFinished()

    def post_initialized(self):
        # Hook for subclasses; intentionally a no-op here.
        pass
|
|
124
|
+
|
|
125
|
+
if __name__ == "__main__":
    # Standalone launch for manual testing outside of the Orange canvas.
    app = QApplication(sys.argv)
    my_widget = OWwordpdf2docx()
    my_widget.show()
    app.exec_()
|
|
@@ -0,0 +1,19 @@
|
|
|
1
|
+
"""
|
|
2
|
+
Widgets from Development workflow category
|
|
3
|
+
|
|
4
|
+
"""
|
|
5
|
+
# ID = "orangecontrib.AAIT"
|
|
6
|
+
|
|
7
|
+
NAME = "Advanced Artificial Intelligence Tools"
|
|
8
|
+
|
|
9
|
+
# Category icon show in the menu
|
|
10
|
+
ICON = "icons/category.svg"
|
|
11
|
+
|
|
12
|
+
BACKGROUND = "light-green"
|
|
13
|
+
|
|
14
|
+
DESCRIPTION = ("Advanced Artificial Intelligence Tools is a package meant to develop and enable advanced AI "
|
|
15
|
+
"functionalities in Orange Data Mining.")
|
|
16
|
+
|
|
17
|
+
|
|
18
|
+
|
|
19
|
+
# PRIORITY = 6
|
|
@@ -0,0 +1,85 @@
|
|
|
1
|
+
<?xml version="1.0" encoding="UTF-8"?>
|
|
2
|
+
<ui version="4.0">
|
|
3
|
+
<class>Form</class>
|
|
4
|
+
<widget class="QWidget" name="Form">
|
|
5
|
+
<property name="geometry">
|
|
6
|
+
<rect>
|
|
7
|
+
<x>0</x>
|
|
8
|
+
<y>0</y>
|
|
9
|
+
<width>727</width>
|
|
10
|
+
<height>151</height>
|
|
11
|
+
</rect>
|
|
12
|
+
</property>
|
|
13
|
+
<property name="windowTitle">
|
|
14
|
+
<string>Input_dir or Output_dir</string>
|
|
15
|
+
</property>
|
|
16
|
+
<widget class="QLabel" name="Description">
|
|
17
|
+
<property name="geometry">
|
|
18
|
+
<rect>
|
|
19
|
+
<x>40</x>
|
|
20
|
+
<y>10</y>
|
|
21
|
+
<width>641</width>
|
|
22
|
+
<height>41</height>
|
|
23
|
+
</rect>
|
|
24
|
+
</property>
|
|
25
|
+
<property name="sizePolicy">
|
|
26
|
+
<sizepolicy hsizetype="Maximum" vsizetype="Expanding">
|
|
27
|
+
<horstretch>0</horstretch>
|
|
28
|
+
<verstretch>0</verstretch>
|
|
29
|
+
</sizepolicy>
|
|
30
|
+
</property>
|
|
31
|
+
<property name="font">
|
|
32
|
+
<font>
|
|
33
|
+
<pointsize>8</pointsize>
|
|
34
|
+
</font>
|
|
35
|
+
</property>
|
|
36
|
+
<property name="text">
|
|
37
|
+
      <string>This widget gets a folder path and propagates it, either as an input or an output path</string>
|
|
38
|
+
</property>
|
|
39
|
+
<property name="wordWrap">
|
|
40
|
+
<bool>true</bool>
|
|
41
|
+
</property>
|
|
42
|
+
</widget>
|
|
43
|
+
<widget class="QPushButton" name="fileButton">
|
|
44
|
+
<property name="geometry">
|
|
45
|
+
<rect>
|
|
46
|
+
<x>60</x>
|
|
47
|
+
<y>70</y>
|
|
48
|
+
<width>291</width>
|
|
49
|
+
<height>51</height>
|
|
50
|
+
</rect>
|
|
51
|
+
</property>
|
|
52
|
+
<property name="text">
|
|
53
|
+
      <string>📂 Select a folder</string>
|
|
54
|
+
</property>
|
|
55
|
+
</widget>
|
|
56
|
+
<widget class="QRadioButton" name="input_dir">
|
|
57
|
+
<property name="geometry">
|
|
58
|
+
<rect>
|
|
59
|
+
<x>470</x>
|
|
60
|
+
<y>60</y>
|
|
61
|
+
<width>131</width>
|
|
62
|
+
<height>31</height>
|
|
63
|
+
</rect>
|
|
64
|
+
</property>
|
|
65
|
+
<property name="text">
|
|
66
|
+
<string>input_dir</string>
|
|
67
|
+
</property>
|
|
68
|
+
</widget>
|
|
69
|
+
<widget class="QRadioButton" name="output_dir">
|
|
70
|
+
<property name="geometry">
|
|
71
|
+
<rect>
|
|
72
|
+
<x>470</x>
|
|
73
|
+
<y>100</y>
|
|
74
|
+
<width>131</width>
|
|
75
|
+
<height>31</height>
|
|
76
|
+
</rect>
|
|
77
|
+
</property>
|
|
78
|
+
<property name="text">
|
|
79
|
+
<string>output_dir</string>
|
|
80
|
+
</property>
|
|
81
|
+
</widget>
|
|
82
|
+
</widget>
|
|
83
|
+
<resources/>
|
|
84
|
+
<connections/>
|
|
85
|
+
</ui>
|