pygpt-net 2.6.30__py3-none-any.whl → 2.6.32__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (122)
  1. pygpt_net/CHANGELOG.txt +15 -0
  2. pygpt_net/__init__.py +3 -3
  3. pygpt_net/app.py +7 -1
  4. pygpt_net/app_core.py +3 -1
  5. pygpt_net/config.py +3 -1
  6. pygpt_net/controller/__init__.py +9 -2
  7. pygpt_net/controller/audio/audio.py +38 -1
  8. pygpt_net/controller/audio/ui.py +2 -2
  9. pygpt_net/controller/chat/audio.py +1 -8
  10. pygpt_net/controller/chat/common.py +23 -62
  11. pygpt_net/controller/chat/handler/__init__.py +0 -0
  12. pygpt_net/controller/chat/handler/stream_worker.py +1124 -0
  13. pygpt_net/controller/chat/output.py +8 -3
  14. pygpt_net/controller/chat/stream.py +3 -1071
  15. pygpt_net/controller/chat/text.py +3 -2
  16. pygpt_net/controller/kernel/kernel.py +11 -3
  17. pygpt_net/controller/kernel/reply.py +5 -1
  18. pygpt_net/controller/lang/custom.py +2 -2
  19. pygpt_net/controller/media/__init__.py +12 -0
  20. pygpt_net/controller/media/media.py +115 -0
  21. pygpt_net/controller/realtime/__init__.py +12 -0
  22. pygpt_net/controller/realtime/manager.py +53 -0
  23. pygpt_net/controller/realtime/realtime.py +293 -0
  24. pygpt_net/controller/ui/mode.py +23 -2
  25. pygpt_net/controller/ui/ui.py +19 -1
  26. pygpt_net/core/audio/audio.py +6 -1
  27. pygpt_net/core/audio/backend/native/__init__.py +12 -0
  28. pygpt_net/core/audio/backend/{native.py → native/native.py} +426 -127
  29. pygpt_net/core/audio/backend/native/player.py +139 -0
  30. pygpt_net/core/audio/backend/native/realtime.py +250 -0
  31. pygpt_net/core/audio/backend/pyaudio/__init__.py +12 -0
  32. pygpt_net/core/audio/backend/pyaudio/playback.py +194 -0
  33. pygpt_net/core/audio/backend/pyaudio/pyaudio.py +923 -0
  34. pygpt_net/core/audio/backend/pyaudio/realtime.py +312 -0
  35. pygpt_net/core/audio/backend/pygame/__init__.py +12 -0
  36. pygpt_net/core/audio/backend/{pygame.py → pygame/pygame.py} +130 -19
  37. pygpt_net/core/audio/backend/shared/__init__.py +38 -0
  38. pygpt_net/core/audio/backend/shared/conversions.py +211 -0
  39. pygpt_net/core/audio/backend/shared/envelope.py +38 -0
  40. pygpt_net/core/audio/backend/shared/player.py +137 -0
  41. pygpt_net/core/audio/backend/shared/rt.py +52 -0
  42. pygpt_net/core/audio/capture.py +5 -0
  43. pygpt_net/core/audio/output.py +14 -2
  44. pygpt_net/core/audio/whisper.py +6 -2
  45. pygpt_net/core/bridge/bridge.py +2 -1
  46. pygpt_net/core/bridge/worker.py +4 -1
  47. pygpt_net/core/dispatcher/dispatcher.py +37 -1
  48. pygpt_net/core/events/__init__.py +2 -1
  49. pygpt_net/core/events/realtime.py +55 -0
  50. pygpt_net/core/image/image.py +56 -5
  51. pygpt_net/core/realtime/__init__.py +0 -0
  52. pygpt_net/core/realtime/options.py +87 -0
  53. pygpt_net/core/realtime/shared/__init__.py +0 -0
  54. pygpt_net/core/realtime/shared/audio.py +213 -0
  55. pygpt_net/core/realtime/shared/loop.py +64 -0
  56. pygpt_net/core/realtime/shared/session.py +59 -0
  57. pygpt_net/core/realtime/shared/text.py +37 -0
  58. pygpt_net/core/realtime/shared/tools.py +276 -0
  59. pygpt_net/core/realtime/shared/turn.py +38 -0
  60. pygpt_net/core/realtime/shared/types.py +16 -0
  61. pygpt_net/core/realtime/worker.py +160 -0
  62. pygpt_net/core/render/web/body.py +24 -3
  63. pygpt_net/core/text/utils.py +54 -2
  64. pygpt_net/core/types/__init__.py +1 -0
  65. pygpt_net/core/types/image.py +54 -0
  66. pygpt_net/core/video/__init__.py +12 -0
  67. pygpt_net/core/video/video.py +290 -0
  68. pygpt_net/data/config/config.json +26 -5
  69. pygpt_net/data/config/models.json +221 -103
  70. pygpt_net/data/config/settings.json +244 -6
  71. pygpt_net/data/css/web-blocks.css +6 -0
  72. pygpt_net/data/css/web-chatgpt.css +6 -0
  73. pygpt_net/data/css/web-chatgpt_wide.css +6 -0
  74. pygpt_net/data/locale/locale.de.ini +35 -7
  75. pygpt_net/data/locale/locale.en.ini +56 -17
  76. pygpt_net/data/locale/locale.es.ini +35 -7
  77. pygpt_net/data/locale/locale.fr.ini +35 -7
  78. pygpt_net/data/locale/locale.it.ini +35 -7
  79. pygpt_net/data/locale/locale.pl.ini +38 -7
  80. pygpt_net/data/locale/locale.uk.ini +35 -7
  81. pygpt_net/data/locale/locale.zh.ini +31 -3
  82. pygpt_net/data/locale/plugin.audio_input.en.ini +4 -0
  83. pygpt_net/data/locale/plugin.audio_output.en.ini +4 -0
  84. pygpt_net/data/locale/plugin.cmd_web.en.ini +8 -0
  85. pygpt_net/item/model.py +22 -1
  86. pygpt_net/plugin/audio_input/plugin.py +37 -4
  87. pygpt_net/plugin/audio_input/simple.py +57 -8
  88. pygpt_net/plugin/cmd_files/worker.py +3 -0
  89. pygpt_net/provider/api/google/__init__.py +76 -7
  90. pygpt_net/provider/api/google/audio.py +8 -1
  91. pygpt_net/provider/api/google/chat.py +45 -6
  92. pygpt_net/provider/api/google/image.py +226 -86
  93. pygpt_net/provider/api/google/realtime/__init__.py +12 -0
  94. pygpt_net/provider/api/google/realtime/client.py +1945 -0
  95. pygpt_net/provider/api/google/realtime/realtime.py +186 -0
  96. pygpt_net/provider/api/google/video.py +364 -0
  97. pygpt_net/provider/api/openai/__init__.py +22 -2
  98. pygpt_net/provider/api/openai/realtime/__init__.py +12 -0
  99. pygpt_net/provider/api/openai/realtime/client.py +1828 -0
  100. pygpt_net/provider/api/openai/realtime/realtime.py +193 -0
  101. pygpt_net/provider/audio_input/google_genai.py +103 -0
  102. pygpt_net/provider/audio_output/google_genai_tts.py +229 -0
  103. pygpt_net/provider/audio_output/google_tts.py +0 -12
  104. pygpt_net/provider/audio_output/openai_tts.py +8 -5
  105. pygpt_net/provider/core/config/patch.py +241 -178
  106. pygpt_net/provider/core/model/patch.py +28 -2
  107. pygpt_net/provider/llms/google.py +8 -9
  108. pygpt_net/provider/web/duckduck_search.py +212 -0
  109. pygpt_net/ui/layout/toolbox/audio.py +55 -0
  110. pygpt_net/ui/layout/toolbox/footer.py +14 -42
  111. pygpt_net/ui/layout/toolbox/image.py +7 -13
  112. pygpt_net/ui/layout/toolbox/raw.py +52 -0
  113. pygpt_net/ui/layout/toolbox/split.py +48 -0
  114. pygpt_net/ui/layout/toolbox/toolbox.py +8 -8
  115. pygpt_net/ui/layout/toolbox/video.py +49 -0
  116. pygpt_net/ui/widget/option/combo.py +15 -1
  117. {pygpt_net-2.6.30.dist-info → pygpt_net-2.6.32.dist-info}/METADATA +46 -22
  118. {pygpt_net-2.6.30.dist-info → pygpt_net-2.6.32.dist-info}/RECORD +121 -73
  119. pygpt_net/core/audio/backend/pyaudio.py +0 -554
  120. {pygpt_net-2.6.30.dist-info → pygpt_net-2.6.32.dist-info}/LICENSE +0 -0
  121. {pygpt_net-2.6.30.dist-info → pygpt_net-2.6.32.dist-info}/WHEEL +0 -0
  122. {pygpt_net-2.6.30.dist-info → pygpt_net-2.6.32.dist-info}/entry_points.txt +0 -0
@@ -404,4 +404,10 @@ think {{
404
404
  }}
405
405
  .tips.visible {{
406
406
  opacity: 1;
407
+ }}
408
+
409
+ .extra-src-video-box,
410
+ .video-player {{
411
+ max-width: 400px;
412
+ text-align: left;
407
413
  }}
@@ -434,4 +434,10 @@ think {{
434
434
 
435
435
  .name-user {{
436
436
  display: none;
437
+ }}
438
+
439
+ .extra-src-video-box,
440
+ .video-player {{
441
+ max-width: 400px;
442
+ text-align: left;
437
443
  }}
@@ -430,4 +430,10 @@ think {{
430
430
 
431
431
  .name-user {{
432
432
  display: none;
433
+ }}
434
+
435
+ .extra-src-video-box,
436
+ .video-player {{
437
+ max-width: 400px;
438
+ text-align: left;
433
439
  }}
@@ -191,6 +191,7 @@ attachments_uploaded.tab = Hochgeladene Dateien
191
191
  audio.cache.clear.confirm = Sind Sie sicher, dass Sie alle zwischengespeicherten Audiodateien löschen möchten?
192
192
  audio.cache.clear.success = OK. Alle Audio-Cache-Dateien wurden gelöscht.
193
193
  audio.control.btn = Sprachsteuerung
194
+ audio.loop = Schleife
194
195
  audio.magic_word.detected = Zauberwort erkannt!
195
196
  audio.magic_word.invalid = Kein Zauberwort :(
196
197
  audio.magic_word.please = Bitte das Zauberwort...
@@ -845,7 +846,7 @@ mode.agent_openai.tooltip = Fortgeschrittene Agenten (OpenAI)
845
846
  mode.agent.tooltip = Einfache Agenten (legacy)
846
847
  mode.assistant = Assistent
847
848
  mode.assistant.tooltip = Chat mittels Assistants API
848
- mode.audio = Chat mit Audio
849
+ mode.audio = Realtime + audio
849
850
  mode.chat = Chat
850
851
  mode.chat.tooltip = Chatmodus (Standard)
851
852
  mode.completion = Vervollständigung
@@ -854,7 +855,7 @@ mode.computer = Computerbenutzung
854
855
  mode.computer.tooltip = Computerbenutzung (Maus, Tastatur, Navigation)
855
856
  mode.expert = Experten (Kooperation)
856
857
  mode.expert.tooltip = Experten zum Hintergrund rufen
857
- mode.img = Bild
858
+ mode.img = Bild und Video
858
859
  mode.img.tooltip = Bildgenerierung mit DALL-E
859
860
  mode.langchain = Langchain
860
861
  mode.langchain.tooltip = Chat mit Modellen von Langchain
@@ -1127,6 +1128,8 @@ settings.audio.input.stop_interval.desc = Intervall in Sekunden für automatisch
1127
1128
  settings.audio.input.timeout = Aufnahme-Zeitüberschreitung
1128
1129
  settings.audio.input.timeout.continuous = Zeitüberschreitung im Dauerbetrieb aktivieren
1129
1130
  settings.audio.input.timeout.desc = Zeitüberschreitung (Sekunden) für automatische Stop-Aufzeichnung, 0 zum Deaktivieren, Standard: 120
1131
+ settings.audio.input.vad.prefix = VAD-Präfix-Puffer (in ms)
1132
+ settings.audio.input.vad.silence = VAD-Endstille (in ms)
1130
1133
  settings.audio.output.backend = Backend für Audioausgabe
1131
1134
  settings.audio.output.backend.desc = Wählen Sie das Backend für die Audioausgabe.
1132
1135
  settings.audio.output.device = Gerät für Audioausgabe
@@ -1197,9 +1200,10 @@ settings.frequency_penalty = Frequenzstrafe
1197
1200
  settings.func_call.native = Native API-Funktionsaufrufe verwenden
1198
1201
  settings.func_call.native.desc = Wenn aktiviert, benutzt die Anwendung native API-Funktionsaufrufe anstelle des internen pygpt-Formats und der unten stehenden Befehlsprompten. Nur Chat- und Assistenz-Modi.
1199
1202
  settings.img_dialog_open = Bild-Dialog nach Generierung öffnen (Bildmodus)
1200
- settings.img_prompt_model = DALL-E: Modell zur Prompterzeugung
1201
- settings.img_quality = DALL-E: image quality
1202
- settings.img_resolution = DALL-E: Bildgröße
1203
+ settings.img_prompt_model = Modell zur Prompterzeugung
1204
+ settings.img_prompt_model.desc = LLM zur Verfeinerung Ihrer Eingabeaufforderung vor der Bilderzeugung (nicht das Bildmodell)
1205
+ settings.img_quality = Bildqualität
1206
+ settings.img_resolution = Bildgröße
1203
1207
  settings.layout.animation.disable = Animationen deaktivieren
1204
1208
  settings.layout.animation.disable.desc = Deaktiviert Layout-Animationen, wie animierte Ladegeräte usw.
1205
1209
  settings.layout.density = Layoutdichte
@@ -1294,8 +1298,10 @@ settings.prompt.ctx.auto_summary.user = Kontext: Auto-Zusammenfassung (Benutzern
1294
1298
  settings.prompt.ctx.auto_summary.user.desc = Platzhalter: {input}, {output}
1295
1299
  settings.prompt.expert = Experte: Masteraufforderung
1296
1300
  settings.prompt.expert.desc = Anweisung (Systemaufforderung) für den Master-Experten, wie man Sklavenexperten handhabt. Anweisungen für Sklavenexperten werden aus ihren Voreinstellungen gegeben.
1297
- settings.prompt.img = DALL-E: Bildgenerierung
1301
+ settings.prompt.img = Bildgenerierung
1298
1302
  settings.prompt.img.desc = Aufforderung zur Erzeugung von Anweisungen für DALL-E (falls Rohmodus deaktiviert ist). Nur im Bildmodus.
1303
+ settings.prompt.video = Videogenerierung
1304
+ settings.prompt.video.desc = Eingabeaufforderung zur Erzeugung von Eingabeaufforderungen für das Videomodell (wenn der Rohmodus deaktiviert ist). Nur Bild-/Videomodus.
1299
1305
  settings.remote_tools.code_interpreter = Code-Interpreter
1300
1306
  settings.remote_tools.code_interpreter.desc = Aktivieren Sie das `code_interpreter` Remote-Tool im Chat-Modus / über OpenAI Responses API.
1301
1307
  settings.remote_tools.file_search = File search
@@ -1339,7 +1345,9 @@ settings.section.ctx = Kontext
1339
1345
  settings.section.debug = Fehlerbehebung
1340
1346
  settings.section.files = Dateien und Anhänge
1341
1347
  settings.section.general = Allgemein
1342
- settings.section.images = Bilder
1348
+ settings.section.images = Bilder und Videos
1349
+ settings.section.images.image = Bild
1350
+ settings.section.images.video = Video
1343
1351
  settings.section.layout = Layout
1344
1352
  settings.section.llama_index = Indizes / LlamaIndex
1345
1353
  settings.section.llama-index.chat = Chat
@@ -1367,6 +1375,22 @@ settings.upload.data_dir.desc = Włącz, aby przechowywać wszystko w jednym kat
1367
1375
  settings.upload.store = Speichere Anhänge im Arbeitsverzeichnis im Upload-Ordner
1368
1376
  settings.upload.store.desc = Aktiviere das Speichern einer lokalen Kopie hochgeladener Anhänge zur späteren Verwendung
1369
1377
  settings.use_context = Kontext (Erinnerung) verwenden
1378
+ settings.video.aspect_ratio = Seitenverhältnis
1379
+ settings.video.aspect_ratio.desc = Seitenverhältnis des Rahmens (z.B. 16:9, 9:16, 1:1); Verfügbarkeit hängt vom ausgewählten Modell ab
1380
+ settings.video.duration = Videodauer
1381
+ settings.video.duration.desc = Clip-Länge in Sekunden; Grenzen können je nach Modell variieren
1382
+ settings.video.fps = FPS
1383
+ settings.video.fps.desc = Bilder pro Sekunde (z.B. 24, 25, 30); kann vom Modell gerundet oder ignoriert werden
1384
+ settings.video.generate_audio = Audio generieren
1385
+ settings.video.generate_audio.desc = Bei Unterstützung durch das Modell synthetisiertes Hintergrundaudio einschließen
1386
+ settings.video.negative_prompt = Negative Eingabeaufforderung
1387
+ settings.video.negative_prompt.desc = Wörter oder Sätze, die im Ergebnis vermieden werden sollen (durch Kommas getrennt)
1388
+ settings.video.prompt_model = Modell zur Verbesserung von Eingabeaufforderungen
1389
+ settings.video.prompt_model.desc = LLM zur Verfeinerung Ihrer Eingabeaufforderung vor der Videogenerierung (nicht das Videomodell)
1390
+ settings.video.resolution = Videoauflösung
1391
+ settings.video.resolution.desc = Zielausgabeauflösung (z.B. 720p, 1080p); Verfügbarkeit hängt vom Modell ab
1392
+ settings.video.seed = Startwert
1393
+ settings.video.seed.desc = Optionaler Zufallsstartwert für reproduzierbare Ergebnisse; leer lassen für zufällig
1370
1394
  settings.vision.capture.auto = Automatisches Erfassen
1371
1395
  settings.vision.capture.enabled = Kamera
1372
1396
  settings.vision.capture.height = Kamerabildhöhe (px)
@@ -1526,6 +1550,10 @@ updater.check.launch = Beim Start prüfen
1526
1550
  update.released = Build
1527
1551
  update.snap = Zum Snap Store gehen
1528
1552
  update.title = Nach Updates suchen
1553
+ vid.status.downloading = Video wird heruntergeladen... bitte warten...
1554
+ vid.status.generating = Video wird generiert von
1555
+ vid.status.prompt.error = Fehler bei der Verbesserungsaufforderung
1556
+ vid.status.prompt.wait = Vorbereitung der Eingabeaufforderung... bitte warten...
1529
1557
  vision.capture.auto = Automatische Erfassung
1530
1558
  vision.capture.auto.click = Automatisches Erfassen ist aktiviert!
1531
1559
  vision.capture.auto.label = Automatische Erfassung aktiviert
@@ -188,9 +188,11 @@ attachments_uploaded.clear.confirm = WARNING: are you sure you want to delete al
188
188
  attachments_uploaded.delete.confirm = WARNING: are you sure you want to delete this file from the remote server?
189
189
  attachments_uploaded.sync.tip = Tip: click on 'Sync' to retrieve the file list from OpenAI
190
190
  attachments_uploaded.tab = Uploaded
191
+ audio.auto_turn = Auto (VAD)
191
192
  audio.cache.clear.confirm = Are you sure you want to delete all cached audio files?
192
193
  audio.cache.clear.success = OK. All audio cache files cleared.
193
194
  audio.control.btn = Voice control
195
+ audio.loop = Loop
194
196
  audio.magic_word.detected = Magic word detected!
195
197
  audio.magic_word.invalid = Not a magic word :(
196
198
  audio.magic_word.please = Magic word please...
@@ -845,7 +847,7 @@ mode.agent_openai.tooltip = Advanced agents (OpenAI)
845
847
  mode.agent.tooltip = Simple agents (legacy)
846
848
  mode.assistant = Assistants
847
849
  mode.assistant.tooltip = Chat using Assistants API
848
- mode.audio = Chat with Audio
850
+ mode.audio = Realtime + audio
849
851
  mode.chat = Chat
850
852
  mode.chat.tooltip = Chat mode (default)
851
853
  mode.completion = Completion
@@ -854,8 +856,8 @@ mode.computer = Computer use
854
856
  mode.computer.tooltip = Computer use (mouse, keyboard, navigation)
855
857
  mode.expert = Experts (Co-op)
856
858
  mode.expert.tooltip = Experts to call in the background
857
- mode.img = Image
858
- mode.img.tooltip = Image generation using DALL-E
859
+ mode.img = Image and video
860
+ mode.img.tooltip = Image generation
859
861
  mode.langchain = Langchain
860
862
  mode.langchain.tooltip = Chat with models provided by Langchain
861
863
  model.ctx = Context tokens
@@ -1119,7 +1121,15 @@ settings.api_key.voyage.desc = Required for the Voyage API - embeddings for Anth
1119
1121
  settings.api_key.xai = xAI API KEY
1120
1122
  settings.api_key.xai.desc = Required for the xAI API and Grok models.
1121
1123
  settings.api_native_google = Use native API SDK
1124
+ settings.api_native_google.app_credentials = Google Application credentials (path)
1125
+ settings.api_native_google.app_credentials.desc = Absolute path to credentials.json, e.g. /home/user/credentials.json
1126
+ settings.api_native_google.cloud_location = Google Cloud location
1127
+ settings.api_native_google.cloud_location.desc = Provide your Google Cloud project location, default: us-central1
1128
+ settings.api_native_google.cloud_project = Google Cloud project
1129
+ settings.api_native_google.cloud_project.desc = Provide your Google Cloud project name
1122
1130
  settings.api_native_google.desc = Use native GenAI SDK instead of compatible OpenAI client
1131
+ settings.api_native_google.use_vertex = Use VertexAI
1132
+ settings.api_native_google.use_vertex.desc = Enable to use VertexAI in Google GenAI SDK
1123
1133
  settings.api_proxy = Proxy address
1124
1134
  settings.api_proxy.desc = Optional, proxy for OpenAI API, e.g. http://proxy.example.com or socks5://user:pass@host:port
1125
1135
  settings.api_use_responses = Use Responses API in Chat mode
@@ -1147,6 +1157,8 @@ settings.audio.input.stop_interval.desc = Interval in seconds for auto-transcrib
1147
1157
  settings.audio.input.timeout = Recording timeout
1148
1158
  settings.audio.input.timeout.continuous = Enable timeout in continuous mode
1149
1159
  settings.audio.input.timeout.desc = Timeout (seconds) for auto-stop recording, 0 to disable, default: 120
1160
+ settings.audio.input.vad.prefix = VAD prefix padding (in ms)
1161
+ settings.audio.input.vad.silence = VAD end silence (in ms)
1150
1162
  settings.audio.output.backend = Audio Output Backend
1151
1163
  settings.audio.output.backend.desc = Select the audio output backend.
1152
1164
  settings.audio.output.device = Audio Output Device
@@ -1219,9 +1231,10 @@ settings.frequency_penalty = Frequency Penalty
1219
1231
  settings.func_call.native = Use native API function calls
1220
1232
  settings.func_call.native.desc = If enabled, the application will use native API function calls instead of the internal pygpt format and the command prompts from below will not be used. Chat and Assistants modes ONLY.
1221
1233
  settings.img_dialog_open = Open image dialog after generation (Image mode)
1222
- settings.img_prompt_model = DALL-E: prompt generation model
1223
- settings.img_quality = DALL-E: image quality
1224
- settings.img_resolution = DALL-E: image size
1234
+ settings.img_prompt_model = Prompt generation model
1235
+ settings.img_prompt_model.desc = LLM used to refine your prompt before image generation (not the image model)
1236
+ settings.img_quality = Image quality
1237
+ settings.img_resolution = Image size
1225
1238
  settings.layout.animation.disable = Disable animations
1226
1239
  settings.layout.animation.disable.desc = Disables layout animations, like animated loaders, etc.
1227
1240
  settings.layout.density = Layout density
@@ -1318,26 +1331,30 @@ settings.prompt.ctx.auto_summary.user = Context: auto-summary (user message)
1318
1331
  settings.prompt.ctx.auto_summary.user.desc = Placeholders: {input}, {output}
1319
1332
  settings.prompt.expert = Expert: Master prompt
1320
1333
  settings.prompt.expert.desc = Instruction (system prompt) for Master expert on how to handle slave experts. Instructions for slave experts are given from their presets.
1321
- settings.prompt.img = DALL-E: image generation
1322
- settings.prompt.img.desc = Prompt for generating prompts for DALL-E (if raw-mode is disabled). Image mode only.
1334
+ settings.prompt.img = Image generation
1335
+ settings.prompt.img.desc = Prompt for generating prompts for image model (if raw-mode is disabled). Image / Video modes only.
1336
+ settings.prompt.video = Video generation
1337
+ settings.prompt.video.desc = Prompt for generating prompts for video model (if raw-mode is disabled). Image / Video modes only.
1323
1338
  settings.remote_tools.code_interpreter = Code Interpreter
1324
- settings.remote_tools.code_interpreter.desc = Enable `code_interpreter` remote tool in Chat mode / via OpenAI Responses API.
1339
+ settings.remote_tools.code_interpreter.desc = Enable `code_interpreter` remote tool - Responses API only.
1325
1340
  settings.remote_tools.file_search = File search
1326
1341
  settings.remote_tools.file_search.args = File search vector store IDs
1327
1342
  settings.remote_tools.file_search.args.desc = Vector store IDs, separated by comma (,)
1328
- settings.remote_tools.file_search.desc = Enable `file_search` remote tool in Chat mode / via OpenAI Responses API.
1343
+ settings.remote_tools.file_search.desc = Enable `file_search` remote tool - Responses API only.
1329
1344
  settings.remote_tools.google.code_interpreter = Code Interpreter
1330
- settings.remote_tools.google.code_interpreter.desc = Enable Code Interpreter remote tool in Chat mode.
1331
- settings.remote_tools.google.web_search = Google Web Search
1332
- settings.remote_tools.google.web_search.desc = Enable Google Search remote tool in Chat mode.
1345
+ settings.remote_tools.google.code_interpreter.desc = Enable Code Interpreter remote tool.
1346
+ settings.remote_tools.google.url_ctx = URL Context
1347
+ settings.remote_tools.google.url_ctx.desc = Enable URL Context remote tool.
1348
+ settings.remote_tools.google.web_search = Google Search
1349
+ settings.remote_tools.google.web_search.desc = Enable Google Search remote tool.
1333
1350
  settings.remote_tools.image = Image generation
1334
- settings.remote_tools.image.desc = Enable `image_generation` remote tool in Chat mode / via OpenAI Responses API.
1351
+ settings.remote_tools.image.desc = Enable `image_generation` remote tool - Responses API only.
1335
1352
  settings.remote_tools.mcp = Remote MCP
1336
1353
  settings.remote_tools.mcp.args = Remote MCP configuration
1337
1354
  settings.remote_tools.mcp.args.desc = Configuration in JSON format (will be used in request)
1338
- settings.remote_tools.mcp.desc = Enable `mcp` remote tool in Chat mode / via OpenAI Responses API.
1355
+ settings.remote_tools.mcp.desc = Enable `mcp` remote tool - Responses API only.
1339
1356
  settings.remote_tools.web_search = Web Search
1340
- settings.remote_tools.web_search.desc = Enable `web_search` remote tool in Chat mode / via OpenAI Responses API.
1357
+ settings.remote_tools.web_search.desc = Enable `web_search` remote tool - Responses API only.
1341
1358
  settings.render.code_syntax = Code syntax highlight
1342
1359
  settings.render.engine = Rendering engine
1343
1360
  settings.render.open_gl = OpenGL hardware acceleration
@@ -1369,7 +1386,9 @@ settings.section.ctx = Context
1369
1386
  settings.section.debug = Debug
1370
1387
  settings.section.files = Files and attachments
1371
1388
  settings.section.general = General
1372
- settings.section.images = Images
1389
+ settings.section.images = Images and video
1390
+ settings.section.images.image = Image
1391
+ settings.section.images.video = Video
1373
1392
  settings.section.layout = Layout
1374
1393
  settings.section.llama_index = Indexes / LlamaIndex
1375
1394
  settings.section.llama-index.chat = Chat
@@ -1398,6 +1417,22 @@ settings.upload.data_dir.desc = Enable to store everything in a single data dire
1398
1417
  settings.upload.store = Store attachments in the workdir upload directory
1399
1418
  settings.upload.store.desc = Enable to store a local copy of uploaded attachments for future use
1400
1419
  settings.use_context = Use context (memory)
1420
+ settings.video.aspect_ratio = Aspect ratio
1421
+ settings.video.aspect_ratio.desc = Frame aspect ratio (e.g., 16:9, 9:16, 1:1); availability depends on the selected model
1422
+ settings.video.duration = Video duration
1423
+ settings.video.duration.desc = Clip length in seconds; limits may vary by model
1424
+ settings.video.fps = FPS
1425
+ settings.video.fps.desc = Frames per second (e.g., 24, 25, 30); may be rounded or ignored by the model
1426
+ settings.video.generate_audio = Generate audio
1427
+ settings.video.generate_audio.desc = Include synthesized background audio if supported by the model
1428
+ settings.video.negative_prompt = Negative prompt
1429
+ settings.video.negative_prompt.desc = Words or phrases to avoid in the output (comma-separated)
1430
+ settings.video.prompt_model = Prompt enhancement model
1431
+ settings.video.prompt_model.desc = LLM used to refine your prompt before video generation (not the video model)
1432
+ settings.video.resolution = Video resolution
1433
+ settings.video.resolution.desc = Target output resolution (e.g., 720p, 1080p); availability depends on the model
1434
+ settings.video.seed = Seed
1435
+ settings.video.seed.desc = Optional random seed for reproducible results; leave empty for random
1401
1436
  settings.vision.capture.auto = Auto capture
1402
1437
  settings.vision.capture.enabled = Camera
1403
1438
  settings.vision.capture.height = Camera height (px)
@@ -1559,6 +1594,10 @@ updater.check.launch = Check on launch
1559
1594
  update.released = build
1560
1595
  update.snap = Go to Snap Store
1561
1596
  update.title = Check for Updates
1597
+ vid.status.downloading = Downloading video... please wait...
1598
+ vid.status.generating = Generating video from
1599
+ vid.status.prompt.error = Enhancement prompt error occurred
1600
+ vid.status.prompt.wait = Preparing prompt... please wait...
1562
1601
  vision.capture.auto = Auto capture
1563
1602
  vision.capture.auto.click = Auto-capture is enabled!
1564
1603
  vision.capture.auto.label = Auto capture enabled
@@ -191,6 +191,7 @@ attachments_uploaded.tab = Archivos subidos
191
191
  audio.cache.clear.confirm = ¿Está seguro de querer eliminar todos los archivos de audio en caché?
192
192
  audio.cache.clear.success = OK. Todos los archivos de caché de audio fueron eliminados.
193
193
  audio.control.btn = Control de voz
194
+ audio.loop = Bucle
194
195
  audio.magic_word.detected = ¡Palabra mágica detectada!
195
196
  audio.magic_word.invalid = No es una palabra mágica :(
196
197
  audio.magic_word.please = Por favor, una palabra mágica...
@@ -846,7 +847,7 @@ mode.agent_openai.tooltip = Agentes avanzados (OpenAI)
846
847
  mode.agent.tooltip = Agentes simples (legacy)
847
848
  mode.assistant = Asistente
848
849
  mode.assistant.tooltip = Chatear usando la API de Asistentes
849
- mode.audio = Chat con audio
850
+ mode.audio = Realtime + audio
850
851
  mode.chat = Chat
851
852
  mode.chat.tooltip = Modo de chat (predeterminado)
852
853
  mode.completion = Finalización
@@ -855,7 +856,7 @@ mode.computer = Uso de la computadora
855
856
  mode.computer.tooltip = Uso de la computadora (ratón, teclado, navegación)
856
857
  mode.expert = Expertos (cooperación)
857
858
  mode.expert.tooltip = Llamar a expertos en segundo plano
858
- mode.img = Imagen
859
+ mode.img = Imagen y video
859
860
  mode.img.tooltip = Generar imagen usando DALL-E
860
861
  mode.langchain = Langchain
861
862
  mode.langchain.tooltip = Chatear con modelos proporcionados por Langchain
@@ -1128,6 +1129,8 @@ settings.audio.input.stop_interval.desc = Intervalo en segundos para transcribir
1128
1129
  settings.audio.input.timeout = Tiempo de espera de grabación
1129
1130
  settings.audio.input.timeout.continuous = Habilitar tiempo de espera en modo continuo
1130
1131
  settings.audio.input.timeout.desc = Tiempo de espera (segundos) para detener la grabación automáticamente, 0 para deshabilitar, por defecto: 120
1132
+ settings.audio.input.vad.prefix = Relleno de prefijo VAD (en ms)
1133
+ settings.audio.input.vad.silence = Silencio de final VAD (en ms)
1131
1134
  settings.audio.output.backend = Backend para la salida de audio
1132
1135
  settings.audio.output.backend.desc = Selecciona el backend para la salida de audio.
1133
1136
  settings.audio.output.device = Dispositivo para la salida de audio
@@ -1198,9 +1201,10 @@ settings.frequency_penalty = Penalización de frecuencia
1198
1201
  settings.func_call.native = Usar llamadas a funciones API nativas
1199
1202
  settings.func_call.native.desc = Si está habilitado, la aplicación usará llamadas a funciones API nativas en lugar del formato pygpt interno y los prompt de comandos a continuación no se usarán. Solo modos de Chat y Asistentes.
1200
1203
  settings.img_dialog_open = Abrir diálogo de imagen después de generar (Modo imagen)
1201
- settings.img_prompt_model = DALL-E: modelo de generación de indicaciones
1202
- settings.img_quality = DALL-E: calidad de imagen
1203
- settings.img_resolution = DALL-E: tamaño de imagen
1204
+ settings.img_prompt_model = Modelo de generación de indicaciones
1205
+ settings.img_prompt_model.desc = LLM utilizado para refinar su indicación antes de la generación de imágenes (no el modelo de imágenes)
1206
+ settings.img_quality = Calidad de imagen
1207
+ settings.img_resolution = Tamaño de imagen
1204
1208
  settings.layout.animation.disable = Desactivar animaciones
1205
1209
  settings.layout.animation.disable.desc = Desactivar animaciones de diseño, como cargadores animados, etc.
1206
1210
  settings.layout.density = Densidad de la disposición
@@ -1295,8 +1299,10 @@ settings.prompt.ctx.auto_summary.user = Contexto: resumen automático (mensaje d
1295
1299
  settings.prompt.ctx.auto_summary.user.desc = Marcadores de posición: {input}, {output}
1296
1300
  settings.prompt.expert = Experto: Master prompt
1297
1301
  settings.prompt.expert.desc = Instrucción (prompt del sistema) para el experto Master cómo manejar a los expertos subordinados. Las instrucciones para los expertos subordinados se dan desde sus presets.
1298
- settings.prompt.img = DALL-E: generación de imagen
1302
+ settings.prompt.img = Generación de imagen
1299
1303
  settings.prompt.img.desc = Mensaje para generar comandos para DALL-E (si el modo crudo está desactivado). Solo modo de imagen.
1304
+ settings.prompt.video = Generación de video
1305
+ settings.prompt.video.desc = Indicaciones para generar indicaciones para el modelo de video (si el modo sin formato está desactivado). Solo modo Imagen/Videos.
1300
1306
  settings.remote_tools.code_interpreter = Intérprete de Código
1301
1307
  settings.remote_tools.code_interpreter.desc = Habilitar herramienta remota `code_interpreter` en modo Chat / vía API de Respuestas de OpenAI.
1302
1308
  settings.remote_tools.file_search = File search
@@ -1340,7 +1346,9 @@ settings.section.ctx = Contexto
1340
1346
  settings.section.debug = Depuración
1341
1347
  settings.section.files = Archivos y adjuntos
1342
1348
  settings.section.general = General
1343
- settings.section.images = Imágenes
1349
+ settings.section.images = Imágenes y video
1350
+ settings.section.images.image = Imagen
1351
+ settings.section.images.video = Video
1344
1352
  settings.section.layout = Diseño
1345
1353
  settings.section.llama_index = Índices / LlamaIndex
1346
1354
  settings.section.llama-index.chat = Chat
@@ -1368,6 +1376,22 @@ settings.upload.data_dir.desc = Habilite para almacenar todo en un único direct
1368
1376
  settings.upload.store = Almacenar adjuntos en el directorio de subida del directorio de trabajo
1369
1377
  settings.upload.store.desc = Habilitar el almacenamiento de una copia local de los adjuntos subidos para su uso futuro
1370
1378
  settings.use_context = Utilizar contexto (memoria)
1379
+ settings.video.aspect_ratio = Relación de aspecto
1380
+ settings.video.aspect_ratio.desc = Relación de aspecto del cuadro (por ejemplo, 16:9, 9:16, 1:1); la disponibilidad depende del modelo seleccionado
1381
+ settings.video.duration = Duración de video
1382
+ settings.video.duration.desc = Longitud del clip en segundos; los límites pueden variar según el modelo
1383
+ settings.video.fps = FPS
1384
+ settings.video.fps.desc = Fotogramas por segundo (por ejemplo, 24, 25, 30); puede ser redondeado o ignorado por el modelo
1385
+ settings.video.generate_audio = Generar audio
1386
+ settings.video.generate_audio.desc = Incluir audio de fondo sintetizado si es compatible con el modelo
1387
+ settings.video.negative_prompt = Indicaciones negativas
1388
+ settings.video.negative_prompt.desc = Palabras o frases a evitar en el resultado (separadas por comas)
1389
+ settings.video.prompt_model = Modelo de mejora de indicación
1390
+ settings.video.prompt_model.desc = LLM utilizado para refinar su indicación antes de la generación de video (no el modelo de video)
1391
+ settings.video.resolution = Resolución de video
1392
+ settings.video.resolution.desc = Resolución de salida objetivo (por ejemplo, 720p, 1080p); la disponibilidad depende del modelo
1393
+ settings.video.seed = Semilla
1394
+ settings.video.seed.desc = Semilla aleatoria opcional para resultados reproducibles; déjelo vacío para aleatorio
1371
1395
  settings.vision.capture.auto = Captura automática
1372
1396
  settings.vision.capture.enabled = Cámara
1373
1397
  settings.vision.capture.height = Altura de captura de cámara (px)
@@ -1527,6 +1551,10 @@ updater.check.launch = Comprobar al iniciar
1527
1551
  update.released = Versión
1528
1552
  update.snap = Ir a Snap Store
1529
1553
  update.title = Buscando actualizaciones
1554
+ vid.status.downloading = Descargando video... por favor espere...
1555
+ vid.status.generating = Generando video desde
1556
+ vid.status.prompt.error = Ocurrió un error al mejorar la indicación
1557
+ vid.status.prompt.wait = Preparando indicación... por favor espere...
1530
1558
  vision.capture.auto = Captura automática
1531
1559
  vision.capture.auto.click = ¡La captura automática está habilitada!
1532
1560
  vision.capture.auto.label = Captura automática habilitada
@@ -191,6 +191,7 @@ attachments_uploaded.tab = Fichiers téléchargés
191
191
  audio.cache.clear.confirm = Êtes-vous sûr de vouloir supprimer tous les fichiers audio en cache ?
192
192
  audio.cache.clear.success = OK. Tous les fichiers de cache audio ont été effacés.
193
193
  audio.control.btn = Contrôle vocal
194
+ audio.loop = Boucle
194
195
  audio.magic_word.detected = Mot magique détecté !
195
196
  audio.magic_word.invalid = Pas un mot magique :(
196
197
  audio.magic_word.please = S'il vous plaît, le mot magique...
@@ -845,7 +846,7 @@ mode.agent_openai.tooltip = Agents avancés (OpenAI)
845
846
  mode.agent.tooltip = Agents simples (legacy)
846
847
  mode.assistant = Assistant
847
848
  mode.assistant.tooltip = Discuter via l'API des Assistants
848
- mode.audio = Chat avec audio
849
+ mode.audio = Realtime + audio
849
850
  mode.chat = Chat
850
851
  mode.chat.tooltip = Mode chat (par défaut)
851
852
  mode.completion = Complétion
@@ -854,7 +855,7 @@ mode.computer = Utilisation de l'ordinateur
854
855
  mode.computer.tooltip = Utilisation de l'ordinateur (souris, clavier, navigation)
855
856
  mode.expert = Experts (co-opération)
856
857
  mode.expert.tooltip = Appeler des experts en arrière-plan
857
- mode.img = Image
858
+ mode.img = Image et vidéo
858
859
  mode.img.tooltip = Génération d'image avec DALL-E
859
860
  mode.langchain = Langchain
860
861
  mode.langchain.tooltip = Discussion avec les modèles fournis par Langchain
@@ -1127,6 +1128,8 @@ settings.audio.input.stop_interval.desc = Intervalle en secondes pour la transcr
1127
1128
  settings.audio.input.timeout = Délai d'enregistrement
1128
1129
  settings.audio.input.timeout.continuous = Activer le délai en mode continu
1129
1130
  settings.audio.input.timeout.desc = Délai (secondes) pour l'arrêt automatique de l'enregistrement, 0 pour désactiver, par défaut : 120
1131
+ settings.audio.input.vad.prefix = Padding du préfixe VAD (en ms)
1132
+ settings.audio.input.vad.silence = Silence de fin VAD (en ms)
1130
1133
  settings.audio.output.backend = Backend pour la sortie audio
1131
1134
  settings.audio.output.backend.desc = Sélectionnez le backend pour la sortie audio.
1132
1135
  settings.audio.output.device = Périphérique pour la sortie audio
@@ -1197,9 +1200,10 @@ settings.frequency_penalty = Pénalité de fréquence
1197
1200
  settings.func_call.native = Utiliser les appels de fonction API natives
1198
1201
  settings.func_call.native.desc = Si activé, l'application utilisera les appels de fonction API natives au lieu du format interne de pygpt et les commandes prompt ci-dessous ne seront pas utilisées. Modes uniquement Chat et Assistants.
1199
1202
  settings.img_dialog_open = Ouvrir la boîte de dialogue d'image après la génération (Mode image)
1200
- settings.img_prompt_model = DALL-E : modèle de génération d'invite
1201
- settings.img_quality = DALL-E: qualité d'image
1202
- settings.img_resolution = DALL-E : taille de l'image
1203
+ settings.img_prompt_model = Modèle de génération d'invite
1204
+ settings.img_prompt_model.desc = LLM utilisé pour affiner votre invite avant la génération d'images (pas le modèle d'image)
1205
+ settings.img_quality = Qualité d'image
1206
+ settings.img_resolution = Taille de l'image
1203
1207
  settings.layout.animation.disable = Désactiver les animations
1204
1208
  settings.layout.animation.disable.desc = Désactive les animations de mise en page, comme les chargeurs animés, etc.
1205
1209
  settings.layout.density = Densité de la disposition
@@ -1294,8 +1298,10 @@ settings.prompt.ctx.auto_summary.user = Contexte: résumé automatique (message
1294
1298
  settings.prompt.ctx.auto_summary.user.desc = Espaces réservés: {input}, {output}
1295
1299
  settings.prompt.expert = Expert : Master prompt
1296
1300
  settings.prompt.expert.desc = Instruction (prompt système) pour l'expert Master sur comment gérer les experts esclaves. Les instructions pour les experts esclaves sont données à partir de leurs presets.
1297
- settings.prompt.img = DALL-E: génération d'image
1301
+ settings.prompt.img = Génération d'image
1298
1302
  settings.prompt.img.desc = Prompt pour générer des commandes pour DALL-E (si le mode brut est désactivé). Mode image uniquement.
1303
+ settings.prompt.video = Génération de vidéo
1304
+ settings.prompt.video.desc = Invite pour générer des invites pour le modèle vidéo (si le mode brut est désactivé). Mode Image/Vidéo uniquement.
1299
1305
  settings.remote_tools.code_interpreter = Interpréteur de code
1300
1306
  settings.remote_tools.code_interpreter.desc = Activer l'outil distant `code_interpreter` en mode Chat/ via OpenAI Responses API.
1301
1307
  settings.remote_tools.file_search = File search
@@ -1339,7 +1345,9 @@ settings.section.ctx = Contexte
1339
1345
  settings.section.debug = Débogage
1340
1346
  settings.section.files = Fichiers et pièces jointes
1341
1347
  settings.section.general = Général
1342
- settings.section.images = Images
1348
+ settings.section.images = Images et vidéos
1349
+ settings.section.images.image = Image
1350
+ settings.section.images.video = Vidéo
1343
1351
  settings.section.layout = Mise en page
1344
1352
  settings.section.llama_index = Indexes / LlamaIndex
1345
1353
  settings.section.llama-index.chat = Chat
@@ -1367,6 +1375,22 @@ settings.upload.data_dir.desc = Activez pour stocker tout dans un seul répertoi
1367
1375
  settings.upload.store = Stocker les pièces jointes dans le répertoire d'upload du répertoire de travail
1368
1376
  settings.upload.store.desc = Activer le stockage d'une copie locale des pièces jointes téléchargées pour une utilisation future
1369
1377
  settings.use_context = Utiliser le contexte (mémoire)
1378
+ settings.video.aspect_ratio = Ratio d'aspect
1379
+ settings.video.aspect_ratio.desc = Ratio d'aspect du cadre (ex. : 16:9, 9:16, 1:1); la disponibilité dépend du modèle sélectionné
1380
+ settings.video.duration = Durée de la vidéo
1381
+ settings.video.duration.desc = Longueur du clip en secondes; les limites peuvent varier selon le modèle
1382
+ settings.video.fps = FPS
1383
+ settings.video.fps.desc = Images par seconde (ex. : 24, 25, 30); peut être arrondi ou ignoré par le modèle
1384
+ settings.video.generate_audio = Générer de l'audio
1385
+ settings.video.generate_audio.desc = Inclure un fond audio synthétisé si pris en charge par le modèle
1386
+ settings.video.negative_prompt = Invite négative
1387
+ settings.video.negative_prompt.desc = Mots ou phrases à éviter dans le résultat (séparés par des virgules)
1388
+ settings.video.prompt_model = Modèle d'amélioration de l'invite
1389
+ settings.video.prompt_model.desc = LLM utilisé pour affiner votre invite avant la génération de la vidéo (pas le modèle vidéo)
1390
+ settings.video.resolution = Résolution vidéo
1391
+ settings.video.resolution.desc = Résolution de sortie cible (ex. : 720p, 1080p); la disponibilité dépend du modèle
1392
+ settings.video.seed = Graine
1393
+ settings.video.seed.desc = Graine aléatoire facultative pour des résultats reproductibles; laisser vide pour aléatoire
1370
1394
  settings.vision.capture.auto = Capture automatique
1371
1395
  settings.vision.capture.enabled = Caméra
1372
1396
  settings.vision.capture.height = Hauteur de capture par caméra (px)
@@ -1526,6 +1550,10 @@ updater.check.launch = Vérifier au démarrage
1526
1550
  update.released = build
1527
1551
  update.snap = Aller au Snap Store
1528
1552
  update.title = Vérification des mises à jour
1553
+ vid.status.downloading = Téléchargement de la vidéo... veuillez patienter...
1554
+ vid.status.generating = Génération de la vidéo à partir de
1555
+ vid.status.prompt.error = Une erreur s'est produite lors de l'amélioration de l'invite
1556
+ vid.status.prompt.wait = Préparation de l'invite... veuillez patienter...
1529
1557
  vision.capture.auto = Capture automatique
1530
1558
  vision.capture.auto.click = La capture automatique est activée !
1531
1559
  vision.capture.auto.label = Capture automatique activée
@@ -191,6 +191,7 @@ attachments_uploaded.tab = File caricati
191
191
  audio.cache.clear.confirm = Sei sicuro di voler eliminare tutti i file audio memorizzati nella cache?
192
192
  audio.cache.clear.success = OK. Tutti i file della cache audio sono stati cancellati.
193
193
  audio.control.btn = Controllo vocale
194
+ audio.loop = Ciclo
194
195
  audio.magic_word.detected = Parola magica rilevata!
195
196
  audio.magic_word.invalid = Non è una parola magica :(
196
197
  audio.magic_word.please = Per favore, parola magica...
@@ -845,7 +846,7 @@ mode.agent_openai.tooltip = Agenti avanzati (OpenAI)
845
846
  mode.agent.tooltip = Agenti semplici (legacy)
846
847
  mode.assistant = Assistente
847
848
  mode.assistant.tooltip = Chattare utilizzando l'API degli Assistenti
848
- mode.audio = Chat con audio
849
+ mode.audio = Realtime + audio
849
850
  mode.chat = Chat
850
851
  mode.chat.tooltip = Modalità chat (predefinita)
851
852
  mode.completion = Completamento
@@ -854,7 +855,7 @@ mode.computer = Uso del computer
854
855
  mode.computer.tooltip = Uso del computer (mouse, tastiera, navigazione)
855
856
  mode.expert = Esperti (cooperazione)
856
857
  mode.expert.tooltip = Chiamare esperti in background
857
- mode.img = Immagine
858
+ mode.img = Immagine e video
858
859
  mode.img.tooltip = Generazione immagini con DALL-E
859
860
  mode.langchain = Langchain
860
861
  mode.langchain.tooltip = Chattare con modelli forniti da Langchain
@@ -1127,6 +1128,8 @@ settings.audio.input.stop_interval.desc = Intervallo in secondi per la trascrizi
1127
1128
  settings.audio.input.timeout = Timeout di registrazione
1128
1129
  settings.audio.input.timeout.continuous = Abilita timeout in modalità continua
1129
1130
  settings.audio.input.timeout.desc = Timeout (secondi) per l'arresto automatico della registrazione, 0 per disabilitare, predefinito: 120
1131
+ settings.audio.input.vad.prefix = Padding prefisso VAD (in ms)
1132
+ settings.audio.input.vad.silence = Silenzio finale VAD (in ms)
1130
1133
  settings.audio.output.backend = Backend per l'uscita audio
1131
1134
  settings.audio.output.backend.desc = Seleziona il backend per l'uscita audio.
1132
1135
  settings.audio.output.device = Dispositivo per l'uscita audio
@@ -1197,9 +1200,10 @@ settings.frequency_penalty = Penale di frequenza
1197
1200
  settings.func_call.native = Usa chiamate di funzione API native
1198
1201
  settings.func_call.native.desc = Se abilitato, l'applicazione utilizzerà le chiamate di funzione API native invece del formato interno pygpt e i prompt di comando di seguito non saranno utilizzati. Solo modalità chat e assistenti.
1199
1202
  settings.img_dialog_open = Apri la finestra di dialogo dell'immagine dopo la generazione (Modalità immagine)
1200
- settings.img_prompt_model = DALL-E: modello di generazione del prompt
1201
- settings.img_quality = DALL-E: qualità dell'immagine
1202
- settings.img_resolution = DALL-E: dimensione dell'immagine
1203
+ settings.img_prompt_model = Modello di generazione del prompt
1204
+ settings.img_prompt_model.desc = LLM utilizzato per affinare il tuo prompt prima della generazione di immagini (non il modello di immagini)
1205
+ settings.img_quality = Qualità dell'immagine
1206
+ settings.img_resolution = Dimensione dell'immagine
1203
1207
  settings.layout.animation.disable = Disabilita animazioni
1204
1208
  settings.layout.animation.disable.desc = Disabilita le animazioni del layout, come i caricamenti animati, ecc.
1205
1209
  settings.layout.density = Densità del layout
@@ -1294,8 +1298,10 @@ settings.prompt.ctx.auto_summary.user = Contesto: auto-riassunto (messaggio dell
1294
1298
  settings.prompt.ctx.auto_summary.user.desc = Placeholder: {input}, {output}
1295
1299
  settings.prompt.expert = Esperto: Master prompt
1296
1300
  settings.prompt.expert.desc = Istruzione (prompt del sistema) per l'esperto Master su come gestire gli esperti subalterni. Le istruzioni per gli esperti subalterni sono date dalle loro preimpostazioni.
1297
- settings.prompt.img = DALL-E: generazione immagine
1301
+ settings.prompt.img = Generazione immagine
1298
1302
  settings.prompt.img.desc = Prompt per generare comandi per DALL-E (se la modalità grezza è disabilitata). Solo modalità immagine.
1303
+ settings.prompt.video = Generazione video
1304
+ settings.prompt.video.desc = Prompt per generare prompt per il modello video (se la modalità grezza è disabilitata). Solo modalità Immagine/Video.
1299
1305
  settings.remote_tools.code_interpreter = Interprete del codice
1300
1306
  settings.remote_tools.code_interpreter.desc = Abilita l'attrezzo remoto `code_interpreter` in modalità Chat / tramite API delle Risposte di OpenAI.
1301
1307
  settings.remote_tools.file_search = File search
@@ -1339,7 +1345,9 @@ settings.section.ctx = Contesto
1339
1345
  settings.section.debug = Debug
1340
1346
  settings.section.files = File e allegati
1341
1347
  settings.section.general = Generale
1342
- settings.section.images = Immagini
1348
+ settings.section.images = Immagini e video
1349
+ settings.section.images.image = Immagine
1350
+ settings.section.images.video = Video
1343
1351
  settings.section.layout = Layout
1344
1352
  settings.section.llama_index = Indici / LlamaIndex
1345
1353
  settings.section.llama-index.chat = Chat
@@ -1367,6 +1375,22 @@ settings.upload.data_dir.desc = Abilita per memorizzare tutto in una singola dir
1367
1375
  settings.upload.store = Conserva gli allegati nella cartella di upload del workdir
1368
1376
  settings.upload.store.desc = Abilita la conservazione di una copia locale degli allegati caricati per un uso futuro
1369
1377
  settings.use_context = Usa contesto (memoria)
1378
+ settings.video.aspect_ratio = Rapporto d'aspetto
1379
+ settings.video.aspect_ratio.desc = Rapporto d'aspetto del fotogramma (es. 16:9, 9:16, 1:1); la disponibilità dipende dal modello selezionato
1380
+ settings.video.duration = Durata video
1381
+ settings.video.duration.desc = Lunghezza della clip in secondi; i limiti possono variare in base al modello
1382
+ settings.video.fps = FPS
1383
+ settings.video.fps.desc = Fotogrammi al secondo (es. 24, 25, 30); può essere arrotondato o ignorato dal modello
1384
+ settings.video.generate_audio = Genera audio
1385
+ settings.video.generate_audio.desc = Include audio di sottofondo sintetizzato se supportato dal modello
1386
+ settings.video.negative_prompt = Prompt negativo
1387
+ settings.video.negative_prompt.desc = Parole o frasi da evitare nel risultato (separate da virgole)
1388
+ settings.video.prompt_model = Modello di miglioramento del prompt
1389
+ settings.video.prompt_model.desc = LLM utilizzato per affinare il tuo prompt prima della generazione video (non il modello video)
1390
+ settings.video.resolution = Risoluzione video
1391
+ settings.video.resolution.desc = Risoluzione di uscita target (es. 720p, 1080p); la disponibilità dipende dal modello
1392
+ settings.video.seed = Seme
1393
+ settings.video.seed.desc = Seme casuale opzionale per risultati riproducibili; lascia vuoto per casuale
1370
1394
  settings.vision.capture.auto = Cattura automatica
1371
1395
  settings.vision.capture.enabled = Fotocamera
1372
1396
  settings.vision.capture.height = Altezza cattura fotocamera (px)
@@ -1526,6 +1550,10 @@ updater.check.launch = Controlla all'avvio
1526
1550
  update.released = build
1527
1551
  update.snap = Vai allo Snap Store
1528
1552
  update.title = Controllo degli aggiornamenti
1553
+ vid.status.downloading = Download del video... si prega di attendere...
1554
+ vid.status.generating = Generazione video da
1555
+ vid.status.prompt.error = Si è verificato un errore durante il miglioramento del prompt
1556
+ vid.status.prompt.wait = Preparazione del prompt... si prega di attendere...
1529
1557
  vision.capture.auto = Cattura automatica
1530
1558
  vision.capture.auto.click = La cattura automatica è abilitata!
1531
1559
  vision.capture.auto.label = Cattura automatica abilitata