pygpt-net 2.6.31__py3-none-any.whl → 2.6.32__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (56) hide show
  1. pygpt_net/CHANGELOG.txt +7 -0
  2. pygpt_net/__init__.py +3 -3
  3. pygpt_net/app.py +3 -1
  4. pygpt_net/app_core.py +3 -1
  5. pygpt_net/config.py +3 -1
  6. pygpt_net/controller/__init__.py +5 -1
  7. pygpt_net/controller/audio/audio.py +13 -0
  8. pygpt_net/controller/chat/common.py +18 -83
  9. pygpt_net/controller/lang/custom.py +2 -2
  10. pygpt_net/controller/media/__init__.py +12 -0
  11. pygpt_net/controller/media/media.py +115 -0
  12. pygpt_net/controller/realtime/realtime.py +27 -2
  13. pygpt_net/controller/ui/mode.py +16 -2
  14. pygpt_net/core/audio/backend/pyaudio/realtime.py +51 -14
  15. pygpt_net/core/audio/output.py +3 -2
  16. pygpt_net/core/image/image.py +6 -5
  17. pygpt_net/core/realtime/worker.py +1 -5
  18. pygpt_net/core/render/web/body.py +24 -3
  19. pygpt_net/core/text/utils.py +54 -2
  20. pygpt_net/core/types/image.py +7 -1
  21. pygpt_net/core/video/__init__.py +12 -0
  22. pygpt_net/core/video/video.py +290 -0
  23. pygpt_net/data/config/config.json +19 -4
  24. pygpt_net/data/config/models.json +75 -3
  25. pygpt_net/data/config/settings.json +194 -6
  26. pygpt_net/data/css/web-blocks.css +6 -0
  27. pygpt_net/data/css/web-chatgpt.css +6 -0
  28. pygpt_net/data/css/web-chatgpt_wide.css +6 -0
  29. pygpt_net/data/locale/locale.de.ini +30 -2
  30. pygpt_net/data/locale/locale.en.ini +40 -7
  31. pygpt_net/data/locale/locale.es.ini +30 -2
  32. pygpt_net/data/locale/locale.fr.ini +30 -2
  33. pygpt_net/data/locale/locale.it.ini +30 -2
  34. pygpt_net/data/locale/locale.pl.ini +33 -2
  35. pygpt_net/data/locale/locale.uk.ini +30 -2
  36. pygpt_net/data/locale/locale.zh.ini +30 -2
  37. pygpt_net/data/locale/plugin.cmd_web.en.ini +8 -0
  38. pygpt_net/item/model.py +22 -1
  39. pygpt_net/provider/api/google/__init__.py +38 -2
  40. pygpt_net/provider/api/google/video.py +364 -0
  41. pygpt_net/provider/api/openai/realtime/realtime.py +1 -2
  42. pygpt_net/provider/core/config/patch.py +226 -178
  43. pygpt_net/provider/core/model/patch.py +17 -2
  44. pygpt_net/provider/web/duckduck_search.py +212 -0
  45. pygpt_net/ui/layout/toolbox/audio.py +55 -0
  46. pygpt_net/ui/layout/toolbox/footer.py +14 -58
  47. pygpt_net/ui/layout/toolbox/image.py +3 -14
  48. pygpt_net/ui/layout/toolbox/raw.py +52 -0
  49. pygpt_net/ui/layout/toolbox/split.py +48 -0
  50. pygpt_net/ui/layout/toolbox/toolbox.py +8 -8
  51. pygpt_net/ui/layout/toolbox/video.py +49 -0
  52. {pygpt_net-2.6.31.dist-info → pygpt_net-2.6.32.dist-info}/METADATA +23 -11
  53. {pygpt_net-2.6.31.dist-info → pygpt_net-2.6.32.dist-info}/RECORD +56 -46
  54. {pygpt_net-2.6.31.dist-info → pygpt_net-2.6.32.dist-info}/LICENSE +0 -0
  55. {pygpt_net-2.6.31.dist-info → pygpt_net-2.6.32.dist-info}/WHEEL +0 -0
  56. {pygpt_net-2.6.31.dist-info → pygpt_net-2.6.32.dist-info}/entry_points.txt +0 -0
@@ -81,7 +81,7 @@
81
81
  "multiplier": null,
82
82
  "step": null,
83
83
  "secret": false,
84
- "advanced": false,
84
+ "advanced": true,
85
85
  "tab": "OpenAI"
86
86
  },
87
87
  "api_use_responses_llama": {
@@ -96,7 +96,7 @@
96
96
  "multiplier": null,
97
97
  "step": null,
98
98
  "secret": false,
99
- "advanced": false,
99
+ "advanced": true,
100
100
  "tab": "OpenAI"
101
101
  },
102
102
  "api_key_google": {
@@ -148,6 +148,66 @@
148
148
  "advanced": false,
149
149
  "tab": "Google"
150
150
  },
151
+ "api_native_google.use_vertex": {
152
+ "section": "api_keys",
153
+ "type": "bool",
154
+ "slider": false,
155
+ "label": "settings.api_native_google.use_vertex",
156
+ "description": "settings.api_native_google.use_vertex.desc",
157
+ "value": true,
158
+ "min": null,
159
+ "max": null,
160
+ "multiplier": null,
161
+ "step": null,
162
+ "secret": false,
163
+ "advanced": true,
164
+ "tab": "Google"
165
+ },
166
+ "api_native_google.cloud_project": {
167
+ "section": "api_keys",
168
+ "type": "text",
169
+ "slider": false,
170
+ "label": "settings.api_native_google.cloud_project",
171
+ "description": "settings.api_native_google.cloud_project.desc",
172
+ "value": "",
173
+ "min": null,
174
+ "max": null,
175
+ "multiplier": null,
176
+ "step": null,
177
+ "secret": false,
178
+ "advanced": true,
179
+ "tab": "Google"
180
+ },
181
+ "api_native_google.cloud_location": {
182
+ "section": "api_keys",
183
+ "type": "text",
184
+ "slider": false,
185
+ "label": "settings.api_native_google.cloud_location",
186
+ "description": "settings.api_native_google.cloud_location.desc",
187
+ "value": "us-central1",
188
+ "min": null,
189
+ "max": null,
190
+ "multiplier": null,
191
+ "step": null,
192
+ "secret": false,
193
+ "advanced": true,
194
+ "tab": "Google"
195
+ },
196
+ "api_native_google.app_credentials": {
197
+ "section": "api_keys",
198
+ "type": "text",
199
+ "slider": false,
200
+ "label": "settings.api_native_google.app_credentials",
201
+ "description": "settings.api_native_google.app_credentials.desc",
202
+ "value": "",
203
+ "min": null,
204
+ "max": null,
205
+ "multiplier": null,
206
+ "step": null,
207
+ "secret": false,
208
+ "advanced": true,
209
+ "tab": "Google"
210
+ },
151
211
  "api_key_anthropic": {
152
212
  "section": "api_keys",
153
213
  "type": "text",
@@ -1256,6 +1316,19 @@
1256
1316
  "step": null,
1257
1317
  "advanced": false
1258
1318
  },
1319
+ "prompt.video": {
1320
+ "section": "prompts",
1321
+ "type": "textarea",
1322
+ "slider": false,
1323
+ "label": "settings.prompt.video",
1324
+ "description": "settings.prompt.video.desc",
1325
+ "value": "",
1326
+ "min": null,
1327
+ "max": null,
1328
+ "multiplier": null,
1329
+ "step": null,
1330
+ "advanced": false
1331
+ },
1259
1332
  "img_resolution": {
1260
1333
  "section": "images",
1261
1334
  "type": "combo",
@@ -1294,7 +1367,8 @@
1294
1367
  {"2560x1792": "[Imagen 4.0] 2560x1792"},
1295
1368
  {"1536x2816": "[Imagen 4.0] 1536x2816"},
1296
1369
  {"2816x1536": "[Imagen 4.0] 2816x1536"}
1297
- ]
1370
+ ],
1371
+ "tab": "image"
1298
1372
  },
1299
1373
  "img_quality": {
1300
1374
  "section": "images",
@@ -1315,7 +1389,8 @@
1315
1389
  {"standard": "[DALL-E 3] standard"},
1316
1390
  {"hd": "[DALL-E 3] hd"},
1317
1391
  {"standard": "[DALL-E 2] standard"}
1318
- ]
1392
+ ],
1393
+ "tab": "image"
1319
1394
  },
1320
1395
  "img_prompt_model": {
1321
1396
  "section": "images",
@@ -1323,12 +1398,125 @@
1323
1398
  "use": "models",
1324
1399
  "slider": false,
1325
1400
  "label": "settings.img_prompt_model",
1326
- "value": "gpt-4-1106-preview",
1401
+ "description": "settings.img_prompt_model.desc",
1402
+ "value": "gpt-4o",
1327
1403
  "min": null,
1328
1404
  "max": null,
1329
1405
  "multiplier": null,
1330
1406
  "step": null,
1331
- "advanced": true
1407
+ "tab": "image"
1408
+ },
1409
+ "video.aspect_ratio": {
1410
+ "section": "images",
1411
+ "type": "text",
1412
+ "slider": false,
1413
+ "label": "settings.video.aspect_ratio",
1414
+ "description": "settings.video.aspect_ratio.desc",
1415
+ "value": "",
1416
+ "min": null,
1417
+ "max": null,
1418
+ "multiplier": null,
1419
+ "step": null,
1420
+ "advanced": false,
1421
+ "tab": "video"
1422
+ },
1423
+ "video.duration": {
1424
+ "section": "images",
1425
+ "type": "int",
1426
+ "slider": false,
1427
+ "label": "settings.video.duration",
1428
+ "description": "settings.video.duration.desc",
1429
+ "value": "",
1430
+ "min": 1,
1431
+ "max": null,
1432
+ "multiplier": null,
1433
+ "step": null,
1434
+ "advanced": false,
1435
+ "tab": "video"
1436
+ },
1437
+ "video.fps": {
1438
+ "section": "images",
1439
+ "type": "int",
1440
+ "slider": false,
1441
+ "label": "settings.video.fps",
1442
+ "description": "settings.video.fps.desc",
1443
+ "value": "",
1444
+ "min": null,
1445
+ "max": null,
1446
+ "multiplier": null,
1447
+ "step": null,
1448
+ "advanced": false,
1449
+ "tab": "video"
1450
+ },
1451
+ "video.seed": {
1452
+ "section": "images",
1453
+ "type": "text",
1454
+ "slider": false,
1455
+ "label": "settings.video.seed",
1456
+ "description": "settings.video.seed.desc",
1457
+ "value": "",
1458
+ "min": null,
1459
+ "max": null,
1460
+ "multiplier": null,
1461
+ "step": null,
1462
+ "advanced": false,
1463
+ "tab": "video"
1464
+ },
1465
+ "video.generate_audio": {
1466
+ "section": "images",
1467
+ "type": "bool",
1468
+ "slider": false,
1469
+ "label": "settings.video.generate_audio",
1470
+ "description": "settings.video.generate_audio.desc",
1471
+ "value": false,
1472
+ "min": null,
1473
+ "max": null,
1474
+ "multiplier": null,
1475
+ "step": null,
1476
+ "advanced": false,
1477
+ "tab": "video"
1478
+ },
1479
+ "video.resolution": {
1480
+ "section": "images",
1481
+ "type": "text",
1482
+ "slider": false,
1483
+ "label": "settings.video.resolution",
1484
+ "description": "settings.video.resolution.desc",
1485
+ "value": "",
1486
+ "min": null,
1487
+ "max": null,
1488
+ "multiplier": null,
1489
+ "step": null,
1490
+ "advanced": false,
1491
+ "tab": "video"
1492
+ },
1493
+ "video.negative_prompt": {
1494
+ "section": "images",
1495
+ "type": "textarea",
1496
+ "slider": false,
1497
+ "label": "settings.video.negative_prompt",
1498
+ "description": "settings.video.negative_prompt.desc",
1499
+ "value": "",
1500
+ "min": null,
1501
+ "max": null,
1502
+ "multiplier": null,
1503
+ "step": null,
1504
+ "advanced": false,
1505
+ "tab": "video"
1506
+ },
1507
+ "video.prompt_model": {
1508
+ "section": "images",
1509
+ "type": "combo",
1510
+ "use": "models",
1511
+ "slider": false,
1512
+ "label": "settings.video.prompt_model",
1513
+ "description": "settings.video.prompt_model.desc",
1514
+ "value": "gemini-2.5-flash",
1515
+ "min": null,
1516
+ "max": null,
1517
+ "multiplier": null,
1518
+ "step": null,
1519
+ "tab": "video"
1332
1520
  },
1333
1521
  "vision.capture.idx": {
1334
1522
  "section": "vision",
@@ -404,4 +404,10 @@ think {{
404
404
  }}
405
405
  .tips.visible {{
406
406
  opacity: 1;
407
+ }}
408
+
409
+ .extra-src-video-box,
410
+ .video-player {{
411
+ max-width: 400px;
412
+ text-align: left;
407
413
  }}
@@ -434,4 +434,10 @@ think {{
434
434
 
435
435
  .name-user {{
436
436
  display: none;
437
+ }}
438
+
439
+ .extra-src-video-box,
440
+ .video-player {{
441
+ max-width: 400px;
442
+ text-align: left;
437
443
  }}
@@ -430,4 +430,10 @@ think {{
430
430
 
431
431
  .name-user {{
432
432
  display: none;
433
+ }}
434
+
435
+ .extra-src-video-box,
436
+ .video-player {{
437
+ max-width: 400px;
438
+ text-align: left;
433
439
  }}
@@ -191,6 +191,7 @@ attachments_uploaded.tab = Hochgeladene Dateien
191
191
  audio.cache.clear.confirm = Sind Sie sicher, dass Sie alle zwischengespeicherten Audiodateien löschen möchten?
192
192
  audio.cache.clear.success = OK. Alle Audio-Cache-Dateien wurden gelöscht.
193
193
  audio.control.btn = Sprachsteuerung
194
+ audio.loop = Schleife
194
195
  audio.magic_word.detected = Zauberwort erkannt!
195
196
  audio.magic_word.invalid = Kein Zauberwort :(
196
197
  audio.magic_word.please = Bitte das Zauberwort...
@@ -854,7 +855,7 @@ mode.computer = Computerbenutzung
854
855
  mode.computer.tooltip = Computerbenutzung (Maus, Tastatur, Navigation)
855
856
  mode.expert = Experten (Kooperation)
856
857
  mode.expert.tooltip = Experten zum Hintergrund rufen
857
- mode.img = Bild
858
+ mode.img = Bild und Video
858
859
  mode.img.tooltip = Bildgenerierung mit DALL-E
859
860
  mode.langchain = Langchain
860
861
  mode.langchain.tooltip = Chat mit Modellen von Langchain
@@ -1127,6 +1128,8 @@ settings.audio.input.stop_interval.desc = Intervall in Sekunden für automatisch
1127
1128
  settings.audio.input.timeout = Aufnahme-Zeitüberschreitung
1128
1129
  settings.audio.input.timeout.continuous = Zeitüberschreitung im Dauerbetrieb aktivieren
1129
1130
  settings.audio.input.timeout.desc = Zeitüberschreitung (Sekunden) für automatische Stop-Aufzeichnung, 0 zum Deaktivieren, Standard: 120
1131
+ settings.audio.input.vad.prefix = VAD-Präfix-Puffer (in ms)
1132
+ settings.audio.input.vad.silence = VAD-Endstille (in ms)
1130
1133
  settings.audio.output.backend = Backend für Audioausgabe
1131
1134
  settings.audio.output.backend.desc = Wählen Sie das Backend für die Audioausgabe.
1132
1135
  settings.audio.output.device = Gerät für Audioausgabe
@@ -1198,6 +1201,7 @@ settings.func_call.native = Native API-Funktionsaufrufe verwenden
1198
1201
  settings.func_call.native.desc = Wenn aktiviert, benutzt die Anwendung native API-Funktionsaufrufe anstelle des internen pygpt-Formats und der unten stehenden Befehlsprompten. Nur Chat- und Assistenz-Modi.
1199
1202
  settings.img_dialog_open = Bild-Dialog nach Generierung öffnen (Bildmodus)
1200
1203
  settings.img_prompt_model = Modell zur Prompterzeugung
1204
+ settings.img_prompt_model.desc = LLM zur Verfeinerung Ihrer Eingabeaufforderung vor der Bilderzeugung (nicht das Bildmodell)
1201
1205
  settings.img_quality = image quality
1202
1206
  settings.img_resolution = Bildgröße
1203
1207
  settings.layout.animation.disable = Animationen deaktivieren
@@ -1296,6 +1300,8 @@ settings.prompt.expert = Experte: Masteraufforderung
1296
1300
  settings.prompt.expert.desc = Anweisung (Systemaufforderung) für den Master-Experten, wie man Sklavenexperten handhabt. Anweisungen für Sklavenexperten werden aus ihren Voreinstellungen gegeben.
1297
1301
  settings.prompt.img = Bildgenerierung
1298
1302
  settings.prompt.img.desc = Aufforderung zur Erzeugung von Anweisungen für DALL-E (falls Rohmodus deaktiviert ist). Nur im Bildmodus.
1303
+ settings.prompt.video = Videogenerierung
1304
+ settings.prompt.video.desc = Eingabeaufforderung zur Erzeugung von Eingabeaufforderungen für das Videomodell (wenn der Rohmodus deaktiviert ist). Nur Bild-/Videomodus.
1299
1305
  settings.remote_tools.code_interpreter = Code-Interpreter
1300
1306
  settings.remote_tools.code_interpreter.desc = Aktivieren Sie das `code_interpreter` Remote-Tool im Chat-Modus / über OpenAI Responses API.
1301
1307
  settings.remote_tools.file_search = File search
@@ -1339,7 +1345,9 @@ settings.section.ctx = Kontext
1339
1345
  settings.section.debug = Fehlerbehebung
1340
1346
  settings.section.files = Dateien und Anhänge
1341
1347
  settings.section.general = Allgemein
1342
- settings.section.images = Bilder
1348
+ settings.section.images = Bilder und Videos
1349
+ settings.section.images.image = Bild
1350
+ settings.section.images.video = Video
1343
1351
  settings.section.layout = Layout
1344
1352
  settings.section.llama_index = Indizes / LlamaIndex
1345
1353
  settings.section.llama-index.chat = Chat
@@ -1367,6 +1375,22 @@ settings.upload.data_dir.desc = Włącz, aby przechowywać wszystko w jednym kat
1367
1375
  settings.upload.store = Speichere Anhänge im Arbeitsverzeichnis im Upload-Ordner
1368
1376
  settings.upload.store.desc = Aktiviere das Speichern einer lokalen Kopie hochgeladener Anhänge zur späteren Verwendung
1369
1377
  settings.use_context = Kontext (Erinnerung) verwenden
1378
+ settings.video.aspect_ratio = Seitenverhältnis
1379
+ settings.video.aspect_ratio.desc = Seitenverhältnis des Rahmens (z.B. 16:9, 9:16, 1:1); Verfügbarkeit hängt vom ausgewählten Modell ab
1380
+ settings.video.duration = Videodauer
1381
+ settings.video.duration.desc = Clip-Länge in Sekunden; Grenzen können je nach Modell variieren
1382
+ settings.video.fps = FPS
1383
+ settings.video.fps.desc = Bilder pro Sekunde (z.B. 24, 25, 30); kann vom Modell gerundet oder ignoriert werden
1384
+ settings.video.generate_audio = Audio generieren
1385
+ settings.video.generate_audio.desc = Bei Unterstützung durch das Modell synthetisiertes Hintergrundaudio einschließen
1386
+ settings.video.negative_prompt = Negative Eingabeaufforderung
1387
+ settings.video.negative_prompt.desc = Wörter oder Sätze, die im Ergebnis vermieden werden sollen (durch Kommas getrennt)
1388
+ settings.video.prompt_model = Modell zur Verbesserung von Eingabeaufforderungen
1389
+ settings.video.prompt_model.desc = LLM zur Verfeinerung Ihrer Eingabeaufforderung vor der Videogenerierung (nicht das Videomodell)
1390
+ settings.video.resolution = Videoauflösung
1391
+ settings.video.resolution.desc = Zielausgabeauflösung (z.B. 720p, 1080p); Verfügbarkeit hängt vom Modell ab
1392
+ settings.video.seed = Startwert
1393
+ settings.video.seed.desc = Optionaler Zufallsstartwert für reproduzierbare Ergebnisse; leer lassen für zufällig
1370
1394
  settings.vision.capture.auto = Automatisches Erfassen
1371
1395
  settings.vision.capture.enabled = Kamera
1372
1396
  settings.vision.capture.height = Kamerabildhöhe (px)
@@ -1526,6 +1550,10 @@ updater.check.launch = Beim Start prüfen
1526
1550
  update.released = Build
1527
1551
  update.snap = Zum Snap Store gehen
1528
1552
  update.title = Nach Updates suchen
1553
+ vid.status.downloading = Video wird heruntergeladen... bitte warten...
1554
+ vid.status.generating = Video wird generiert von
1555
+ vid.status.prompt.error = Fehler bei der Verbesserungsaufforderung
1556
+ vid.status.prompt.wait = Vorbereitung der Eingabeaufforderung... bitte warten...
1529
1557
  vision.capture.auto = Automatische Erfassung
1530
1558
  vision.capture.auto.click = Automatisches Erfassen ist aktiviert!
1531
1559
  vision.capture.auto.label = Automatische Erfassung aktiviert
@@ -192,6 +192,7 @@ audio.auto_turn = Auto (VAD)
192
192
  audio.cache.clear.confirm = Are you sure you want to delete all cached audio files?
193
193
  audio.cache.clear.success = OK. All audio cache files cleared.
194
194
  audio.control.btn = Voice control
195
+ audio.loop = Loop
195
196
  audio.magic_word.detected = Magic word detected!
196
197
  audio.magic_word.invalid = Not a magic word :(
197
198
  audio.magic_word.please = Magic word please...
@@ -855,8 +856,8 @@ mode.computer = Computer use
855
856
  mode.computer.tooltip = Computer use (mouse, keyboard, navigation)
856
857
  mode.expert = Experts (Co-op)
857
858
  mode.expert.tooltip = Experts to call in the background
858
- mode.img = Image
859
- mode.img.tooltip = Image generation using DALL-E
859
+ mode.img = Image and video
860
+ mode.img.tooltip = Image generation
860
861
  mode.langchain = Langchain
861
862
  mode.langchain.tooltip = Chat with models provided by Langchain
862
863
  model.ctx = Context tokens
@@ -1120,7 +1121,15 @@ settings.api_key.voyage.desc = Required for the Voyage API - embeddings for Anth
1120
1121
  settings.api_key.xai = xAI API KEY
1121
1122
  settings.api_key.xai.desc = Required for the xAI API and Grok models.
1122
1123
  settings.api_native_google = Use native API SDK
1124
+ settings.api_native_google.app_credentials = Google Application credentials (path)
1125
+ settings.api_native_google.app_credentials.desc = Absolute path to credentials.json, e.g. /home/user/credentials.json
1126
+ settings.api_native_google.cloud_location = Google Cloud location
1127
+ settings.api_native_google.cloud_location.desc = Provide your Google Cloud project location, default: us-central1
1128
+ settings.api_native_google.cloud_project = Google Cloud project
1129
+ settings.api_native_google.cloud_project.desc = Provide your Google Cloud project name
1123
1130
  settings.api_native_google.desc = Use native GenAI SDK instead of compatible OpenAI client
1131
+ settings.api_native_google.use_vertex = Use VertexAI
1132
+ settings.api_native_google.use_vertex.desc = Enable to use VertexAI in Google GenAI SDK
1124
1133
  settings.api_proxy = Proxy address
1125
1134
  settings.api_proxy.desc = Optional, proxy for OpenAI API, e.g. http://proxy.example.com or socks5://user:pass@host:port
1126
1135
  settings.api_use_responses = Use Responses API in Chat mode
@@ -1148,6 +1157,8 @@ settings.audio.input.stop_interval.desc = Interval in seconds for auto-transcrib
1148
1157
  settings.audio.input.timeout = Recording timeout
1149
1158
  settings.audio.input.timeout.continuous = Enable timeout in continuous mode
1150
1159
  settings.audio.input.timeout.desc = Timeout (seconds) for auto-stop recording, 0 to disable, default: 120
1160
+ settings.audio.input.vad.prefix = VAD prefix padding (in ms)
1161
+ settings.audio.input.vad.silence = VAD end silence (in ms)
1151
1162
  settings.audio.output.backend = Audio Output Backend
1152
1163
  settings.audio.output.backend.desc = Select the audio output backend.
1153
1164
  settings.audio.output.device = Audio Output Device
@@ -1221,6 +1232,7 @@ settings.func_call.native = Use native API function calls
1221
1232
  settings.func_call.native.desc = If enabled, the application will use native API function calls instead of the internal pygpt format and the command prompts from below will not be used. Chat and Assistants modes ONLY.
1222
1233
  settings.img_dialog_open = Open image dialog after generation (Image mode)
1223
1234
  settings.img_prompt_model = Prompt generation model
1235
+ settings.img_prompt_model.desc = LLM used to refine your prompt before image generation (not the image model)
1224
1236
  settings.img_quality = Image quality
1225
1237
  settings.img_resolution = Image size
1226
1238
  settings.layout.animation.disable = Disable animations
@@ -1320,7 +1332,9 @@ settings.prompt.ctx.auto_summary.user.desc = Placeholders: {input}, {output}
1320
1332
  settings.prompt.expert = Expert: Master prompt
1321
1333
  settings.prompt.expert.desc = Instruction (system prompt) for Master expert on how to handle slave experts. Instructions for slave experts are given from their presets.
1322
1334
  settings.prompt.img = Image generation
1323
- settings.prompt.img.desc = Prompt for generating prompts for DALL-E (if raw-mode is disabled). Image mode only.
1335
+ settings.prompt.img.desc = Prompt for generating prompts for image model (if raw-mode is disabled). Image / Video modes only.
1336
+ settings.prompt.video = Video generation
1337
+ settings.prompt.video.desc = Prompt for generating prompts for the video model (if raw-mode is disabled). Image / Video mode only.
1324
1338
  settings.remote_tools.code_interpreter = Code Interpreter
1325
1339
  settings.remote_tools.code_interpreter.desc = Enable `code_interpreter` remote tool - Responses API only.
1326
1340
  settings.remote_tools.file_search = File search
@@ -1372,7 +1386,9 @@ settings.section.ctx = Context
1372
1386
  settings.section.debug = Debug
1373
1387
  settings.section.files = Files and attachments
1374
1388
  settings.section.general = General
1375
- settings.section.images = Images
1389
+ settings.section.images = Images and video
1390
+ settings.section.images.image = Image
1391
+ settings.section.images.video = Video
1376
1392
  settings.section.layout = Layout
1377
1393
  settings.section.llama_index = Indexes / LlamaIndex
1378
1394
  settings.section.llama-index.chat = Chat
@@ -1401,6 +1417,22 @@ settings.upload.data_dir.desc = Enable to store everything in a single data dire
1401
1417
  settings.upload.store = Store attachments in the workdir upload directory
1402
1418
  settings.upload.store.desc = Enable to store a local copy of uploaded attachments for future use
1403
1419
  settings.use_context = Use context (memory)
1420
+ settings.video.aspect_ratio = Aspect ratio
1421
+ settings.video.aspect_ratio.desc = Frame aspect ratio (e.g., 16:9, 9:16, 1:1); availability depends on the selected model
1422
+ settings.video.duration = Video duration
1423
+ settings.video.duration.desc = Clip length in seconds; limits may vary by model
1424
+ settings.video.fps = FPS
1425
+ settings.video.fps.desc = Frames per second (e.g., 24, 25, 30); may be rounded or ignored by the model
1426
+ settings.video.generate_audio = Generate audio
1427
+ settings.video.generate_audio.desc = Include synthesized background audio if supported by the model
1428
+ settings.video.negative_prompt = Negative prompt
1429
+ settings.video.negative_prompt.desc = Words or phrases to avoid in the output (comma-separated)
1430
+ settings.video.prompt_model = Prompt enhancement model
1431
+ settings.video.prompt_model.desc = LLM used to refine your prompt before video generation (not the video model)
1432
+ settings.video.resolution = Video resolution
1433
+ settings.video.resolution.desc = Target output resolution (e.g., 720p, 1080p); availability depends on the model
1434
+ settings.video.seed = Seed
1435
+ settings.video.seed.desc = Optional random seed for reproducible results; leave empty for random
1404
1436
  settings.vision.capture.auto = Auto capture
1405
1437
  settings.vision.capture.enabled = Camera
1406
1438
  settings.vision.capture.height = Camera height (px)
@@ -1562,6 +1594,10 @@ updater.check.launch = Check on launch
1562
1594
  update.released = build
1563
1595
  update.snap = Go to Snap Store
1564
1596
  update.title = Check for Updates
1597
+ vid.status.downloading = Downloading video... please wait...
1598
+ vid.status.generating = Generating video from
1599
+ vid.status.prompt.error = Enhancement prompt error occurred
1600
+ vid.status.prompt.wait = Preparing prompt... please wait...
1565
1601
  vision.capture.auto = Auto capture
1566
1602
  vision.capture.auto.click = Auto-capture is enabled!
1567
1603
  vision.capture.auto.label = Auto capture enabled
@@ -1575,6 +1611,3 @@ vision.capture.manual.captured.success = Image captured from the camera:
1575
1611
  vision.capture.name.prefix = Camera capture:
1576
1612
  vision.capture.options.title = Video capture
1577
1613
  vision.checkbox.tooltip = If checked, the vision model is active. It will be automatically activated upon image upload. You can deactivate it in real-time.
1578
-
1579
- settings.audio.input.vad.prefix = VAD prefix padding (in ms)
1580
- settings.audio.input.vad.silence = VAD end silence (in ms)
@@ -191,6 +191,7 @@ attachments_uploaded.tab = Archivos subidos
191
191
  audio.cache.clear.confirm = ¿Está seguro de querer eliminar todos los archivos de audio en caché?
192
192
  audio.cache.clear.success = OK. Todos los archivos de caché de audio fueron eliminados.
193
193
  audio.control.btn = Control de voz
194
+ audio.loop = Bucle
194
195
  audio.magic_word.detected = ¡Palabra mágica detectada!
195
196
  audio.magic_word.invalid = No es una palabra mágica :(
196
197
  audio.magic_word.please = Por favor, una palabra mágica...
@@ -855,7 +856,7 @@ mode.computer = Uso de la computadora
855
856
  mode.computer.tooltip = Uso de la computadora (ratón, teclado, navegación)
856
857
  mode.expert = Expertos (cooperación)
857
858
  mode.expert.tooltip = Llamar a expertos en segundo plano
858
- mode.img = Imagen
859
+ mode.img = Imagen y video
859
860
  mode.img.tooltip = Generar imagen usando DALL-E
860
861
  mode.langchain = Langchain
861
862
  mode.langchain.tooltip = Chatear con modelos proporcionados por Langchain
@@ -1128,6 +1129,8 @@ settings.audio.input.stop_interval.desc = Intervalo en segundos para transcribir
1128
1129
  settings.audio.input.timeout = Tiempo de espera de grabación
1129
1130
  settings.audio.input.timeout.continuous = Habilitar tiempo de espera en modo continuo
1130
1131
  settings.audio.input.timeout.desc = Tiempo de espera (segundos) para detener la grabación automáticamente, 0 para deshabilitar, por defecto: 120
1132
+ settings.audio.input.vad.prefix = Relleno de prefijo VAD (en ms)
1133
+ settings.audio.input.vad.silence = Silencio de final VAD (en ms)
1131
1134
  settings.audio.output.backend = Backend para la salida de audio
1132
1135
  settings.audio.output.backend.desc = Selecciona el backend para la salida de audio.
1133
1136
  settings.audio.output.device = Dispositivo para la salida de audio
@@ -1199,6 +1202,7 @@ settings.func_call.native = Usar llamadas a funciones API nativas
1199
1202
  settings.func_call.native.desc = Si está habilitado, la aplicación usará llamadas a funciones API nativas en lugar del formato pygpt interno y los prompt de comandos a continuación no se usarán. Solo modos de Chat y Asistentes.
1200
1203
  settings.img_dialog_open = Abrir diálogo de imagen después de generar (Modo imagen)
1201
1204
  settings.img_prompt_model = Modelo de generación de indicaciones
1205
+ settings.img_prompt_model.desc = LLM utilizado para refinar su indicación antes de la generación de imágenes (no el modelo de imágenes)
1202
1206
  settings.img_quality = Calidad de imagen
1203
1207
  settings.img_resolution = Tamaño de imagen
1204
1208
  settings.layout.animation.disable = Desactivar animaciones
@@ -1297,6 +1301,8 @@ settings.prompt.expert = Experto: Master prompt
1297
1301
  settings.prompt.expert.desc = Instrucción (prompt del sistema) para el experto Master cómo manejar a los expertos subordinados. Las instrucciones para los expertos subordinados se dan desde sus presets.
1298
1302
  settings.prompt.img = Generación de imagen
1299
1303
  settings.prompt.img.desc = Mensaje para generar comandos para DALL-E (si el modo crudo está desactivado). Solo modo de imagen.
1304
+ settings.prompt.video = Generación de video
1305
+ settings.prompt.video.desc = Indicaciones para generar indicaciones para el modelo de video (si el modo sin formato está desactivado). Solo modo Imagen/Videos.
1300
1306
  settings.remote_tools.code_interpreter = Intérprete de Código
1301
1307
  settings.remote_tools.code_interpreter.desc = Habilitar herramienta remota `code_interpreter` en modo Chat / vía API de Respuestas de OpenAI.
1302
1308
  settings.remote_tools.file_search = File search
@@ -1340,7 +1346,9 @@ settings.section.ctx = Contexto
1340
1346
  settings.section.debug = Depuración
1341
1347
  settings.section.files = Archivos y adjuntos
1342
1348
  settings.section.general = General
1343
- settings.section.images = Imágenes
1349
+ settings.section.images = Imágenes y vídeo
1350
+ settings.section.images.image = Imagen
1351
+ settings.section.images.video = Video
1344
1352
  settings.section.layout = Diseño
1345
1353
  settings.section.llama_index = Índices / LlamaIndex
1346
1354
  settings.section.llama-index.chat = Chat
@@ -1368,6 +1376,22 @@ settings.upload.data_dir.desc = Habilite para almacenar todo en un único direct
1368
1376
  settings.upload.store = Almacenar adjuntos en el directorio de subida del directorio de trabajo
1369
1377
  settings.upload.store.desc = Habilitar el almacenamiento de una copia local de los adjuntos subidos para su uso futuro
1370
1378
  settings.use_context = Utilizar contexto (memoria)
1379
+ settings.video.aspect_ratio = Relación de aspecto
1380
+ settings.video.aspect_ratio.desc = Relación de aspecto del cuadro (por ejemplo, 16:9, 9:16, 1:1); la disponibilidad depende del modelo seleccionado
1381
+ settings.video.duration = Duración de video
1382
+ settings.video.duration.desc = Longitud del clip en segundos; los límites pueden variar según el modelo
1383
+ settings.video.fps = FPS
1384
+ settings.video.fps.desc = Fotogramas por segundo (por ejemplo, 24, 25, 30); puede ser redondeado o ignorado por el modelo
1385
+ settings.video.generate_audio = Generar audio
1386
+ settings.video.generate_audio.desc = Incluir audio de fondo sintetizado si es compatible con el modelo
1387
+ settings.video.negative_prompt = Indicaciones negativas
1388
+ settings.video.negative_prompt.desc = Palabras o frases a evitar en el resultado (separadas por comas)
1389
+ settings.video.prompt_model = Modelo de mejora de indicación
1390
+ settings.video.prompt_model.desc = LLM utilizado para refinar su indicación antes de la generación de video (no el modelo de video)
1391
+ settings.video.resolution = Resolución de video
1392
+ settings.video.resolution.desc = Resolución de salida objetivo (por ejemplo, 720p, 1080p); la disponibilidad depende del modelo
1393
+ settings.video.seed = Semilla
1394
+ settings.video.seed.desc = Semilla aleatoria opcional para resultados reproducibles; déjelo vacío para aleatorio
1371
1395
  settings.vision.capture.auto = Captura automática
1372
1396
  settings.vision.capture.enabled = Cámara
1373
1397
  settings.vision.capture.height = Altura de captura de cámara (px)
@@ -1527,6 +1551,10 @@ updater.check.launch = Comprobar al iniciar
1527
1551
  update.released = Versión
1528
1552
  update.snap = Ir a Snap Store
1529
1553
  update.title = Buscando actualizaciones
1554
+ vid.status.downloading = Descargando video... por favor espere...
1555
+ vid.status.generating = Generando video desde
1556
+ vid.status.prompt.error = Ocurrió un error al mejorar la indicación
1557
+ vid.status.prompt.wait = Preparando indicación... por favor espere...
1530
1558
  vision.capture.auto = Captura automática
1531
1559
  vision.capture.auto.click = ¡La captura automática está habilitada!
1532
1560
  vision.capture.auto.label = Captura automática habilitada
@@ -191,6 +191,7 @@ attachments_uploaded.tab = Fichiers téléchargés
191
191
  audio.cache.clear.confirm = Êtes-vous sûr de vouloir supprimer tous les fichiers audio en cache ?
192
192
  audio.cache.clear.success = OK. Tous les fichiers de cache audio ont été effacés.
193
193
  audio.control.btn = Contrôle vocal
194
+ audio.loop = Boucle
194
195
  audio.magic_word.detected = Mot magique détecté !
195
196
  audio.magic_word.invalid = Pas un mot magique :(
196
197
  audio.magic_word.please = S'il vous plaît, le mot magique...
@@ -854,7 +855,7 @@ mode.computer = Utilisation de l'ordinateur
854
855
  mode.computer.tooltip = Utilisation de l'ordinateur (souris, clavier, navigation)
855
856
  mode.expert = Experts (co-opération)
856
857
  mode.expert.tooltip = Appeler des experts en arrière-plan
857
- mode.img = Image
858
+ mode.img = Image et vidéo
858
859
  mode.img.tooltip = Génération d'image avec DALL-E
859
860
  mode.langchain = Langchain
860
861
  mode.langchain.tooltip = Discussion avec les modèles fournis par Langchain
@@ -1127,6 +1128,8 @@ settings.audio.input.stop_interval.desc = Intervalle en secondes pour la transcr
1127
1128
  settings.audio.input.timeout = Délai d'enregistrement
1128
1129
  settings.audio.input.timeout.continuous = Activer le délai en mode continu
1129
1130
  settings.audio.input.timeout.desc = Délai (secondes) pour l'arrêt automatique de l'enregistrement, 0 pour désactiver, par défaut : 120
1131
+ settings.audio.input.vad.prefix = Padding du préfixe VAD (en ms)
1132
+ settings.audio.input.vad.silence = Silence de fin VAD (en ms)
1130
1133
  settings.audio.output.backend = Backend pour la sortie audio
1131
1134
  settings.audio.output.backend.desc = Sélectionnez le backend pour la sortie audio.
1132
1135
  settings.audio.output.device = Périphérique pour la sortie audio
@@ -1198,6 +1201,7 @@ settings.func_call.native = Utiliser les appels de fonction API natives
1198
1201
  settings.func_call.native.desc = Si activé, l'application utilisera les appels de fonction API natives au lieu du format interne de pygpt et les commandes prompt ci-dessous ne seront pas utilisées. Modes uniquement Chat et Assistants.
1199
1202
  settings.img_dialog_open = Ouvrir la boîte de dialogue d'image après la génération (Mode image)
1200
1203
  settings.img_prompt_model = Modèle de génération d'invite
1204
+ settings.img_prompt_model.desc = LLM utilisé pour affiner votre invite avant la génération d'images (pas le modèle d'image)
1201
1205
  settings.img_quality = Qualité d'image
1202
1206
  settings.img_resolution = Taille de l'image
1203
1207
  settings.layout.animation.disable = Désactiver les animations
@@ -1296,6 +1300,8 @@ settings.prompt.expert = Expert : Master prompt
1296
1300
  settings.prompt.expert.desc = Instruction (prompt système) pour l'expert Master sur comment gérer les experts esclaves. Les instructions pour les experts esclaves sont données à partir de leurs presets.
1297
1301
  settings.prompt.img = Génération d'image
1298
1302
  settings.prompt.img.desc = Prompt pour générer des commandes pour DALL-E (si le mode brut est désactivé). Mode image uniquement.
1303
+ settings.prompt.video = Génération de vidéo
1304
+ settings.prompt.video.desc = Invite pour générer des invites pour le modèle vidéo (si le mode brut est désactivé). Mode Image/Vidéo uniquement.
1299
1305
  settings.remote_tools.code_interpreter = Interpréteur de code
1300
1306
  settings.remote_tools.code_interpreter.desc = Activer l'outil distant `code_interpreter` en mode Chat/ via OpenAI Responses API.
1301
1307
  settings.remote_tools.file_search = File search
@@ -1339,7 +1345,9 @@ settings.section.ctx = Contexte
1339
1345
  settings.section.debug = Débogage
1340
1346
  settings.section.files = Fichiers et pièces jointes
1341
1347
  settings.section.general = Général
1342
- settings.section.images = Images
1348
+ settings.section.images = Images et vidéos
1349
+ settings.section.images.image = Image
1350
+ settings.section.images.video = Vidéo
1343
1351
  settings.section.layout = Mise en page
1344
1352
  settings.section.llama_index = Indexes / LlamaIndex
1345
1353
  settings.section.llama-index.chat = Chat
@@ -1367,6 +1375,22 @@ settings.upload.data_dir.desc = Activez pour stocker tout dans un seul répertoi
1367
1375
  settings.upload.store = Stocker les pièces jointes dans le répertoire d'upload du répertoire de travail
1368
1376
  settings.upload.store.desc = Activer le stockage d'une copie locale des pièces jointes téléchargées pour une utilisation future
1369
1377
  settings.use_context = Utiliser le contexte (mémoire)
1378
+ settings.video.aspect_ratio = Ratio d'aspect
1379
+ settings.video.aspect_ratio.desc = Ratio d'aspect du cadre (ex. : 16:9, 9:16, 1:1); la disponibilité dépend du modèle sélectionné
1380
+ settings.video.duration = Durée de la vidéo
1381
+ settings.video.duration.desc = Longueur du clip en secondes; les limites peuvent varier selon le modèle
1382
+ settings.video.fps = FPS
1383
+ settings.video.fps.desc = Images par seconde (ex. : 24, 25, 30); peut être arrondi ou ignoré par le modèle
1384
+ settings.video.generate_audio = Générer de l'audio
1385
+ settings.video.generate_audio.desc = Inclure un fond audio synthétisé si pris en charge par le modèle
1386
+ settings.video.negative_prompt = Invite négative
1387
+ settings.video.negative_prompt.desc = Mots ou phrases à éviter dans le résultat (séparés par des virgules)
1388
+ settings.video.prompt_model = Modèle d'amélioration de l'invite
1389
+ settings.video.prompt_model.desc = LLM utilisé pour affiner votre invite avant la génération de la vidéo (pas le modèle vidéo)
1390
+ settings.video.resolution = Résolution vidéo
1391
+ settings.video.resolution.desc = Résolution de sortie cible (ex. : 720p, 1080p); la disponibilité dépend du modèle
1392
+ settings.video.seed = Graine
1393
+ settings.video.seed.desc = Graine aléatoire facultative pour des résultats reproductibles; laisser vide pour aléatoire
1370
1394
  settings.vision.capture.auto = Capture automatique
1371
1395
  settings.vision.capture.enabled = Caméra
1372
1396
  settings.vision.capture.height = Hauteur de capture par caméra (px)
@@ -1526,6 +1550,10 @@ updater.check.launch = Vérifier au démarrage
1526
1550
  update.released = build
1527
1551
  update.snap = Aller au Snap Store
1528
1552
  update.title = Vérification des mises à jour
1553
+ vid.status.downloading = Téléchargement de la vidéo... veuillez patienter...
1554
+ vid.status.generating = Génération de la vidéo à partir de
1555
+ vid.status.prompt.error = Une erreur est survenue lors de l'amélioration de l'invite
1556
+ vid.status.prompt.wait = Préparation de l'invite... veuillez patienter...
1529
1557
  vision.capture.auto = Capture automatique
1530
1558
  vision.capture.auto.click = La capture automatique est activée !
1531
1559
  vision.capture.auto.label = Capture automatique activée