lemonade-sdk 8.1.9__py3-none-any.whl → 8.1.11__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of lemonade-sdk might be problematic. Click here for more details.
- lemonade/common/inference_engines.py +13 -4
- lemonade/common/system_info.py +570 -1
- lemonade/tools/flm/__init__.py +1 -0
- lemonade/tools/flm/utils.py +255 -0
- lemonade/tools/llamacpp/utils.py +62 -13
- lemonade/tools/server/flm.py +137 -0
- lemonade/tools/server/llamacpp.py +23 -5
- lemonade/tools/server/serve.py +292 -135
- lemonade/tools/server/static/js/chat.js +165 -82
- lemonade/tools/server/static/js/models.js +87 -54
- lemonade/tools/server/static/js/shared.js +5 -3
- lemonade/tools/server/static/logs.html +47 -0
- lemonade/tools/server/static/styles.css +159 -8
- lemonade/tools/server/static/webapp.html +28 -10
- lemonade/tools/server/tray.py +158 -38
- lemonade/tools/server/utils/macos_tray.py +226 -0
- lemonade/tools/server/utils/{system_tray.py → windows_tray.py} +13 -0
- lemonade/tools/server/webapp.py +4 -1
- lemonade/tools/server/wrapped_server.py +91 -25
- lemonade/version.py +1 -1
- lemonade_install/install.py +25 -2
- {lemonade_sdk-8.1.9.dist-info → lemonade_sdk-8.1.11.dist-info}/METADATA +9 -6
- {lemonade_sdk-8.1.9.dist-info → lemonade_sdk-8.1.11.dist-info}/RECORD +33 -28
- lemonade_server/cli.py +105 -14
- lemonade_server/model_manager.py +186 -45
- lemonade_server/pydantic_models.py +25 -1
- lemonade_server/server_models.json +162 -62
- lemonade_server/settings.py +39 -39
- {lemonade_sdk-8.1.9.dist-info → lemonade_sdk-8.1.11.dist-info}/WHEEL +0 -0
- {lemonade_sdk-8.1.9.dist-info → lemonade_sdk-8.1.11.dist-info}/entry_points.txt +0 -0
- {lemonade_sdk-8.1.9.dist-info → lemonade_sdk-8.1.11.dist-info}/licenses/LICENSE +0 -0
- {lemonade_sdk-8.1.9.dist-info → lemonade_sdk-8.1.11.dist-info}/licenses/NOTICE.md +0 -0
- {lemonade_sdk-8.1.9.dist-info → lemonade_sdk-8.1.11.dist-info}/top_level.txt +0 -0
|
@@ -24,7 +24,7 @@ class InferenceEngineDetector:
|
|
|
24
24
|
Detect all available inference engines for a specific device type.
|
|
25
25
|
|
|
26
26
|
Args:
|
|
27
|
-
device_type: "cpu", "amd_igpu", "amd_dgpu", or "npu"
|
|
27
|
+
device_type: "cpu", "amd_igpu", "amd_dgpu", "nvidia_dgpu", or "npu"
|
|
28
28
|
|
|
29
29
|
Returns:
|
|
30
30
|
dict: Engine availability information
|
|
@@ -223,17 +223,26 @@ class LlamaCppDetector(BaseEngineDetector):
|
|
|
223
223
|
"""
|
|
224
224
|
try:
|
|
225
225
|
|
|
226
|
-
if device_type not in ["cpu", "amd_igpu", "amd_dgpu"]:
|
|
226
|
+
if device_type not in ["cpu", "amd_igpu", "amd_dgpu", "nvidia_dgpu"]:
|
|
227
227
|
return None
|
|
228
228
|
|
|
229
229
|
# Check if the device is supported by the backend
|
|
230
230
|
if device_type == "cpu":
|
|
231
231
|
device_supported = True
|
|
232
|
-
elif device_type
|
|
232
|
+
elif device_type in ["amd_igpu", "amd_dgpu"]:
|
|
233
233
|
if backend == "vulkan":
|
|
234
234
|
device_supported = self._check_vulkan_support()
|
|
235
235
|
elif backend == "rocm":
|
|
236
236
|
device_supported = self._check_rocm_support(device_name.lower())
|
|
237
|
+
else:
|
|
238
|
+
device_supported = False
|
|
239
|
+
elif device_type == "nvidia_dgpu":
|
|
240
|
+
if backend == "vulkan":
|
|
241
|
+
device_supported = self._check_vulkan_support()
|
|
242
|
+
else:
|
|
243
|
+
device_supported = False
|
|
244
|
+
else:
|
|
245
|
+
device_supported = False
|
|
237
246
|
if not device_supported:
|
|
238
247
|
return {"available": False, "error": f"{backend} not available"}
|
|
239
248
|
|
|
@@ -390,7 +399,7 @@ def detect_inference_engines(device_type: str, device_name: str) -> Dict[str, Di
|
|
|
390
399
|
Helper function to detect inference engines for a device type.
|
|
391
400
|
|
|
392
401
|
Args:
|
|
393
|
-
device_type: "cpu", "amd_igpu", "amd_dgpu", or "npu"
|
|
402
|
+
device_type: "cpu", "amd_igpu", "amd_dgpu", "nvidia_dgpu", or "npu"
|
|
394
403
|
device_name: device name
|
|
395
404
|
|
|
396
405
|
Returns:
|