llmboost-hub 0.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -0,0 +1,126 @@
1
+ import socket
2
+ import subprocess
3
+ import re
4
+
5
+
6
def container_name_for_model(model_id: str) -> str:
    """
    Build the container name that lbh run uses for a given model id.

    Every ':' and '/' in the id is replaced with '_'. A falsy id (None, "")
    yields an empty string.
    """
    name = str(model_id or "")
    for separator in (":", "/"):
        name = name.replace(separator, "_")
    return name
11
+
12
+
13
def _port_open(host: str, port: int, timeout: float = 0.5) -> bool:
    """
    Probe host:port with a TCP connect and report whether it succeeded.

    Any exception raised while connecting (refused, timed out, bad address, ...)
    is treated as "not open".
    """
    try:
        probe = socket.create_connection((host, port), timeout=timeout)
        # The successful connect is the whole test; release the socket right away.
        probe.close()
    except Exception:
        return False
    return True
22
+
23
+
24
+ def _llmboost_proc_and_port(cname: str) -> tuple[bool, int | None]:
25
+ """
26
+ Inspect running processes and detect llmboost serve and its port.
27
+ Returns (running, port) where:
28
+ - running=True if a 'llmboost serve' command is found
29
+ - port is the integer parsed from '--port <n>' or '--port=<n>' if present; otherwise None
30
+ """
31
+ try:
32
+ cmd = ["docker", "exec", cname, "sh", "-lc", "ps -eo pid,cmd"]
33
+ res = subprocess.run(cmd, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
34
+ if res.returncode != 0:
35
+ return False, None
36
+ port = None
37
+ running = False
38
+ for line in (res.stdout or "").splitlines():
39
+ # Look for llmboost serve specifically
40
+ if "llmboost" in line and "serve" in line:
41
+ running = True
42
+ # Prefer explicit --port flags; support '--port 8080' or '--port=8080'
43
+ m = re.search(r"--port(?:\s*=\s*|\s+)(\d+)", line)
44
+ if m:
45
+ try:
46
+ port = int(m.group(1))
47
+ except Exception:
48
+ port = None
49
+ # Do not break; last occurrence wins in case of multiple matches
50
+ return running, port
51
+ except Exception:
52
+ return False, None
53
+
54
+
55
def is_container_running(container_name: str) -> bool:
    """
    Ask docker whether `container_name` is currently running.

    Reads `{{.State.Running}}` via `docker inspect` and compares it, case-insensitively,
    with "true". Returns False when the command fails or anything raises.
    """
    inspect_argv = ["docker", "inspect", "-f", "{{.State.Running}}", container_name]
    try:
        state = subprocess.check_output(
            inspect_argv, text=True, stderr=subprocess.DEVNULL
        )
        state = state.strip()
        return state.lower() == "true"
    except Exception:
        return False
68
+
69
+
70
def _llmboost_tuner_running(cname: str) -> bool:
    """
    Report whether container `cname` has a process line mentioning llmboost tuner.

    Runs `ps -eo pid,cmd` through `docker exec`; a line counts when it contains
    both "llmboost" and "tuner". Returns False when the docker command exits
    non-zero or anything raises.
    """
    try:
        ps_argv = ["docker", "exec", cname, "sh", "-lc", "ps -eo pid,cmd"]
        proc = subprocess.run(
            ps_argv, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True
        )
        if proc.returncode != 0:
            return False
        return any(
            "llmboost" in entry and "tuner" in entry
            for entry in (proc.stdout or "").splitlines()
        )
    except Exception:
        return False
85
+
86
+
87
def is_model_tuning(container_name: str) -> bool:
    """
    Report whether the container is running with an active llmboost tuner process.

    The process check is only attempted when the container itself is running.
    """
    return is_container_running(container_name) and _llmboost_tuner_running(
        container_name
    )
94
+
95
+
96
def is_model_initializing(container_name: str, host: str = "127.0.0.1") -> bool:
    """
    Report whether the model is still starting up.

    True only when all of the following hold:
    - the container is running
    - an llmboost serve process was found inside it
    - the expected port (parsed from '--port' on the process line, else 8080)
      does not yet accept TCP connections on `host`
    """
    if not is_container_running(container_name):
        return False

    serve_running, serve_port = _llmboost_proc_and_port(container_name)
    if serve_running:
        target_port = serve_port or 8080
        return not _port_open(host, target_port, timeout=0.2)
    return False
110
+
111
+
112
def is_model_ready2serve(
    container_name: str, host: str = "127.0.0.1", port: int | None = None
) -> bool:
    """
    Report whether the model is up and accepting connections.

    True when an llmboost serve process is found inside the container AND the
    chosen TCP port accepts a connection on `host`.

    Port choice, in order of preference: the '--port' value parsed from the
    process command line, then the `port` argument, then 8080.
    """
    serve_running, parsed_port = _llmboost_proc_and_port(container_name)
    if serve_running:
        chosen_port = parsed_port or port or 8080
        return _port_open(host, chosen_port, timeout=0.2)
    return False
@@ -0,0 +1,42 @@
1
+ import os
2
+ import hashlib
3
+
4
+
5
def path_has_files(path: str) -> bool:
    """
    Tell whether `path` is a directory holding at least one file anywhere below it.

    Returns False when `path` is not a directory (missing, or a regular file).
    """
    if os.path.isdir(path):
        # os.walk yields (dirpath, dirnames, filenames); any non-empty filenames wins
        return any(filenames for _dirpath, _dirnames, filenames in os.walk(path))
    return False
15
+
16
+
17
def dir_size_bytes(path: str) -> int:
    """
    Sum the sizes, in bytes, of every file found under `path` (best-effort).

    Files whose size cannot be read are skipped rather than reported.
    """
    size_sum = 0
    for dirpath, _dirnames, filenames in os.walk(path):
        for filename in filenames:
            full_path = os.path.join(dirpath, filename)
            try:
                size_sum += os.path.getsize(full_path)
            except Exception:
                # best-effort: an unreadable entry simply does not count
                continue
    return size_sum
29
+
30
+
31
def sha256_file(path: str, bufsize: int = 1024 * 1024) -> str:
    """
    Return the hex SHA-256 digest of the file at `path`.

    The file is read in chunks of `bufsize` bytes so it never has to fit in memory.
    """
    digest = hashlib.sha256()
    with open(path, "rb") as stream:
        # iter() with a sentinel stops at the first empty read (end of file)
        for chunk in iter(lambda: stream.read(bufsize), b""):
            digest.update(chunk)
    return digest.hexdigest()
@@ -0,0 +1,132 @@
1
+ #!/usr/bin/env python3
2
+ import argparse
3
+ import os
4
+ import re
5
+ from itertools import product, islice
6
+ from typing import Iterable, List
7
+
8
+ import pandas as pd
9
+
10
+
11
def _infer_backend(gpu: str) -> str:
    """
    Map a GPU family label to the docker backend name.

    Args:
        gpu: GPU family label (e.g., 'A100', 'MI300X').

    Returns:
        'rocm' when the label starts with 'MI' (case-insensitive), 'cuda' otherwise.
    """
    if re.match(r"^MI", gpu, re.IGNORECASE) is None:
        return "cuda"
    return "rocm"
26
+
27
+
28
def _default_models() -> List[str]:
    """Return a fresh list with the model ids used for sampling."""
    pool = (
        "llama2-7b",
        "llama2-13b",
        "mistral-7b",
        "mixtral-8x7b",
        "gemma-2b",
        "gemma-7b",
    )
    return list(pool)
38
+
39
+
40
def _default_gpus() -> List[str]:
    """Return a fresh list with the GPU family labels used for sampling."""
    families = ("A100", "A10", "RTX4090", "V100", "T4", "MI300X", "MI250")
    return list(families)
43
+
44
+
45
def _cycle_version(i: int, versions: List[str]) -> str:
    """Pick versions[i mod len(versions)], wrapping around the end of the list."""
    _, slot = divmod(i, len(versions))
    return versions[slot]
48
+
49
+
50
def generate_df(rows: int, repo: str, versions: List[str]) -> pd.DataFrame:
    """
    Build a sample lookup table with the columns model, gpu and docker_image.

    Rows come from the cartesian product of the default models and default GPUs,
    in product order, cut off after `rows` entries. Each docker_image follows:
        <repo>/mb-llmboost-<rocm|cuda>:<version>

    Args:
        rows: Upper bound on the number of rows produced.
        repo: Docker repository name (e.g., 'mangollm').
        versions: Versions assigned round-robin by row index.

    Returns:
        A pandas DataFrame with fields: model, gpu, docker_image.
    """

    def _row(idx, model, gpu):
        # One record; backend depends on the GPU family, version on the row index
        backend = _infer_backend(gpu)
        version = _cycle_version(idx, versions)
        return {
            "model": model,
            "gpu": gpu,
            "docker_image": f"{repo}/mb-llmboost-{backend}:{version}",
        }

    pairs: Iterable = islice(product(_default_models(), _default_gpus()), rows)
    records = [_row(idx, model, gpu) for idx, (model, gpu) in enumerate(pairs)]

    return pd.DataFrame.from_records(records, columns=["model", "gpu", "docker_image"])
79
+
80
+
81
def main():
    """
    Command-line entry point: write the sample lookup table as CSV and as JSON.

    Flags:
        --csv, --json, --rows, --repo, --versions
    """
    cli = argparse.ArgumentParser(
        description="Generate sample LLMBoost lookup data (CSV/JSON) with columns: model,gpu,docker_image"
    )
    cli.add_argument("--csv", type=str, default="lookup_sample.csv", help="Output CSV file path")
    cli.add_argument(
        "--json", type=str, default="lookup_sample.json", help="Output JSON file path"
    )
    cli.add_argument(
        "--rows",
        type=int,
        default=15,
        help="Number of rows to generate (default: 15). Rows are sampled from the cartesian product.",
    )
    cli.add_argument(
        "--repo", type=str, default="mangollm", help="Docker repo (default: mangollm)"
    )
    cli.add_argument(
        "--versions",
        type=str,
        default="1.1.0,1.1.1,1.2.0",
        help="Comma-separated list of versions to cycle through (default: 1.1.0,1.1.1,1.2.0)",
    )
    opts = cli.parse_args()

    # Split the comma-separated list, dropping blank entries
    version_list = []
    for piece in opts.versions.split(","):
        piece = piece.strip()
        if piece:
            version_list.append(piece)
    if not version_list:
        # Nothing usable was given: fall back to a single version
        version_list = ["1.1.0"]

    table = generate_df(rows=opts.rows, repo=opts.repo, versions=version_list)

    # Create the parent directory of each output (works for bare filenames too)
    for target in (opts.csv, opts.json):
        os.makedirs(os.path.dirname(os.path.abspath(target)) or ".", exist_ok=True)

    table.to_csv(opts.csv, index=False)
    table.to_json(opts.json, orient="records")

    print(f"Wrote CSV: {os.path.abspath(opts.csv)}")
    print(f"Wrote JSON: {os.path.abspath(opts.json)}")


if __name__ == "__main__":
    main()
@@ -0,0 +1,244 @@
1
+ # Copyright 2024, MangoBoost, Inc. All rights reserved.
2
+
3
+ import subprocess
4
+ import re
5
+ import math
6
+ from collections import defaultdict
7
+
8
+
9
def get_nvidia_gpus():
    """
    Detect available NVIDIA GPUs using `nvidia-smi`.

    Each GPU is reported as 'NVIDIA_<name>_<mem_gb>', where <name> is the reported
    product name with spaces turned into '-', a leading 'NVIDIA-' removed and any
    '-<n>GB' fragment dropped, and <mem_gb> is memory.total (MiB) // 1024.

    Returns:
        A list like ['NVIDIA_A100-SXM4_40']. Empty when nvidia-smi cannot be run
        or exits with an error.

    Notes:
        - A memory field that is not a plain integer (nvidia-smi prints values such
          as '[N/A]') is reported as size 0 instead of raising.
        - Lines without a comma are skipped instead of raising.
    """
    try:
        output = subprocess.check_output(
            [
                "nvidia-smi",
                "--query-gpu=name,memory.total",
                "--format=csv,noheader,nounits",
            ],
            encoding="utf-8",
        )
    except (OSError, subprocess.CalledProcessError):
        # OSError covers a missing binary (FileNotFoundError) and a non-executable one
        return []

    gpus = []
    for line in output.strip().splitlines():
        # Split on the LAST comma so a name that itself contains a comma still parses
        name, sep, mem = line.rpartition(",")
        if not sep:
            continue
        try:
            mem_gb = int(mem.strip()) // 1024
        except ValueError:
            mem_gb = 0
        name_clean = re.sub(
            r"^(NVIDIA-)+", "", name.strip().replace(" ", "-"), flags=re.IGNORECASE
        )
        name_clean = re.sub(r"-\d+GB", "", name_clean, flags=re.IGNORECASE)
        gpus.append(f"NVIDIA_{name_clean}_{mem_gb}")

    return gpus
35
+
36
+
37
def get_amd_gpus():
    """
    Detect available AMD GPUs using `rocm-smi`.

    Parses the 'GPU[n]' prefixed lines of `rocm-smi --showproductname --showmeminfo vram`,
    picking up the hex id on 'Card Model:' lines and the byte count on
    'VRAM Total Memory (B):' lines.

    Returns:
        A list like ['AMD_MI300X_128'], ordered by GPU index. An id missing from
        the lookup table is reported as 'UnknownGPU_<id>'; a missing VRAM figure
        is reported as 0. Empty when rocm-smi is absent or exits with an error.
    """
    device_names = {
        "0x74a5": "MI325X",
        "0x74a1": "MI300X",
        "0x74a0": "MI300A",
        "0x7408": "MI250X",
        "0x740c": "MI250X/MI250",
        "0x740f": "MI210",
        "0x6860": "MI25/MI25x2/V340/V320",
    }

    smi_argv = ["rocm-smi", "--showproductname", "--showmeminfo", "vram"]
    try:
        raw = subprocess.check_output(
            smi_argv,
            encoding="utf-8",
            errors="ignore",
            stderr=subprocess.DEVNULL,
        )
    except (FileNotFoundError, subprocess.CalledProcessError):
        return []

    per_gpu = defaultdict(dict)
    active = None  # index of the GPU the current line belongs to

    for row in raw.splitlines():
        header = re.match(r"GPU\[(\d+)\]", row)
        if header:
            active = int(header.group(1))

        # Ignore everything printed before the first GPU[n] line
        if active is None:
            continue

        if "VRAM Total Memory (B):" in row:
            vram = re.search(r"VRAM Total Memory \(B\):\s*(\d+)", row)
            if vram:
                per_gpu[active]["vram_bytes"] = int(vram.group(1))

        if "Card Model:" in row:
            hex_id = re.search(r"0x[0-9a-fA-F]+", row)
            if hex_id:
                per_gpu[active]["model_id"] = hex_id.group(0).lower()

    labels = []
    for index in sorted(per_gpu):
        fields = per_gpu[index]
        device_id = fields.get("model_id", "unknown")
        family = device_names.get(device_id, f"UnknownGPU_{device_id}")
        total_bytes = fields.get("vram_bytes", 0)
        if total_bytes:
            size_gb = math.ceil(total_bytes / (1024**3))
        else:
            size_gb = 0
        labels.append(f"AMD_{family}_{size_gb}")

    return labels
92
+
93
+
94
def get_gpus():
    """Return every detected GPU as <VENDOR>_<MODEL>_<SIZE>, NVIDIA entries first, then AMD."""
    detected = list(get_nvidia_gpus())
    detected.extend(get_amd_gpus())
    return detected
97
+
98
+
99
def get_gpu_count() -> int:
    """Return how many GPUs get_gpus() reports."""
    detected = get_gpus()
    return len(detected)
102
+
103
+
104
def gpu_name2family(s: str) -> str:
    """
    Reduce a GPU description to an upper-case 'family' token for comparison, e.g.:
    - 'AMD_MI300X_192' -> 'MI300X'
    - 'NVIDIA A100-SXM4-80GB' -> 'A100'
    - 'RTX4090' -> 'RTX4090'

    A falsy input (None, "") yields "".
    """
    text = str(s or "").strip()
    strip_steps = (
        (r"^(NVIDIA|AMD)[ _-]*", re.IGNORECASE),  # vendor prefix
        (r"[_ -]?\d+GB$", re.IGNORECASE),  # trailing '<n>GB'
        (r"[_-]\d+$", 0),  # trailing '_<mem>'
    )
    for pattern, flags in strip_steps:
        text = re.sub(pattern, "", text, flags=flags)
    # What is left may still be several words; the family is the first of them
    family, *_ = re.split(r"[ _-]+", text)
    return family.upper()
118
+
119
+
120
def get_curr_gpu_size():
    """
    Return the VRAM size, in whole GB, of the first GPU that can be queried.

    rocm-smi is tried first (first 'VRAM Total Memory (B)' figure), then
    nvidia-smi (first line of memory.total, in MiB). A tool that fails or gives
    nothing usable is skipped silently.

    Raises:
        ValueError: when neither tool produced a size.
    """
    # AMD: bytes -> GB
    try:
        rocm_out = subprocess.check_output(
            ["rocm-smi", "--showmeminfo", "vram"], text=True, stderr=subprocess.DEVNULL
        )
        found = re.search(r"VRAM Total Memory \(B\):\s*(\d+)", rocm_out)
        if found:
            return round(int(found.group(1)) / (1024**3))
    except Exception:
        pass

    # NVIDIA: MiB -> GB
    try:
        smi_out = subprocess.check_output(
            ["nvidia-smi", "--query-gpu=memory.total", "--format=csv,noheader,nounits"],
            text=True,
            stderr=subprocess.DEVNULL,
        )
        first_row = smi_out.strip().split("\n")[0]
        return round(int(first_row) / 1024)
    except Exception:
        pass

    raise ValueError("No GPU detected or unsupported platform for VRAM query.")
145
+
146
+
147
def _rocminfo_gpu_name(output):
    """
    Return the marketing name of the first GPU agent in `rocminfo` output, or None.

    rocminfo lists CPU agents as well, and each agent prints 'Marketing Name:'
    before its 'Device Type:' line, so a name is only accepted once the
    following 'Device Type:' says GPU. Output that contains no 'Device Type:'
    line at all falls back to the first marketing name found.
    """
    first_name = None
    pending = None
    saw_device_type = False
    for line in output.splitlines():
        if "Marketing Name:" in line:
            pending = line.split(":", 1)[1].strip()
            if first_name is None:
                first_name = pending
        elif "Device Type:" in line:
            saw_device_type = True
            if line.split(":", 1)[1].strip().upper() == "GPU" and pending:
                return pending
            # The pending name belonged to a non-GPU agent; forget it
            pending = None
    return None if saw_device_type else first_name


def get_curr_gpu_name():
    """
    Return the GPU model name of the first detected GPU.

    Sources are tried in order, and a source that fails or yields nothing is
    skipped silently:
    1. rocminfo   - marketing name of the first agent whose device type is GPU
                    (CPU agents are skipped)
    2. nvidia-smi - first line of `--query-gpu=name`
    3. lspci      - text after the last ':' on the first VGA / 3D controller /
                    processing-accelerator line

    Raises:
        ValueError: when no source produced a name.
    """
    try:
        output = subprocess.check_output(["rocminfo"], text=True, stderr=subprocess.DEVNULL)
        name = _rocminfo_gpu_name(output)
        if name is not None:
            return name
    except Exception:
        pass

    try:
        output = subprocess.check_output(
            [
                "nvidia-smi",
                "--query-gpu=name",
                "--format=csv,noheader",
            ],
            text=True,
            stderr=subprocess.DEVNULL,
        )
        return output.strip().split("\n")[0]
    except Exception:
        pass

    try:
        output = subprocess.check_output(["lspci"], text=True, stderr=subprocess.DEVNULL)
        for line in output.splitlines():
            if any(x in line for x in ["VGA", "3D controller", "Processing accelerators"]):
                return line.split(":")[-1].strip()
    except Exception:
        pass

    raise ValueError("No GPU detected or unsupported platform for name query.")
180
+
181
+
182
def _nvidia_field_to_int(field):
    """Parse one nvidia-smi CSV field as int; blank or non-numeric ('[N/A]') counts as 0."""
    try:
        return int(field or 0)
    except ValueError:
        return 0


def any_gpu_in_use() -> bool:
    """
    Return True if any detected GPU shows non-zero compute or VRAM usage.

    NVIDIA:
    - Uses nvidia-smi to check utilization.gpu (%), utilization.memory (%), and memory.used (MiB).
    - A field that is not a plain integer (e.g. '[N/A]') counts as 0 for that field
      only; the remaining fields and the remaining GPUs are still checked.
    AMD:
    - Uses rocm-smi to check GPU use (%) and VRAM Used (B).

    A tool that is missing or fails is skipped; False is returned when no check
    reports usage.
    """
    # NVIDIA check
    try:
        output = subprocess.check_output(
            [
                "nvidia-smi",
                "--query-gpu=utilization.gpu,utilization.memory,memory.used",
                "--format=csv,noheader,nounits",
            ],
            encoding="utf-8",
            stderr=subprocess.DEVNULL,
        )
        for line in output.strip().splitlines():
            parts = [p.strip() for p in line.split(",")]
            if len(parts) >= 3 and any(_nvidia_field_to_int(p) > 0 for p in parts[:3]):
                return True
    except Exception:
        pass

    # AMD compute usage (%)
    try:
        out_use = subprocess.check_output(
            ["rocm-smi", "--showuse"],
            encoding="utf-8",
            errors="ignore",
            stderr=subprocess.DEVNULL,
        )
        # Look for lines like "GPU use (%): 12"
        for line in out_use.splitlines():
            m = re.search(r"GPU use\s*\(%\)\s*:\s*(\d+)", line, flags=re.IGNORECASE)
            if m and int(m.group(1)) > 0:
                return True
    except Exception:
        pass

    # AMD VRAM used (bytes)
    try:
        out_mem = subprocess.check_output(
            ["rocm-smi", "--showmeminfo", "vram"],
            encoding="utf-8",
            errors="ignore",
            stderr=subprocess.DEVNULL,
        )
        for line in out_mem.splitlines():
            m = re.search(r"VRAM Used \(B\):\s*(\d+)", line)
            if m and int(m.group(1)) > 0:
                return True
    except Exception:
        pass

    return False
@@ -0,0 +1,3 @@
1
+ # Copyright 2025, MangoBoost, Inc. All rights reserved.
2
+
3
# NOTE(review): obfuscated loader. `_` reverses its bytes argument, base64-decodes
# it and zlib-decompresses the result; the decompressed bytes are then passed to
# exec(). The payload literal visible here is only b'=' -- presumably the real
# payload was elided from this view; confirm against the shipped file.
# exec() of an embedded, unreadable payload cannot be audited from source.
_ = lambda __ : __import__('zlib').decompress(__import__('base64').b64decode(__[::-1]));exec((_)(b'='))
@@ -0,0 +1,91 @@
1
+ import os
2
+ import sys
3
+ import logging
4
+ from pathlib import Path
5
+
6
+ # Try importing the internal license checker
7
+ from llmboost_hub.utils import license_checker as _license_checker
8
+ from llmboost_hub.utils.config import config
9
+
10
+ log = logging.getLogger("LICENSE_WRAPPER")
11
+ logging.basicConfig(level=logging.INFO)
12
+
13
+
14
def is_license_valid() -> bool:
    """
    Check whether a usable license file is present.

    Behavior:
        - The license path is read from `config.LBH_LICENSE_PATH`.
        - No file at that path: logs and returns False.
        - File present and the internal checker accepts it: returns True.
        - File present but rejected: logs a warning, deletes the file (errors
          while deleting are ignored) and returns False.
        - The checker raises: logs the error, echoes it to stderr and returns False.

    Returns:
        True if a valid license is present and verified; False otherwise.
    """
    license_path = Path(config.LBH_LICENSE_PATH)

    if not license_path.exists():
        log.info(f"No license file found at {license_path}.")
        return False

    log.info(f"Checking existing license at {license_path}...")
    try:
        if _license_checker.validate_license():
            log.info("License is valid.")
            return True
        log.warning("License invalid or expired.")
        # Remove the rejected file so the same failure is not hit again
        try:
            license_path.unlink(missing_ok=True)
        except Exception:
            pass
    except Exception as e:
        log.error(f"Error validating existing license: {e}")
        print(e, file=sys.stderr)
    return False
53
+
54
+
55
def require_license(func):
    """
    Decorator for CLI commands that require a valid license.

    The wrapped command runs only when is_license_valid() is true; otherwise an
    error is logged and the process exits with status 1.
    """
    from functools import wraps

    def _gated(*args, **kwargs):
        if is_license_valid():
            return func(*args, **kwargs)
        log.error("License required. Please login using `lbh login`.")
        sys.exit(1)

    # Carry over func's name/docstring, same as applying @wraps(func)
    return wraps(func)(_gated)
68
+
69
+
70
def save_license(path: str, key: str) -> str:
    """
    Write the license key to disk at the specified path with secure permissions.

    Args:
        path: Absolute or relative file path to write the license to.
        key: The license key string; surrounding whitespace will be stripped.

    Returns:
        The absolute path where the license was written.

    Notes:
        - The file is created with mode `0o600` (user read/write) from the start,
          so the key is never on disk with wider permissions.
        - A pre-existing file keeps its old mode when opened, so the mode is
          also set explicitly after writing.
        - Missing parent directories are created.
    """
    # Make the path absolute up front so the returned value matches the contract
    license_path = Path(os.path.abspath(path))
    # Ensure containing directory exists
    license_path.parent.mkdir(parents=True, exist_ok=True)
    fd = os.open(license_path, os.O_WRONLY | os.O_CREAT | os.O_TRUNC, 0o600)
    with os.fdopen(fd, "w") as f:
        f.write(key.strip() + "\n")
    # Tighten permissions on a file that already existed with a wider mode
    os.chmod(license_path, 0o600)
    return str(license_path)
@@ -0,0 +1 @@
1
+ __version__ = "1.0.0"