ob-metaflow-extensions 1.1.64__tar.gz → 1.1.65__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of ob-metaflow-extensions might be problematic. Click here for more details.
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/PKG-INFO +1 -1
- ob-metaflow-extensions-1.1.65/metaflow_extensions/nim/plugins/__init__.py +60 -0
- ob-metaflow-extensions-1.1.65/metaflow_extensions/nim/plugins/nim.py +137 -0
- ob-metaflow-extensions-1.1.65/metaflow_extensions/nim/toplevel/mfextinit_nim.py +1 -0
- ob-metaflow-extensions-1.1.65/metaflow_extensions/nim/toplevel/nim_toplevel.py +2 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/ob_metaflow_extensions.egg-info/PKG-INFO +1 -1
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/ob_metaflow_extensions.egg-info/SOURCES.txt +4 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/setup.py +1 -1
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/README.md +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/__init__.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/config/__init__.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/plugins/__init__.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/plugins/auth_server.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/plugins/kubernetes/__init__.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/plugins/kubernetes/kubernetes_client.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/plugins/perimeters.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/profilers/__init__.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/profilers/gpu.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/remote_config.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/toplevel/__init__.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/toplevel/global_aliases_for_metaflow_package.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/toplevel/plugins/azure/__init__.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/toplevel/plugins/gcp/__init__.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/metaflow_extensions/outerbounds/toplevel/plugins/kubernetes/__init__.py +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/ob_metaflow_extensions.egg-info/dependency_links.txt +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/ob_metaflow_extensions.egg-info/requires.txt +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/ob_metaflow_extensions.egg-info/top_level.txt +0 -0
- {ob-metaflow-extensions-1.1.64 → ob-metaflow-extensions-1.1.65}/setup.cfg +0 -0
|
@@ -0,0 +1,60 @@
|
|
|
1
|
+
from functools import partial
|
|
2
|
+
from metaflow.decorators import FlowDecorator
|
|
3
|
+
from metaflow import current
|
|
4
|
+
from .nim import NimManager
|
|
5
|
+
|
|
6
|
+
|
|
7
|
+
class NimDecorator(FlowDecorator):
    """
    Flow-level decorator that makes NIM-hosted models available to a flow.

    When the flow is initialised, a `NimManager` built from this decorator's
    attributes is published on Metaflow's `current` object as `current.nim`.

    User code call
    -----------
    @nim(
        models=['meta/llama3-8b-instruct', 'meta/llama3-70b-instruct'],
        backend='managed'
    )

    Valid backend options
    ---------------------
    - 'managed': Outerbounds selects a compute provider based on the model.
    - 🚧 'dataplane': Run in your account.

    Valid model options
    ----------------
    - 'meta/llama3-8b-instruct': 8B parameter model
    - 'meta/llama3-70b-instruct': 70B parameter model
    - Upon request, any model here: https://nvcf.ngc.nvidia.com/functions?filter=nvidia-functions

    MF Add To Current
    -----------------
    current.nim

    Parameters
    ----------
    models: list[str]
        Names of the NIM models the flow wants to use.
    backend: str
        Compute provider to run the NIM container.
    """

    name = "nim"
    defaults = dict(models=[], backend="managed")

    def flow_init(
        self, flow, graph, environment, flow_datastore, metadata, logger, echo, options
    ):
        # Build the manager from the decorator's attributes first, then
        # expose it to user code under the "nim" key of `current`.
        manager = NimManager(
            models=self.attributes["models"],
            backend=self.attributes["backend"],
        )
        current._update_env({"nim": manager})
|
|
58
|
+
|
|
59
|
+
|
|
60
|
+
# Flow decorators contributed by this package, as (decorator name, class path)
# pairs; the leading dot suggests the path is relative to this module.
# NOTE(review): presumably consumed by Metaflow's extension loader to register
# @nim — confirm against the Metaflow extensions documentation.
FLOW_DECORATORS_DESC = [("nim", ".NimDecorator")]
|
|
@@ -0,0 +1,137 @@
|
|
|
1
|
+
import os
|
|
2
|
+
import time
|
|
3
|
+
import json
|
|
4
|
+
import requests
|
|
5
|
+
from urllib.parse import urlparse
|
|
6
|
+
from metaflow.metaflow_config import SERVICE_URL
|
|
7
|
+
from metaflow.metaflow_config_funcs import init_config
|
|
8
|
+
|
|
9
|
+
# ---------------------------------------------------------------------------
# Import-time bootstrap: discover which NIM models are available and how to
# reach them. This performs a network request when the module is imported.
# ---------------------------------------------------------------------------

# The auth host is the Metaflow service host with its first DNS label
# replaced by "auth" (everything after the first "." is kept).
auth_host = "auth." + urlparse(SERVICE_URL).hostname.split(".", 1)[1]
nim_info_url = "https://" + auth_host + "/generate/nim"

NVCF_URL = "https://api.nvcf.nvidia.com"
NVCF_SUBMIT_ENDPOINT = f"{NVCF_URL}/v2/nvcf/pexec/functions"
NVCF_RESULT_ENDPOINT = f"{NVCF_URL}/v2/nvcf/pexec/status"

# Populated below from the response of `nim_info_url`.
NVCF_CHAT_COMPLETION_MODELS = []
COREWEAVE_CHAT_COMPLETION_MODELS = []

# Pick the request headers: an API key from the Metaflow config wins,
# otherwise fall back to JSON-encoded headers in the environment.
conf = init_config()
if "METAFLOW_SERVICE_AUTH_KEY" in conf:
    headers = {"x-api-key": conf["METAFLOW_SERVICE_AUTH_KEY"]}
else:
    _raw_service_headers = os.environ.get("METAFLOW_SERVICE_HEADERS")
    if _raw_service_headers is None:
        # Without this check json.loads(None) fails with an opaque TypeError.
        raise RuntimeError(
            "Cannot authenticate to the Outerbounds NIM service: neither "
            "METAFLOW_SERVICE_AUTH_KEY (Metaflow config) nor "
            "METAFLOW_SERVICE_HEADERS (environment variable) is set."
        )
    headers = json.loads(_raw_service_headers)

res = requests.get(nim_info_url, headers=headers)
res.raise_for_status()

# Decode the payload once and reuse it for every lookup below.
_nim_info = res.json()
NGC_API_KEY = _nim_info["nvcf"]["api_key"]
NVCF_CHAT_COMPLETION_MODELS.extend(
    {
        "name": _fn["model_key"],
        "function-id": _fn["id"],
        "version-id": _fn["version"],
    }
    for _fn in _nim_info["nvcf"]["functions"]
)
COREWEAVE_CHAT_COMPLETION_MODELS.extend(
    {"name": _container["nim_name"], "ip-address": _container["ip_addr"]}
    for _container in _nim_info["coreweave"]["containers"]
)

COMMON_HEADERS = {"accept": "application/json", "Content-Type": "application/json"}
# Separate copy so that mutating one header dict cannot leak into the other.
COREWEAVE_HEADERS = dict(COMMON_HEADERS)
NVCF_HEADERS = {**COMMON_HEADERS, "Authorization": f"Bearer {NGC_API_KEY}"}
# Seconds to wait between two NVCF status polls.
POLL_INTERVAL = 1
|
|
46
|
+
|
|
47
|
+
|
|
48
|
+
class NimManager(object):
    """Holds one `NimChatCompletion` client per requested model.

    After construction, `self.models` maps each requested model name to a
    client bound to the provider (NVCF or CoreWeave) that lists that model.

    Raises
    ------
    ValueError
        If `backend` is anything other than "managed", or if a requested
        model is listed by neither provider.
    """

    def __init__(self, models, backend):
        # Guard clause: "managed" is the only backend handled here.
        if backend != "managed":
            raise ValueError(
                f"Backend {backend} not supported by the Outerbounds @nim offering. Please reach out to Outerbounds."
            )

        nvcf_models = [entry["name"] for entry in NVCF_CHAT_COMPLETION_MODELS]
        cw_models = [entry["name"] for entry in COREWEAVE_CHAT_COMPLETION_MODELS]

        # First pass: reject the request as a whole before building any client.
        for requested in models:
            if requested in nvcf_models or requested in cw_models:
                continue
            raise ValueError(
                f"Model {requested} not supported by the Outerbounds @nim offering."
                f"\nYou can choose from these options: {nvcf_models + cw_models}\n\n"
                "Reach out to Outerbounds if there are other models you'd like supported."
            )

        # Second pass: NVCF takes precedence when both providers list a model.
        self.models = {
            requested: NimChatCompletion(
                model=requested,
                provider="NVCF" if requested in nvcf_models else "CoreWeave",
            )
            for requested in models
        }
|
|
70
|
+
|
|
71
|
+
|
|
72
|
+
class NimChatCompletion(object):
    """Callable client for a single chat-completion model.

    Parameters
    ----------
    model : str
        Model name; must appear in the model list of the chosen provider.
    provider : str
        Either "CoreWeave" (direct HTTP call to the container's IP address)
        or "NVCF" (submit to NVCF, polling for the result when needed).
    **kwargs
        Accepted for compatibility and ignored.

    Raises
    ------
    ValueError
        If `provider` is not one of the two supported values, or `model` is
        not listed for that provider.
    """

    def __init__(self, model="meta/llama3-8b-instruct", provider="CoreWeave", **kwargs):
        self.compute_provider = provider
        # Invocation ids of NVCF requests that were answered asynchronously.
        self.invocations = []

        if self.compute_provider == "CoreWeave":
            entry = self._find_model(COREWEAVE_CHAT_COMPLETION_MODELS, model)
            self.model = model
            self.ip_address = entry["ip-address"]
            self.endpoint = f"http://{self.ip_address}:8000/v1/chat/completions"

        elif self.compute_provider == "NVCF":
            entry = self._find_model(NVCF_CHAT_COMPLETION_MODELS, model)
            self.model = model
            self.function_id = entry["function-id"]
            self.version_id = entry["version-id"]

        else:
            # Fail at construction instead of returning an object whose
            # __call__ silently does nothing.
            raise ValueError(
                f"Unknown compute provider {provider!r}; expected 'CoreWeave' or 'NVCF'."
            )

    @staticmethod
    def _find_model(catalog, model):
        """Return the first catalog entry whose "name" equals `model`."""
        for entry in catalog:
            if entry["name"] == model:
                return entry
        raise ValueError(f"Model {model!r} is not in the provider's model list.")

    def __call__(self, **kwargs):
        """Send a chat-completion request and return the decoded JSON reply.

        `kwargs` become the request body; a "model" key in `kwargs`
        overrides the model name this client was created with.
        """
        if self.compute_provider == "CoreWeave":
            request_data = {"model": self.model, **kwargs}
            response = requests.post(
                self.endpoint, headers=COREWEAVE_HEADERS, json=request_data
            )
            response.raise_for_status()
            return response.json()

        if self.compute_provider == "NVCF":
            return self._call_nvcf({"model": self.model, **kwargs})

        # Only reachable if compute_provider was changed after construction.
        raise ValueError(
            f"Unknown compute provider {self.compute_provider!r}; expected 'CoreWeave' or 'NVCF'."
        )

    def _call_nvcf(self, request_data):
        """Submit `request_data` to NVCF, polling until a result is ready."""
        request_url = f"{NVCF_SUBMIT_ENDPOINT}/{self.function_id}"
        response = requests.post(request_url, headers=NVCF_HEADERS, json=request_data)
        response.raise_for_status()

        if response.status_code == 200:
            return response.json()
        if response.status_code != 202:
            # raise_for_status() only rejects 4xx/5xx, so other statuses can
            # get here; there is no invocation id to poll in that case.
            raise RuntimeError(
                f"NVCF returned {response.status_code} status code. Please contact Outerbounds."
            )

        invocation_id = response.headers.get("NVCF-REQID")
        if not invocation_id:
            raise RuntimeError(
                "NVCF accepted the request but returned no NVCF-REQID header to poll. "
                "Please contact Outerbounds."
            )
        self.invocations.append(invocation_id)

        poll_request_url = f"{NVCF_RESULT_ENDPOINT}/{invocation_id}"
        while True:
            poll_response = requests.get(poll_request_url, headers=NVCF_HEADERS)
            poll_response.raise_for_status()
            # Decide on the status code alone so that an empty (falsy) JSON
            # result is still returned instead of being polled forever.
            if poll_response.status_code == 200:
                return poll_response.json()
            if poll_response.status_code != 202:
                raise RuntimeError(
                    f"NVCF returned {poll_response.status_code} status code. Please contact Outerbounds."
                )
            time.sleep(POLL_INTERVAL)
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
# NOTE(review): presumably the name of the sibling module (nim_toplevel.py in
# this directory) that Metaflow loads for this extension's top-level exports —
# confirm against the Metaflow extensions documentation.
toplevel = "nim_toplevel"
|
|
@@ -1,5 +1,9 @@
|
|
|
1
1
|
README.md
|
|
2
2
|
setup.py
|
|
3
|
+
metaflow_extensions/nim/plugins/__init__.py
|
|
4
|
+
metaflow_extensions/nim/plugins/nim.py
|
|
5
|
+
metaflow_extensions/nim/toplevel/mfextinit_nim.py
|
|
6
|
+
metaflow_extensions/nim/toplevel/nim_toplevel.py
|
|
3
7
|
metaflow_extensions/outerbounds/__init__.py
|
|
4
8
|
metaflow_extensions/outerbounds/remote_config.py
|
|
5
9
|
metaflow_extensions/outerbounds/config/__init__.py
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|