ConfigLMM 0.4.0 → 0.5.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGELOG.md +34 -0
- data/CNAME +1 -0
- data/Examples/.lmm.state.yaml +159 -0
- data/Examples/ConfigLMM.mm.yaml +32 -0
- data/Examples/Implemented.mm.yaml +252 -4
- data/Examples/SmallBusiness.mm.yaml +492 -0
- data/Plugins/Apps/Answer/answer.lmm.rb +165 -0
- data/Plugins/Apps/Answer/answer@.service +40 -0
- data/Plugins/Apps/ArchiSteamFarm/ArchiSteamFarm.conf.erb +0 -3
- data/Plugins/Apps/ArchiSteamFarm/ArchiSteamFarm.lmm.rb +0 -1
- data/Plugins/Apps/Authentik/Authentik-ProxyOutpost.container +7 -1
- data/Plugins/Apps/Authentik/Authentik-Server.container +6 -1
- data/Plugins/Apps/Authentik/Authentik-Worker.container +6 -1
- data/Plugins/Apps/Authentik/Authentik.conf.erb +12 -7
- data/Plugins/Apps/Authentik/Authentik.lmm.rb +226 -61
- data/Plugins/Apps/BookStack/BookStack.conf.erb +0 -3
- data/Plugins/Apps/BookStack/BookStack.container +5 -0
- data/Plugins/Apps/BookStack/BookStack.lmm.rb +14 -3
- data/Plugins/Apps/Cassandra/Cassandra.lmm.rb +9 -19
- data/Plugins/Apps/ClickHouse/ClickHouse.container +28 -0
- data/Plugins/Apps/ClickHouse/ClickHouse.lmm.rb +113 -0
- data/Plugins/Apps/ClickHouse/Config/listen.yaml +2 -0
- data/Plugins/Apps/ClickHouse/Config/logger.yaml +8 -0
- data/Plugins/Apps/ClickHouse/Config/zookeepers.yaml +5 -0
- data/Plugins/Apps/ClickHouse/Connection.rb +96 -0
- data/Plugins/Apps/Discourse/Discourse-Sidekiq.container +5 -0
- data/Plugins/Apps/Discourse/Discourse.conf.erb +1 -4
- data/Plugins/Apps/Discourse/Discourse.container +4 -0
- data/Plugins/Apps/Discourse/Discourse.lmm.rb +116 -55
- data/Plugins/Apps/Dovecot/Dovecot.lmm.rb +74 -62
- data/Plugins/Apps/ERPNext/ERPNext-Frontend.container +6 -1
- data/Plugins/Apps/ERPNext/ERPNext-Queue.container +5 -0
- data/Plugins/Apps/ERPNext/ERPNext-Scheduler.container +5 -0
- data/Plugins/Apps/ERPNext/ERPNext-Websocket.container +6 -1
- data/Plugins/Apps/ERPNext/ERPNext.container +6 -1
- data/Plugins/Apps/ERPNext/ERPNext.lmm.rb +138 -127
- data/Plugins/Apps/GitLab/GitLab.container +6 -0
- data/Plugins/Apps/GitLab/GitLab.lmm.rb +43 -49
- data/Plugins/Apps/Homepage/Homepage.conf.erb +86 -0
- data/Plugins/Apps/Homepage/Homepage.container +19 -0
- data/Plugins/Apps/Homepage/Homepage.lmm.rb +54 -0
- data/Plugins/Apps/IPFS/IPFS.conf.erb +0 -3
- data/Plugins/Apps/IPFS/IPFS.lmm.rb +0 -1
- data/Plugins/Apps/InfluxDB/InfluxDB.conf.erb +0 -3
- data/Plugins/Apps/InfluxDB/InfluxDB.lmm.rb +0 -1
- data/Plugins/Apps/Jackett/Jackett.conf.erb +0 -3
- data/Plugins/Apps/Jackett/Jackett.lmm.rb +0 -1
- data/Plugins/Apps/Jellyfin/Jellyfin.conf.erb +0 -3
- data/Plugins/Apps/Jellyfin/Jellyfin.lmm.rb +0 -1
- data/Plugins/Apps/LetsEncrypt/LetsEncrypt.lmm.rb +49 -28
- data/Plugins/Apps/LibreTranslate/LibreTranslate.container +21 -0
- data/Plugins/Apps/LibreTranslate/LibreTranslate.lmm.rb +34 -0
- data/Plugins/Apps/Lobsters/Containerfile +81 -0
- data/Plugins/Apps/Lobsters/Lobsters-Tasks.container +26 -0
- data/Plugins/Apps/Lobsters/Lobsters.conf.erb +99 -0
- data/Plugins/Apps/Lobsters/Lobsters.container +27 -0
- data/Plugins/Apps/Lobsters/Lobsters.lmm.rb +196 -0
- data/Plugins/Apps/Lobsters/crontab +3 -0
- data/Plugins/Apps/Lobsters/database.yml +26 -0
- data/Plugins/Apps/Lobsters/entrypoint.sh +30 -0
- data/Plugins/Apps/Lobsters/generateCredentials.rb +19 -0
- data/Plugins/Apps/Lobsters/lobsters-cron.sh +25 -0
- data/Plugins/Apps/Lobsters/lobsters-daily.sh +23 -0
- data/Plugins/Apps/Lobsters/puma.rb +49 -0
- data/Plugins/Apps/MariaDB/Connection.rb +55 -0
- data/Plugins/Apps/MariaDB/MariaDB.lmm.rb +60 -53
- data/Plugins/Apps/Mastodon/Mastodon-Sidekiq.container +22 -0
- data/Plugins/Apps/Mastodon/Mastodon-Streaming.container +20 -0
- data/Plugins/Apps/Mastodon/Mastodon.conf.erb +34 -45
- data/Plugins/Apps/Mastodon/Mastodon.container +28 -0
- data/Plugins/Apps/Mastodon/Mastodon.lmm.rb +240 -5
- data/Plugins/Apps/Mastodon/configlmm.rake +30 -0
- data/Plugins/Apps/Mastodon/entrypoint.sh +16 -0
- data/Plugins/Apps/Matrix/Element.container +5 -0
- data/Plugins/Apps/Matrix/Matrix.conf.erb +2 -8
- data/Plugins/Apps/Matrix/Matrix.lmm.rb +100 -71
- data/Plugins/Apps/Matrix/Synapse.container +5 -0
- data/Plugins/Apps/Netdata/Netdata.conf.erb +0 -3
- data/Plugins/Apps/Netdata/Netdata.lmm.rb +0 -1
- data/Plugins/Apps/Nextcloud/Nextcloud.conf.erb +3 -4
- data/Plugins/Apps/Nextcloud/Nextcloud.lmm.rb +150 -68
- data/Plugins/Apps/Nextcloud/autoconfig.php +13 -0
- data/Plugins/Apps/Nextcloud/config.php +10 -1
- data/Plugins/Apps/Nextcloud/nextcloudcron.service +8 -0
- data/Plugins/Apps/Nextcloud/nextcloudcron.timer +10 -0
- data/Plugins/Apps/Nginx/Connection.rb +93 -0
- data/Plugins/Apps/Nginx/conf.d/configlmm.conf +50 -9
- data/Plugins/Apps/Nginx/conf.d/languages.conf +21 -0
- data/Plugins/Apps/Nginx/config-lmm/errors.conf +25 -20
- data/Plugins/Apps/Nginx/config-lmm/gateway-errors.conf +20 -0
- data/Plugins/Apps/Nginx/config-lmm/proxy.conf +1 -1
- data/Plugins/Apps/Nginx/main.conf.erb +7 -3
- data/Plugins/Apps/Nginx/nginx.conf +2 -2
- data/Plugins/Apps/Nginx/nginx.lmm.rb +99 -81
- data/Plugins/Apps/Nginx/proxy.conf.erb +11 -3
- data/Plugins/Apps/Odoo/Odoo.conf.erb +0 -3
- data/Plugins/Apps/Odoo/Odoo.container +5 -0
- data/Plugins/Apps/Odoo/Odoo.lmm.rb +4 -5
- data/Plugins/Apps/Ollama/Ollama.container +26 -0
- data/Plugins/Apps/Ollama/Ollama.lmm.rb +73 -0
- data/Plugins/Apps/OpenTelemetry/Config/config.yaml +704 -0
- data/Plugins/Apps/OpenTelemetry/OpenTelemetry.lmm.rb +154 -0
- data/Plugins/Apps/OpenVidu/Ingress.container +5 -0
- data/Plugins/Apps/OpenVidu/OpenVidu.conf.erb +0 -3
- data/Plugins/Apps/OpenVidu/OpenVidu.container +5 -0
- data/Plugins/Apps/OpenVidu/OpenVidu.lmm.rb +7 -3
- data/Plugins/Apps/OpenVidu/OpenViduCall.conf.erb +0 -3
- data/Plugins/Apps/OpenVidu/OpenViduCall.container +5 -0
- data/Plugins/Apps/PHP-FPM/Connection.rb +91 -0
- data/Plugins/Apps/PHP-FPM/PHP-FPM.lmm.rb +31 -4
- data/Plugins/Apps/Peppermint/Peppermint.conf.erb +2 -5
- data/Plugins/Apps/Peppermint/Peppermint.container +5 -0
- data/Plugins/Apps/Peppermint/Peppermint.lmm.rb +29 -33
- data/Plugins/Apps/Perplexica/Perplexica.container +25 -0
- data/Plugins/Apps/Perplexica/Perplexica.lmm.rb +92 -0
- data/Plugins/Apps/Perplexica/config.toml +26 -0
- data/Plugins/Apps/Podman/Connection.rb +24 -0
- data/Plugins/Apps/Podman/Podman.lmm.rb +80 -0
- data/Plugins/Apps/Podman/storage.conf +6 -0
- data/Plugins/Apps/Postfix/Postfix.lmm.rb +242 -164
- data/Plugins/Apps/PostgreSQL/Connection.rb +97 -0
- data/Plugins/Apps/PostgreSQL/PostgreSQL.lmm.rb +184 -148
- data/Plugins/Apps/Pterodactyl/Pterodactyl.conf.erb +0 -3
- data/Plugins/Apps/Pterodactyl/Pterodactyl.lmm.rb +0 -2
- data/Plugins/Apps/Pterodactyl/Wings.conf.erb +0 -3
- data/Plugins/Apps/RVM/RVM.lmm.rb +57 -0
- data/Plugins/Apps/Roundcube/Roundcube.conf.erb +0 -3
- data/Plugins/Apps/Roundcube/Roundcube.lmm.rb +15 -19
- data/Plugins/Apps/SSH/SSH.lmm.rb +9 -15
- data/Plugins/Apps/SearXNG/SearXNG.container +22 -0
- data/Plugins/Apps/SearXNG/SearXNG.lmm.rb +79 -0
- data/Plugins/Apps/SearXNG/limiter.toml +40 -0
- data/Plugins/Apps/SearXNG/settings.yml +2 -0
- data/Plugins/Apps/SigNoz/Config/alerts.yml +11 -0
- data/Plugins/Apps/SigNoz/Config/otel-collector-config.yaml +110 -0
- data/Plugins/Apps/SigNoz/Config/otel-collector-opamp-config.yaml +1 -0
- data/Plugins/Apps/SigNoz/Config/prometheus.yml +18 -0
- data/Plugins/Apps/SigNoz/SigNoz-Collector.container +23 -0
- data/Plugins/Apps/SigNoz/SigNoz-Migrator.container +17 -0
- data/Plugins/Apps/SigNoz/SigNoz.conf.erb +61 -0
- data/Plugins/Apps/SigNoz/SigNoz.container +26 -0
- data/Plugins/Apps/SigNoz/SigNoz.lmm.rb +319 -0
- data/Plugins/Apps/Solr/log4j2.xml +89 -0
- data/Plugins/Apps/Solr/solr.lmm.rb +82 -0
- data/Plugins/Apps/Sunshine/Sunshine.conf.erb +0 -3
- data/Plugins/Apps/Sunshine/Sunshine.lmm.rb +0 -1
- data/Plugins/Apps/Tunnel/tunnel.lmm.rb +33 -37
- data/Plugins/Apps/UVdesk/UVdesk.conf.erb +0 -3
- data/Plugins/Apps/Umami/Umami.container +19 -0
- data/Plugins/Apps/Umami/Umami.lmm.rb +108 -0
- data/Plugins/Apps/Valkey/Valkey.lmm.rb +54 -42
- data/Plugins/Apps/Vaultwarden/Vaultwarden.conf.erb +9 -6
- data/Plugins/Apps/Vaultwarden/Vaultwarden.container +7 -1
- data/Plugins/Apps/Vaultwarden/Vaultwarden.lmm.rb +64 -29
- data/Plugins/Apps/Wiki.js/Wiki.js.conf.erb +1 -4
- data/Plugins/Apps/Wiki.js/Wiki.js.container +5 -0
- data/Plugins/Apps/Wiki.js/Wiki.js.lmm.rb +31 -37
- data/Plugins/Apps/YaCy/YaCy.conf.erb +93 -0
- data/Plugins/Apps/YaCy/YaCy.container +21 -0
- data/Plugins/Apps/YaCy/YaCy.lmm.rb +160 -0
- data/Plugins/Apps/ZooKeeper/ZooKeeper.container +24 -0
- data/Plugins/Apps/ZooKeeper/ZooKeeper.lmm.rb +68 -0
- data/Plugins/Apps/bitmagnet/bitmagnet.conf.erb +0 -3
- data/Plugins/Apps/bitmagnet/bitmagnet.lmm.rb +0 -1
- data/Plugins/Apps/gollum/gollum.conf.erb +2 -4
- data/Plugins/Apps/gollum/gollum.container +6 -0
- data/Plugins/Apps/gollum/gollum.lmm.rb +51 -50
- data/Plugins/Apps/llama.cpp/llama.cpp.container +28 -0
- data/Plugins/Apps/llama.cpp/llama.cpp.lmm.rb +90 -0
- data/Plugins/Apps/vLLM/vLLM.container +32 -0
- data/Plugins/Apps/vLLM/vLLM.lmm.rb +89 -0
- data/Plugins/OS/General/Utils.lmm.rb +26 -0
- data/Plugins/OS/Linux/Connection.rb +472 -0
- data/Plugins/OS/Linux/Debian/preseed.cfg.erb +25 -6
- data/Plugins/OS/Linux/Flavours.yaml +13 -0
- data/Plugins/OS/Linux/Grub/grub.cfg +10 -0
- data/Plugins/OS/Linux/HTTP.rb +32 -0
- data/Plugins/OS/Linux/Linux.lmm.rb +533 -187
- data/Plugins/OS/Linux/Packages.yaml +20 -1
- data/Plugins/OS/Linux/Services.yaml +8 -0
- data/Plugins/OS/Linux/Shell.rb +70 -0
- data/Plugins/OS/Linux/Syslinux/default +8 -0
- data/Plugins/OS/Linux/WireGuard/WireGuard.lmm.rb +83 -59
- data/Plugins/OS/Linux/WireGuard/wg0.conf.erb +3 -0
- data/Plugins/OS/Linux/openSUSE/autoinst.xml.erb +29 -3
- data/Plugins/OS/Linux/systemd/systemd.lmm.rb +13 -11
- data/Plugins/OS/Routers/Aruba/ArubaInstant.lmm.rb +6 -5
- data/Plugins/Platforms/GitHub.lmm.rb +73 -28
- data/Plugins/Platforms/GoDaddy/GoDaddy.lmm.rb +9 -6
- data/Plugins/Platforms/Proxmox/Proxmox.lmm.rb +402 -0
- data/Plugins/Platforms/Proxmox/XTerm.rb +321 -0
- data/Plugins/Platforms/libvirt/libvirt.lmm.rb +38 -13
- data/Plugins/Platforms/porkbun.lmm.rb +12 -2
- data/Plugins/Platforms/porkbun_spec.rb +2 -2
- data/Plugins/Services/DNS/AmberBit.lmm.rb +1 -1
- data/Plugins/Services/DNS/ArubaItDNS.lmm.rb +1 -1
- data/Plugins/Services/DNS/NICLV.lmm.rb +1 -1
- data/Plugins/Services/DNS/PowerDNS.lmm.rb +70 -68
- data/Plugins/Services/DNS/tonic.lmm.rb +22 -12
- data/lib/ConfigLMM/Framework/plugins/dns.rb +4 -3
- data/lib/ConfigLMM/Framework/plugins/linuxApp.rb +145 -184
- data/lib/ConfigLMM/Framework/plugins/nginxApp.rb +34 -17
- data/lib/ConfigLMM/Framework/plugins/plugin.rb +53 -181
- data/lib/ConfigLMM/Framework/plugins/store.rb +4 -4
- data/lib/ConfigLMM/Framework/variables.rb +75 -0
- data/lib/ConfigLMM/Framework.rb +1 -0
- data/lib/ConfigLMM/cli.rb +12 -6
- data/lib/ConfigLMM/commands/configsCommand.rb +37 -6
- data/lib/ConfigLMM/commands/diff.rb +33 -9
- data/lib/ConfigLMM/context.rb +22 -3
- data/lib/ConfigLMM/io/configList.rb +82 -6
- data/lib/ConfigLMM/io/connection.rb +143 -0
- data/lib/ConfigLMM/io/dhcp.rb +330 -0
- data/lib/ConfigLMM/io/http.rb +78 -0
- data/lib/ConfigLMM/io/local.rb +207 -0
- data/lib/ConfigLMM/io/pxe.rb +92 -0
- data/lib/ConfigLMM/io/ssh.rb +156 -0
- data/lib/ConfigLMM/io/tftp.rb +105 -0
- data/lib/ConfigLMM/io.rb +2 -0
- data/lib/ConfigLMM/secrets/envStore.rb +39 -0
- data/lib/ConfigLMM/secrets/fileStore.rb +43 -0
- data/lib/ConfigLMM/state.rb +2 -1
- data/lib/ConfigLMM/version.rb +2 -1
- data/lib/ConfigLMM.rb +1 -0
- data/{Examples → scripts}/configlmmAuth.sh +7 -5
- metadata +205 -8
@@ -0,0 +1,90 @@
|
|
1
|
+
|
2
|
+
|
3
|
+
module ConfigLMM
    module LMM
        # Plugin that deploys llama.cpp as a Podman container unit run as a
        # user-level service of a dedicated account, and removes it again on
        # cleanup.
        class Llamacpp < Framework::Plugin

            # Account that owns the container files and runs the service.
            USER = 'llama.cpp'
            # Home directory of USER; the container unit directory is derived from it.
            HOME_DIR = '/var/lib/llama.cpp'
            # Not referenced in this file.
            # NOTE(review): presumably the host port published by
            # llama.cpp.container - confirm against that unit file.
            PORT = 18900

            # Deploys (or re-deploys) the llama.cpp container on the target host.
            #
            # Reads from +target+:
            # * 'Model'    - required; a value ending in '.gguf' is written as
            #                LLAMA_ARG_MODEL, anything else as LLAMA_ARG_HF_REPO
            # * 'Args'     - optional; substituted for the $ARGS placeholder
            # * 'Location' - passed to withConnection to reach the host
            #
            # Raises Framework::PluginProcessError when 'Model' is missing.
            def actionLlamacppDeploy(id, target, activeState, context, options)
                raise Framework::PluginProcessError, 'Model field must be set!' unless target['Model']

                self.withConnection(target['Location'], target) do |connection|
                    Linux.withConnection(connection) do |linux|
                        Podman.ensurePresent(linux, options)
                        Podman.createUser(USER, HOME_DIR, 'llama.cpp', linux, options)
                        linux.withUserShell(USER) { |userShell| userShell.createDirs(options, '~/models', '~/.cache') }

                        unitDir = Podman.containersPath(HOME_DIR)
                        envFile = "#{unitDir}/llama.cpp.env"
                        unitFile = "#{unitDir}/llama.cpp.container"

                        # Start from an empty env file, then record which model to load.
                        modelPrefix = target['Model'].end_with?('.gguf') ? 'LLAMA_ARG_MODEL=' : 'LLAMA_ARG_HF_REPO='
                        linux.fileWrite(envFile, '', options)
                        linux.fileAppend(envFile, modelPrefix + target['Model'], options)
                        linux.setUserGroup(envFile, USER, USER, options)
                        linux.setPrivate(envFile, options)

                        linux.upload(__dir__ + '/llama.cpp.container', unitDir, options)

                        # Give the service account the groups reported for the detected GPU devices.
                        devices = linux.getGPUDevices(options)
                        gpuGroups = linux.getGPUGroups(devices, options)
                        linux.userAddGroups(USER, gpuGroups, options)

                        # Only the CUDA image tag is selected. When /dev/kfd is
                        # present the ':full' tag is left as-is, because the
                        # ROCm tag ('full-rocm') is disabled in the original code.
                        imageTag = 'full-cuda' if !devices.include?('/dev/kfd') && devices.include?('nvidia.com/gpu=all')
                        linux.fileReplace(unitFile, ':full', ':' + imageTag, options) if imageTag

                        # Placeholder patterns are single-quoted, so the
                        # backslash before '$' reaches fileReplace verbatim.
                        linux.fileReplace(unitFile, '\$ARGS', target['Args'].to_s, options)

                        # '\n' is single-quoted: a literal backslash followed by
                        # 'n', not a line break.
                        # NOTE(review): presumably `escape: false` lets
                        # fileReplace expand it into separate AddDevice= lines -
                        # confirm against Linux::Connection#fileReplace.
                        deviceLines = devices.empty? ? '' : devices.map { |device| "AddDevice=#{device}" }.join('\n')
                        linux.fileReplace(unitFile, '\$DEVICES', deviceLines, { **options, escape: false })

                        linux.reloadUserServices(USER, options)
                        linux.restartUserService(USER, 'llama.cpp', options)
                    end
                end
            end

            # Stops the service and deletes its container unit for every item
            # that cleanupType yields for the :llamacpp type. With
            # options[:destroy] the service account is deleted as well. State
            # is only updated when this is not a dry run.
            def cleanup(configs, state, context, options)
                cleanupType(:llamacpp, configs, state, context, options) do |_item, id, itemState, _itemContext, itemOptions, connection|
                    Linux.withConnection(connection) do |linux|
                        linux.stopUserService(USER, 'llama.cpp', itemOptions)

                        unitDir = Podman.containersPath(HOME_DIR)
                        # rm receives the dry-run flag itself, not the options hash.
                        linux.rm(unitDir + '/llama.cpp.container', itemOptions[:dry])

                        linux.reloadUserServices(USER, itemOptions)

                        itemState.item(id)['Status'] = State::STATUS_DELETED unless itemOptions[:dry]

                        # Everything below applies to a full destroy only.
                        next unless itemOptions[:destroy]

                        linux.deleteUserAndGroup(USER, itemOptions)
                        itemState.item(id)['Status'] = State::STATUS_DESTROYED unless itemOptions[:dry]
                    end
                end
            end

        end
    end
end
|
90
|
+
|
@@ -0,0 +1,32 @@
|
|
1
|
+
|
2
|
+
[Unit]
|
3
|
+
Description=vLLM container
|
4
|
+
After=local-fs.target
|
5
|
+
|
6
|
+
[Container]
|
7
|
+
ContainerName=vLLM
|
8
|
+
Image=$IMAGE
|
9
|
+
Entrypoint=["python3", "-m", "vllm.entrypoints.openai.api_server"]
|
10
|
+
Exec=$ARGS
|
11
|
+
EnvironmentFile=/var/lib/vllm/.config/containers/systemd/vLLM.env
|
12
|
+
PublishPort=127.0.0.1:18050:8000
|
13
|
+
UserNS=keep-id:uid=1000,gid=1000
|
14
|
+
# Need newer Podman to use this
|
15
|
+
#GroupAdd=keep-groups
|
16
|
+
PodmanArgs=--group-add keep-groups
|
17
|
+
#PodmanArgs=--passwd-entry 'vllm:x:1000:1000:vLLM:/home/vllm:/bin/bash'
|
18
|
+
Volume=/var/lib/vllm/.cache:/app/.cache
|
19
|
+
Volume=/var/lib/vllm/.triton:/app/.triton
|
20
|
+
Volume=/var/lib/vllm/.cache:/root/.cache
|
21
|
+
Volume=/var/lib/vllm/.cache:/workspace/.cache
|
22
|
+
ShmSize=1G
|
23
|
+
$DEVICES
|
24
|
+
LogDriver=journald
|
25
|
+
AutoUpdate=registry
|
26
|
+
|
27
|
+
[Service]
|
28
|
+
TimeoutStartSec=12min
|
29
|
+
Restart=on-failure
|
30
|
+
|
31
|
+
[Install]
|
32
|
+
WantedBy=multi-user.target default.target
|
@@ -0,0 +1,89 @@
|
|
1
|
+
|
2
|
+
|
3
|
+
module ConfigLMM
    module LMM
        # Plugin that deploys vLLM as a Podman container unit run as a
        # user-level service of a dedicated account, and removes it again on
        # cleanup.
        class VLLM < Framework::Plugin

            # Account that owns the container files and runs the service.
            USER = 'vllm'
            # Home directory of USER; the container unit directory is derived from it.
            HOME_DIR = '/var/lib/vllm'
            # Not referenced in this file; same number as the host side of
            # PublishPort in vLLM.container.
            PORT = 18050

            # Container images, chosen by the GPU devices found on the host.
            CPU_IMAGE = 'public.ecr.aws/q9t5s3a7/vllm-cpu-release-repo:v0.8.4'
            CUDA_IMAGE = 'docker.io/vllm/vllm-openai:latest'
            ROCM_IMAGE = 'docker.io/rocm/vllm:instinct_main'

            # Deploys (or re-deploys) the vLLM container on the target host.
            #
            # Reads from +target+:
            # * 'Model'    - optional (the mandatory check is disabled in the
            #                original code); appended to the arguments as
            #                ' --model <value>' when present
            # * 'Args'     - optional; substituted for the $ARGS placeholder
            # * 'Location' - passed to withConnection to reach the host
            def actionVLLMDeploy(id, target, activeState, context, options)
                self.withConnection(target['Location'], target) do |connection|
                    Linux.withConnection(connection) do |linux|
                        Podman.ensurePresent(linux, options)
                        Podman.createUser(USER, HOME_DIR, 'vLLM', linux, options)
                        linux.withUserShell(USER) { |userShell| userShell.createDirs(options, '~/.cache', '~/.triton') }

                        unitDir = Podman.containersPath(HOME_DIR)
                        envFile = "#{unitDir}/vLLM.env"
                        unitFile = "#{unitDir}/vLLM.container"

                        # The env file is created empty and restricted to the service account.
                        linux.fileWrite(envFile, '', options)
                        linux.setUserGroup(envFile, USER, USER, options)
                        linux.setPrivate(envFile, options)

                        linux.upload(__dir__ + '/vLLM.container', unitDir, options)

                        # Give the service account the groups reported for the detected GPU devices.
                        devices = linux.getGPUDevices(options)
                        gpuGroups = linux.getGPUGroups(devices, options)
                        linux.userAddGroups(USER, gpuGroups, options)

                        # ROCm (/dev/kfd) is checked before CUDA; CPU is the fallback.
                        image = if devices.include?('/dev/kfd')
                                    ROCM_IMAGE
                                elsif devices.include?('nvidia.com/gpu=all')
                                    CUDA_IMAGE
                                else
                                    CPU_IMAGE
                                end
                        # Placeholder patterns are single-quoted, so the
                        # backslash before '$' reaches fileReplace verbatim.
                        linux.fileReplace(unitFile, '\$IMAGE', image, options)

                        # Builds a new string, so target['Args'] itself is never modified.
                        cliArgs = target['Args'].to_s
                        cliArgs = "#{cliArgs} --model #{target['Model']}" if target['Model']
                        linux.fileReplace(unitFile, '\$ARGS', cliArgs, options)

                        # '\n' is single-quoted: a literal backslash followed by
                        # 'n', not a line break.
                        # NOTE(review): presumably `escape: false` lets
                        # fileReplace expand it into separate AddDevice= lines -
                        # confirm against Linux::Connection#fileReplace.
                        deviceLines = devices.empty? ? '' : devices.map { |device| "AddDevice=#{device}" }.join('\n')
                        linux.fileReplace(unitFile, '\$DEVICES', deviceLines, { **options, escape: false })

                        linux.reloadUserServices(USER, options)
                        linux.restartUserService(USER, 'vLLM', options)
                    end
                end
            end

            # Stops the service and deletes its container unit for every item
            # that cleanupType yields for the :vLLM type. With
            # options[:destroy] the service account is deleted as well. State
            # is only updated when this is not a dry run.
            def cleanup(configs, state, context, options)
                cleanupType(:vLLM, configs, state, context, options) do |_item, id, itemState, _itemContext, itemOptions, connection|
                    Linux.withConnection(connection) do |linux|
                        linux.stopUserService(USER, 'vLLM', itemOptions)

                        unitDir = Podman.containersPath(HOME_DIR)
                        # rm receives the dry-run flag itself, not the options hash.
                        linux.rm(unitDir + '/vLLM.container', itemOptions[:dry])

                        linux.reloadUserServices(USER, itemOptions)

                        itemState.item(id)['Status'] = State::STATUS_DELETED unless itemOptions[:dry]

                        # Everything below applies to a full destroy only.
                        next unless itemOptions[:destroy]

                        linux.deleteUserAndGroup(USER, itemOptions)
                        itemState.item(id)['Status'] = State::STATUS_DESTROYED unless itemOptions[:dry]
                    end
                end
            end

        end
    end
end
|
@@ -0,0 +1,26 @@
|
|
1
|
+
|
2
|
+
module ConfigLMM
    module LMM
        # General-purpose filesystem helpers exposed as a plugin.
        class Utils < Framework::Plugin

            # Creates directories and uploads files on the target host.
            #
            # Reads from +target+ (every key is optional):
            # * 'Directory'   - a single directory to create
            # * 'Directories' - a list of directories to create
            # * 'Copy'        - pairs of source => destination, each handed to
            #                   the connection's upload
            # * 'Location'    - passed to withConnection to reach the host
            def actionFilesystemDeploy(id, target, activeState, context, options)
                self.withConnection(target['Location'], target) do |connection|
                    Linux.withConnection(connection) do |linux|
                        linux.createDirs(options, target['Directory']) if target['Directory']
                        linux.createDirs(options, *target['Directories']) if target['Directories']

                        copies = target['Copy']
                        # Block parameters are named so they do not shadow +target+.
                        copies.each { |source, destination| linux.upload(source, destination, options) } if copies
                    end
                end
            end

        end
    end
end
|