feat: refactor LocalAGI backend configuration to use external-LLM mode and update disk size to 30GB
This commit is contained in:
@@ -25,50 +25,6 @@ if [[ -n "$header_content" ]]; then
|
||||
echo "$header_content"
|
||||
fi
|
||||
|
||||
# Decide which runtime backend label to use for LocalAGI.
|
||||
# Priority:
|
||||
# 1) Explicit user choice (`var_localagi_backend` or `var_torch_backend`)
|
||||
# 2) Auto-detection when GPU passthrough is enabled:
|
||||
# - NVIDIA device nodes => `cu128`
|
||||
# - AMD KFD node => `rocm7.2`
|
||||
# 3) Fallback => `cpu`
|
||||
resolve_backend() {
|
||||
local requested="${var_localagi_backend:-${var_torch_backend:-auto}}"
|
||||
local backend="cpu"
|
||||
local gpu_type="${GPU_TYPE:-unknown}"
|
||||
local has_nvidia="no"
|
||||
local has_kfd="no"
|
||||
local has_amd_pci="no"
|
||||
local has_amd_vendor="no"
|
||||
|
||||
[[ -e /dev/nvidia0 || -e /dev/nvidiactl ]] && has_nvidia="yes"
|
||||
[[ -e /dev/kfd ]] && has_kfd="yes"
|
||||
lspci 2>/dev/null | grep -qiE 'AMD|Radeon' && has_amd_pci="yes"
|
||||
grep -qEi '0x1002|0x1022' /sys/class/drm/renderD*/device/vendor /sys/class/drm/card*/device/vendor 2>/dev/null && has_amd_vendor="yes"
|
||||
|
||||
case "$requested" in
|
||||
cpu | cu128 | rocm7.2)
|
||||
backend="$requested"
|
||||
;;
|
||||
*)
|
||||
if [[ "${var_gpu:-no}" == "yes" ]]; then
|
||||
if [[ "${gpu_type}" == "NVIDIA" || "${has_nvidia}" == "yes" ]]; then
|
||||
backend="cu128"
|
||||
elif [[ "${gpu_type}" == "AMD" || "${has_kfd}" == "yes" ]]; then
|
||||
backend="rocm7.2"
|
||||
elif [[ "${has_amd_pci}" == "yes" ]]; then
|
||||
backend="rocm7.2"
|
||||
elif [[ "${has_amd_vendor}" == "yes" ]]; then
|
||||
backend="rocm7.2"
|
||||
fi
|
||||
fi
|
||||
;;
|
||||
esac
|
||||
|
||||
RESOLVED_BACKEND="$backend"
|
||||
BACKEND_DETECTION_SUMMARY="requested=${requested}, var_gpu=${var_gpu:-no}, GPU_TYPE=${gpu_type}, nvidia=${has_nvidia}, kfd=${has_kfd}, amd_pci=${has_amd_pci}, amd_vendor=${has_amd_vendor}, selected=${backend}"
|
||||
}
|
||||
|
||||
# Build LocalAGI from source using upstream workflow:
|
||||
# - Build frontend in `webui/react-ui` with Bun
|
||||
# - Build backend binary with Go to `/usr/local/bin/localagi`
|
||||
@@ -141,68 +97,13 @@ install_apt_packages_resilient() {
|
||||
retry_cmd 2 5 apt_install_fix_missing_cmd "$@"
|
||||
}
|
||||
|
||||
# Install ROCm runtime via AMD Debian package-manager method.
|
||||
# Steps:
|
||||
# - Determine supported suite mapping for current Debian version
|
||||
# - Install AMD signing key
|
||||
# - Add ROCm and graphics repositories for 7.2
|
||||
# - Pin AMD repo origin
|
||||
# - Install `rocm` meta-package
|
||||
install_rocm_runtime_debian() {
|
||||
if [[ -f /etc/os-release ]]; then
|
||||
. /etc/os-release
|
||||
fi
|
||||
|
||||
local rocm_suite=""
|
||||
case "${VERSION_ID:-}" in
|
||||
13*) rocm_suite="noble" ;;
|
||||
12*) rocm_suite="jammy" ;;
|
||||
*)
|
||||
msg_warn "Unsupported Debian version for automatic ROCm repo setup"
|
||||
return 1
|
||||
;;
|
||||
esac
|
||||
|
||||
msg_info "Configuring ROCm apt repositories (${rocm_suite})"
|
||||
mkdir -p /etc/apt/keyrings
|
||||
if ! curl -fsSL https://repo.radeon.com/rocm/rocm.gpg.key | gpg --dearmor -o /etc/apt/keyrings/rocm.gpg; then
|
||||
msg_warn "Failed to add ROCm apt signing key"
|
||||
return 1
|
||||
fi
|
||||
|
||||
cat <<EOF >/etc/apt/sources.list.d/rocm.list
|
||||
deb [arch=amd64 signed-by=/etc/apt/keyrings/rocm.gpg] https://repo.radeon.com/rocm/apt/7.2 ${rocm_suite} main
|
||||
deb [arch=amd64 signed-by=/etc/apt/keyrings/rocm.gpg] https://repo.radeon.com/graphics/7.2/ubuntu ${rocm_suite} main
|
||||
EOF
|
||||
|
||||
cat <<EOF >/etc/apt/preferences.d/rocm-pin-600
|
||||
Package: *
|
||||
Pin: release o=repo.radeon.com
|
||||
Pin-Priority: 600
|
||||
EOF
|
||||
|
||||
msg_info "Installing ROCm runtime packages (this may take several minutes)"
|
||||
if ! retry_cmd 3 5 apt_update_cmd; then
|
||||
msg_warn "ROCm apt repository update failed"
|
||||
return 1
|
||||
fi
|
||||
if ! retry_cmd 3 10 apt_install_cmd rocm; then
|
||||
msg_warn "ROCm runtime package installation failed"
|
||||
return 1
|
||||
fi
|
||||
ldconfig || true
|
||||
msg_ok "Installed ROCm runtime packages"
|
||||
}
|
||||
|
||||
# Install base tooling needed to fetch/build/run LocalAGI.
|
||||
# `gnupg` is required for ROCm key import path.
|
||||
msg_info "Installing Dependencies"
|
||||
install_apt_packages_resilient \
|
||||
curl \
|
||||
ca-certificates \
|
||||
git \
|
||||
jq \
|
||||
gnupg \
|
||||
build-essential
|
||||
msg_ok "Installed Dependencies"
|
||||
|
||||
@@ -224,20 +125,10 @@ msg_info "Fetching LocalAGI Source"
|
||||
CLEAN_INSTALL=1 fetch_and_deploy_gh_release "localagi" "mudler/LocalAGI" "tarball" "latest" "/opt/localagi"
|
||||
msg_ok "Fetched LocalAGI Source"
|
||||
|
||||
# Resolve backend and prepare persistent state directory.
|
||||
msg_info "Resolving LocalAGI backend"
|
||||
resolve_backend
|
||||
BACKEND="${RESOLVED_BACKEND:-cpu}"
|
||||
msg_info "Backend detection: ${BACKEND_DETECTION_SUMMARY:-unavailable}"
|
||||
# Configure external-LLM mode and prepare persistent state directory.
|
||||
BACKEND="external-llm"
|
||||
mkdir -p /opt/localagi/pool
|
||||
msg_ok "Resolved LocalAGI backend: ${BACKEND}"
|
||||
|
||||
# Only attempt ROCm runtime provisioning when AMD backend is selected.
|
||||
if [[ "${BACKEND}" == "rocm7.2" ]]; then
|
||||
install_rocm_runtime_debian || msg_warn "ROCm runtime package installation failed"
|
||||
else
|
||||
msg_warn "ROCm install skipped because selected backend is '${BACKEND}'"
|
||||
fi
|
||||
msg_ok "Configured LocalAGI backend mode: ${BACKEND}"
|
||||
|
||||
# Generate runtime configuration file used by systemd service.
|
||||
# Note: `LOCALAGI_LLM_API_URL` points to an OpenAI-compatible backend endpoint.
|
||||
@@ -251,7 +142,6 @@ LOCALAGI_LLM_API_URL=http://127.0.0.1:11434/v1
|
||||
LOCALAGI_STATE_DIR=/opt/localagi/pool
|
||||
LOCALAGI_TIMEOUT=5m
|
||||
LOCALAGI_ENABLE_CONVERSATIONS_LOGGING=false
|
||||
LOCALAGI_GPU_BACKEND=${BACKEND}
|
||||
EOF
|
||||
msg_ok "Configured LocalAGI"
|
||||
|
||||
|
||||
Reference in New Issue
Block a user