2024-03-21 22:09:04 +01:00
|
|
|
#!/bin/bash
|
|
|
|
|
|
|
|
echo "===> LocalAI All-in-One (AIO) container starting..."
|
|
|
|
|
|
|
|
GPU_ACCELERATION=false
|
|
|
|
GPU_VENDOR=""
|
|
|
|
|
2024-03-30 12:04:32 +01:00
|
|
|
function check_intel() {
|
|
|
|
if lspci | grep -E 'VGA|3D' | grep -iq intel; then
|
|
|
|
echo "Intel GPU detected"
|
|
|
|
if [ -d /opt/intel ]; then
|
|
|
|
GPU_ACCELERATION=true
|
|
|
|
GPU_VENDOR=intel
|
|
|
|
else
|
|
|
|
echo "Intel GPU detected, but Intel GPU drivers are not installed. GPU acceleration will not be available."
|
|
|
|
fi
|
|
|
|
fi
|
|
|
|
}
|
|
|
|
|
|
|
|
function check_nvidia_wsl() {
|
|
|
|
if lspci | grep -E 'VGA|3D' | grep -iq "Microsoft Corporation Device 008e"; then
|
|
|
|
# We make the assumption this WSL2 cars is NVIDIA, then check for nvidia-smi
|
|
|
|
# Make sure the container was run with `--gpus all` as the only required parameter
|
|
|
|
echo "NVIDIA GPU detected via WSL2"
|
|
|
|
# nvidia-smi should be installed in the container
|
|
|
|
if nvidia-smi; then
|
|
|
|
GPU_ACCELERATION=true
|
|
|
|
GPU_VENDOR=nvidia
|
|
|
|
else
|
|
|
|
echo "NVIDIA GPU detected via WSL2, but nvidia-smi is not installed. GPU acceleration will not be available."
|
|
|
|
fi
|
|
|
|
fi
|
|
|
|
}
|
|
|
|
|
|
|
|
function check_amd() {
|
|
|
|
if lspci | grep -E 'VGA|3D' | grep -iq amd; then
|
|
|
|
echo "AMD GPU detected"
|
|
|
|
# Check if ROCm is installed
|
|
|
|
if [ -d /opt/rocm ]; then
|
|
|
|
GPU_ACCELERATION=true
|
|
|
|
GPU_VENDOR=amd
|
|
|
|
else
|
|
|
|
echo "AMD GPU detected, but ROCm is not installed. GPU acceleration will not be available."
|
|
|
|
fi
|
|
|
|
fi
|
|
|
|
}
|
|
|
|
|
|
|
|
function check_nvidia() {
|
|
|
|
if lspci | grep -E 'VGA|3D' | grep -iq nvidia; then
|
|
|
|
echo "NVIDIA GPU detected"
|
|
|
|
# nvidia-smi should be installed in the container
|
|
|
|
if nvidia-smi; then
|
|
|
|
GPU_ACCELERATION=true
|
|
|
|
GPU_VENDOR=nvidia
|
|
|
|
else
|
|
|
|
echo "NVIDIA GPU detected, but nvidia-smi is not installed. GPU acceleration will not be available."
|
|
|
|
fi
|
|
|
|
fi
|
|
|
|
}
|
|
|
|
|
|
|
|
function check_metal() {
|
|
|
|
if system_profiler SPDisplaysDataType | grep -iq 'Metal'; then
|
|
|
|
echo "Apple Metal supported GPU detected"
|
|
|
|
GPU_ACCELERATION=true
|
|
|
|
GPU_VENDOR=apple
|
|
|
|
fi
|
|
|
|
}
|
|
|
|
|
2024-03-21 22:09:04 +01:00
|
|
|
function detect_gpu() {
|
|
|
|
case "$(uname -s)" in
|
|
|
|
Linux)
|
2024-03-30 12:04:32 +01:00
|
|
|
check_nvidia
|
|
|
|
check_amd
|
|
|
|
check_intel
|
|
|
|
check_nvidia_wsl
|
2024-03-21 22:09:04 +01:00
|
|
|
;;
|
|
|
|
Darwin)
|
2024-03-30 12:04:32 +01:00
|
|
|
check_metal
|
2024-03-21 22:09:04 +01:00
|
|
|
;;
|
|
|
|
esac
|
|
|
|
}
|
|
|
|
|
|
|
|
function detect_gpu_size() {
|
|
|
|
# Attempting to find GPU memory size for NVIDIA GPUs
|
2024-03-25 10:36:18 -07:00
|
|
|
if [ "$GPU_ACCELERATION" = true ] && [ "$GPU_VENDOR" = "nvidia" ]; then
|
2024-03-21 22:09:04 +01:00
|
|
|
echo "NVIDIA GPU detected. Attempting to find memory size..."
|
2024-03-25 10:36:18 -07:00
|
|
|
# Using head -n 1 to get the total memory of the 1st NVIDIA GPU detected.
|
|
|
|
# If handling multiple GPUs is required in the future, this is the place to do it
|
|
|
|
nvidia_sm=$(nvidia-smi --query-gpu=memory.total --format=csv,noheader,nounits | head -n 1)
|
2024-03-21 22:09:04 +01:00
|
|
|
if [ ! -z "$nvidia_sm" ]; then
|
2024-03-25 10:36:18 -07:00
|
|
|
echo "Total GPU Memory: $nvidia_sm MiB"
|
|
|
|
# if bigger than 8GB, use 16GB
|
|
|
|
#if [ "$nvidia_sm" -gt 8192 ]; then
|
|
|
|
# GPU_SIZE=gpu-16g
|
|
|
|
#else
|
|
|
|
GPU_SIZE=gpu-8g
|
|
|
|
#fi
|
2024-03-21 22:09:04 +01:00
|
|
|
else
|
2024-03-25 10:36:18 -07:00
|
|
|
echo "Unable to determine NVIDIA GPU memory size. Falling back to CPU."
|
|
|
|
GPU_SIZE=gpu-8g
|
2024-03-21 22:09:04 +01:00
|
|
|
fi
|
2024-03-26 18:45:25 +01:00
|
|
|
elif [ "$GPU_ACCELERATION" = true ] && [ "$GPU_VENDOR" = "intel" ]; then
|
|
|
|
GPU_SIZE=intel
|
2024-03-25 10:36:18 -07:00
|
|
|
# Default to a generic GPU size until we implement GPU size detection for non NVIDIA GPUs
|
|
|
|
elif [ "$GPU_ACCELERATION" = true ]; then
|
|
|
|
echo "Non-NVIDIA GPU detected. Specific GPU memory size detection is not implemented."
|
|
|
|
GPU_SIZE=gpu-8g
|
2024-03-21 22:09:04 +01:00
|
|
|
|
|
|
|
# default to cpu if GPU_SIZE is not set
|
2024-03-25 10:36:18 -07:00
|
|
|
else
|
|
|
|
echo "GPU acceleration is not enabled or supported. Defaulting to CPU."
|
2024-03-21 22:09:04 +01:00
|
|
|
GPU_SIZE=cpu
|
|
|
|
fi
|
|
|
|
}
|
|
|
|
|
|
|
|
function check_vars() {
|
|
|
|
if [ -z "$MODELS" ]; then
|
|
|
|
echo "MODELS environment variable is not set. Please set it to a comma-separated list of model YAML files to load."
|
|
|
|
exit 1
|
|
|
|
fi
|
|
|
|
|
2024-03-30 12:04:32 +01:00
|
|
|
if [ -z "$PROFILE" ]; then
|
|
|
|
echo "PROFILE environment variable is not set. Please set it to one of the following: cpu, gpu-8g, gpu-16g, apple"
|
2024-03-21 22:09:04 +01:00
|
|
|
exit 1
|
|
|
|
fi
|
|
|
|
}
|
|
|
|
|
|
|
|
detect_gpu
|
|
|
|
detect_gpu_size
|
|
|
|
|
2024-03-30 12:04:32 +01:00
|
|
|
PROFILE="${PROFILE:-$GPU_SIZE}" # default to cpu
|
2024-04-25 00:19:02 +02:00
|
|
|
export MODELS="${MODELS:-/aio/${PROFILE}/embeddings.yaml,/aio/${PROFILE}/rerank.yaml,/aio/${PROFILE}/text-to-speech.yaml,/aio/${PROFILE}/image-gen.yaml,/aio/${PROFILE}/text-to-text.yaml,/aio/${PROFILE}/speech-to-text.yaml,/aio/${PROFILE}/vision.yaml}"
|
2024-03-21 22:09:04 +01:00
|
|
|
|
|
|
|
check_vars
|
|
|
|
|
2024-03-30 12:04:32 +01:00
|
|
|
echo "===> Starting LocalAI[$PROFILE] with the following models: $MODELS"
|
2024-03-21 22:09:04 +01:00
|
|
|
|
2024-04-02 02:15:44 -05:00
|
|
|
exec /build/entrypoint.sh "$@"
|