litellm / entrypoint.sh
zhengr's picture
Update entrypoint.sh
4433f67 verified
raw
history blame
520 Bytes
#!/bin/bash
# Container entrypoint: start the Ollama server, pull and load every model
# named in $model, then run the LiteLLM proxy in front of Ollama.
#
# Environment:
#   model  Comma-separated list of Ollama model names (required), e.g.
#          "llama3,mistral". Whitespace around names is ignored. Every model
#          is pulled and loaded; only the LAST one is passed to litellm.

# Abort early with a clear message rather than starting litellm with the
# meaningless model name "ollama/".
: "${model:?model must be set to a comma-separated list of Ollama models}"

# Maximum number of seconds to wait for the Ollama server to come up.
startup_timeout=60

# Starting server
echo "Starting server"
ollama serve &
server_pid=$!

# Poll until the server answers instead of hoping a fixed sleep is long
# enough; give up if the server process dies or the timeout elapses.
server_ready=0
for ((i = 0; i < startup_timeout; i++)); do
  if ollama list >/dev/null 2>&1; then
    server_ready=1
    break
  fi
  if ! kill -0 "$server_pid" 2>/dev/null; then
    echo "ollama serve exited before becoming ready" >&2
    exit 1
  fi
  sleep 1
done
if ((server_ready == 0)); then
  echo "ollama serve not ready after ${startup_timeout}s" >&2
  exit 1
fi

# Split the model list on commas, trim surrounding whitespace from each
# entry and drop empty entries (e.g. from a trailing comma).
IFS=',' read -ra raw_models <<< "$model"
models=()
for entry in "${raw_models[@]}"; do
  entry="${entry#"${entry%%[![:space:]]*}"}"  # strip leading whitespace
  entry="${entry%"${entry##*[![:space:]]}"}"  # strip trailing whitespace
  if [[ -n "$entry" ]]; then
    models+=("$entry")
  fi
done
if ((${#models[@]} == 0)); then
  echo "model contains no model names: '$model'" >&2
  exit 1
fi

for m in "${models[@]}"; do
  echo "Pulling $m"
  if ! ollama pull "$m"; then
    # Best effort: a model that cannot be pulled cannot be run, but the
    # remaining models should still be attempted.
    echo "Failed to pull $m; skipping" >&2
    continue
  fi
  # Delay between pull and run kept from the original script.
  sleep 5
  echo "Running $m"
  # A negative keepalive asks Ollama to keep the model loaded indefinitely.
  if ! ollama run "$m" --keepalive -1s; then
    echo "Failed to run $m" >&2
  fi
done

# The proxy serves the last model in the list (previously this relied on the
# loop variable still holding its final value after the loop).
served_model="${models[${#models[@]} - 1]}"
litellm --model "ollama/${served_model}" --drop_params

# Keep the script running to prevent the container from exiting
wait