litellm / entrypoint.sh
zhengr's picture
init
df054a5
raw
history blame
569 Bytes
#!/bin/bash
#
# Entrypoint script: announces startup, then launches the LiteLLM proxy using
# the configuration file at /config.yaml.
#
# The proxy is started with `exec`, so it replaces this shell process:
#   * signals delivered to the script's PID reach litellm directly instead of
#     being held by an intermediate shell;
#   * litellm's exit status becomes the exit status of this script, so a
#     failed start or crash is visible to whatever launched it.
# No trailing `wait` is needed: nothing is started in the background, and the
# process stays alive for exactly as long as litellm runs.

# Abort on command failure, on use of an unset variable, and on a failure in
# any stage of a pipeline.
set -euo pipefail

echo "Starting server"

# --- Disabled: local Ollama bootstrap (kept for reference) -------------------
# Starts an Ollama server in the background, then pulls and runs every model
# named in the comma-separated variable $model before serving it via litellm.
#
#ollama serve &
#sleep 1
# IFS=',' read -ra MODELS <<< "$model"
# for m in "${MODELS[@]}"; do
#   echo "Pulling $m"
#   ollama pull "$m"
#   sleep 5
#   echo "Running $m"
#   ollama run "$m" --keepalive -1s
#   # No need to sleep here unless a delay between pulls is wanted
# done
#litellm --model ollama/"$m" --drop_params
# -----------------------------------------------------------------------------

# Replace the shell with the proxy process (see header comment for why).
exec litellm --config /config.yaml