#!/bin/bash
#
# Container entrypoint: starts the Ollama server in the background, pulls and
# loads every model named in $model, then runs the LiteLLM proxy in the
# foreground in front of the last model in the list.
#
# Environment:
#   model  Required. Comma-separated list of Ollama model names, e.g.
#          "llama2,mistral". Whitespace around each name is ignored and
#          empty entries are skipped.
#
# `set -e` is deliberately not used: a model that fails to pull is reported
# on stderr and the script carries on with the remaining steps.

# Maximum number of one-second polls while waiting for `ollama serve`.
readonly SERVER_WAIT_ATTEMPTS=30

# Print a diagnostic message to stderr.
warn() {
  printf '%s\n' "$*" >&2
}

# Print a diagnostic message to stderr and abort the script.
die() {
  warn "$@"
  exit 1
}

# Strip leading and trailing whitespace from $1 and write the result to stdout.
trim() {
  local text=$1
  text="${text#"${text%%[![:space:]]*}"}"
  text="${text%"${text##*[![:space:]]}"}"
  printf '%s' "$text"
}

# Poll the Ollama server until the CLI can reach it.
# Returns 0 once `ollama list` succeeds, 1 if it never does within
# SERVER_WAIT_ATTEMPTS polls.
wait_for_server() {
  local attempt
  for ((attempt = 0; attempt < SERVER_WAIT_ATTEMPTS; attempt++)); do
    if ollama list >/dev/null 2>&1; then
      return 0
    fi
    sleep 1
  done
  return 1
}

main() {
  # Fail fast with a clear message instead of starting litellm on "ollama/".
  : "${model:?environment variable 'model' must be a comma-separated list of models}"

  # Split the list on commas, then drop surrounding whitespace and blanks.
  local -a requested=() models=()
  local entry
  IFS=',' read -ra requested <<< "$model"
  for entry in "${requested[@]}"; do
    entry=$(trim "$entry")
    if [[ -n "$entry" ]]; then
      models+=("$entry")
    fi
  done
  (( ${#models[@]} > 0 )) || die "no model names found in model='$model'"

  echo "Starting server"
  ollama serve &

  # Wait until the server actually answers rather than sleeping a fixed time.
  if ! wait_for_server; then
    warn "warning: ollama server not reachable after ${SERVER_WAIT_ATTEMPTS}s; continuing anyway"
  fi

  local m
  for m in "${models[@]}"; do
    echo "Pulling $m"
    ollama pull "$m" || warn "warning: failed to pull $m"
    sleep 5
    echo "Running $m"
    # The keep-alive value -1s is passed through unchanged; presumably a
    # negative duration keeps the model loaded indefinitely (see Ollama docs).
    ollama run "$m" --keepalive -1s
  done

  # The proxy fronts the last model in the list.
  local proxy_model="${models[${#models[@]}-1]}"
  litellm --model "ollama/${proxy_model}" --drop_params

  # litellm runs in the foreground; if it exits, block on the background
  # server so the container keeps running.
  wait
}

main "$@"