#!/bin/bash
#
# Container entrypoint: starts the Ollama server, pulls the models the
# application uses, then runs the FastAPI app with uvicorn on port 7860.
#
# Environment:
#   OLLAMA_READY_TIMEOUT  Seconds to wait for the Ollama server to answer
#                         before giving up (default: 60).

set -euo pipefail

readonly EMBEDDING_MODEL="nomic-embed-text"
readonly LLM_MODEL="llama3.2:1b"
readonly APP_PORT=7860   # default port for HF Spaces
readonly READY_TIMEOUT="${OLLAMA_READY_TIMEOUT:-60}"

# Print an error message to stderr and abort the script.
die() {
  printf 'ERROR: %s\n' "$*" >&2
  exit 1
}

#######################################
# Poll the Ollama server until it answers a client request.
# Arguments: $1 - PID of the background `ollama serve` process
#            $2 - maximum number of seconds to wait
# Returns:   0 once `ollama list` succeeds; 1 if the server process has
#            exited or the timeout elapsed first.
#######################################
wait_for_ollama() {
  local server_pid=$1
  local timeout=$2
  local waited=0

  until ollama list >/dev/null 2>&1; do
    # Stop waiting early if the server process is already gone.
    kill -0 "$server_pid" 2>/dev/null || return 1
    (( waited < timeout )) || return 1
    sleep 1
    waited=$(( waited + 1 ))
  done
}

#######################################
# Pull one model. A failed pull is reported on stderr but does not abort
# the script, so the application is still started afterwards.
# Arguments: $1 - model name
#######################################
pull_model() {
  local model=$1

  if ! ollama pull "$model"; then
    printf 'WARNING: failed to pull model %s; continuing\n' "$model" >&2
  fi
}

# Start Ollama service in the background and remember its PID so the
# readiness loop can detect an early exit.
ollama serve &
ollama_pid=$!

# Wait until the server actually responds instead of sleeping a fixed time.
wait_for_ollama "$ollama_pid" "$READY_TIMEOUT" \
  || die "Ollama server did not become ready within ${READY_TIMEOUT}s"

# Pull the required embedding model
echo "Pulling nomic-embed-text..."
pull_model "$EMBEDDING_MODEL"

# Pull the small LLM for generating responses (llama3.2:1b)
echo "Pulling llama3.2:1b... (Lightweight model for HF Free Tier)"
pull_model "$LLM_MODEL"

# Start the FastAPI server on port 7860 (default for HF Spaces).
# `exec` replaces this shell with uvicorn so that signals sent to the
# script's process are delivered to uvicorn directly.
echo "Starting Application..."
exec uvicorn main:app --host 0.0.0.0 --port "$APP_PORT"