#!/bin/bash
# ==============================================================================
# Start Script for Ollama, FastAPI Backend, and Nginx Frontend
# This script initializes the environment, starts dependent services,
# and then launches the main application components.
# ==============================================================================

# ------------------------------------------------------------------------------
# 1. Environment Setup
# Set essential environment variables for performance and GPU usage.
# ------------------------------------------------------------------------------
echo "--- Initializing Environment Variables ---"
export OMP_NUM_THREADS=4
export MKL_NUM_THREADS=4
export CUDA_VISIBLE_DEVICES=0  # Specifies which GPU to use; 0 is the first GPU
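
# Optional sanity check (an assumption, not part of the original script): confirm
# the container actually sees a GPU before relying on CUDA_VISIBLE_DEVICES.
# nvidia-smi only exists when the NVIDIA runtime is available, so guard for it.
if command -v nvidia-smi >/dev/null 2>&1; then
    nvidia-smi -L || echo "Warning: nvidia-smi present but no GPU reported."
else
    echo "Note: nvidia-smi not found; continuing without a verified GPU."
fi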

# ------------------------------------------------------------------------------
# 2. Start Ollama Server and Pull Models
# Ollama must be running and the required models available before FastAPI starts.
# ------------------------------------------------------------------------------
echo "--- Starting Ollama Server ---"

# Start Ollama in the background.
# The 'serve' command runs the Ollama API server.
ollama serve &
# Wait for Ollama to become responsive before pulling models,
# since 'ollama list' and 'ollama pull' need the API server to be up.
max_attempts=90  # Maximum attempts (roughly 90 seconds)
attempt=0
echo "Waiting for Ollama API to be ready (max $max_attempts seconds)..."
while ! curl -s http://localhost:11434/api/tags >/dev/null; do
    sleep 1
    attempt=$((attempt + 1))
    if [ "$attempt" -ge "$max_attempts" ]; then
        echo "Error: Ollama failed to start within $max_attempts seconds. Exiting."
        exit 1
    fi
done
echo "Ollama is ready and responsive."

# Define the models to be pulled
MODEL_TO_PULL="krishna_choudhary/tinyllama:latest"
WHISPER_MODEL_TO_PULL="whisper:tiny"

# Pull the LLM model if it's not already present
echo "Checking for Ollama LLM model: $MODEL_TO_PULL"
if ! ollama list | grep -q "$MODEL_TO_PULL"; then
    echo "Pulling Ollama LLM model: $MODEL_TO_PULL (this may take some time)..."
    ollama pull "$MODEL_TO_PULL"
else
    echo "Ollama LLM model $MODEL_TO_PULL already present."
fi

# Pull the Whisper model for transcription if it's not already present
echo "Checking for Ollama Whisper model: $WHISPER_MODEL_TO_PULL"
if ! ollama list | grep -q "$WHISPER_MODEL_TO_PULL"; then
    echo "Pulling Ollama Whisper model: $WHISPER_MODEL_TO_PULL (this may take some time)..."
    ollama pull "$WHISPER_MODEL_TO_PULL"
else
    echo "Ollama Whisper model $WHISPER_MODEL_TO_PULL already present."
fi

# ------------------------------------------------------------------------------
# 3. Debugging: List Files
# Useful for verifying that application files are correctly copied into the container.
# ------------------------------------------------------------------------------
echo "--- Files in current directory ($PWD): ---"
ls -la
echo "-------------------------------------------"

# ------------------------------------------------------------------------------
# 4. Start FastAPI Backend Server
# The FastAPI application serves the API endpoints.
# ------------------------------------------------------------------------------
echo "--- Starting FastAPI Server ---"

# Run Uvicorn to serve the FastAPI application.
# --host 0.0.0.0 makes it accessible from outside the container (via the exposed port).
# --port 7860 is where FastAPI listens.
# --workers 1 and --limit-concurrency 20 are performance settings.
uvicorn main:app --host 0.0.0.0 --port 7860 --workers 1 --limit-concurrency 20 &
FASTAPI_PID=$!
echo "FastAPI server started with PID: $FASTAPI_PID"

# Give FastAPI a moment to fully initialize (optional but good practice)
sleep 5
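
# A sturdier readiness check than a fixed sleep (a sketch, assuming the app keeps
# FastAPI's default /openapi.json schema route enabled; adjust the path if the
# app disables it or exposes its own health endpoint):
for i in $(seq 1 30); do
    if curl -sf http://localhost:7860/openapi.json >/dev/null; then
        echo "FastAPI is responding."
        break
    fi
    sleep 1
done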

# ------------------------------------------------------------------------------
# 5. Start Nginx Web Server
# Nginx acts as a reverse proxy for the FastAPI backend and serves the React frontend.
# ------------------------------------------------------------------------------
echo "--- Starting Nginx Web Server on Port 8501 ---"

# 'daemon off;' keeps Nginx from daemonizing itself; we background it from the
# shell and capture its PID so the script can wait on it, which keeps the
# Docker container alive for as long as Nginx runs.
nginx -g 'daemon off;' &
NGINX_PID=$!
echo "Nginx started with PID: $NGINX_PID"

# ------------------------------------------------------------------------------
# 6. Keep Container Alive
# 'wait' keeps the script running for as long as Nginx is running.
# ------------------------------------------------------------------------------
echo "All services initiated. Keeping container alive by waiting for Nginx..."
wait $NGINX_PID
echo "Nginx stopped. Container may exit now."