Spaces:

Komal01
/

Streaming_RAG_chatbot

Sleeping

Streaming_RAG_chatbot / start.sh

Upload 2 files

b37c0cf verified 3 months ago

1.01 kB

	#!/bin/bash

	# Tuning knobs inherited by every process launched later in this script:
	# two thread-count settings and the list of CUDA device indices.
	OMP_NUM_THREADS=4
	MKL_NUM_THREADS=4
	CUDA_VISIBLE_DEVICES=0,1
	export OMP_NUM_THREADS MKL_NUM_THREADS CUDA_VISIBLE_DEVICES

	# Start the Ollama server in the background; everything below talks to it
	# through its local HTTP endpoint on port 11434.
	ollama serve &

	# Wait for the server to answer BEFORE using the `ollama` CLI. The CLI
	# commands (`list`, `pull`) are clients of the running server, so invoking
	# them earlier races against server startup.
	# Polls once per second, giving up after max_attempts tries.
	max_attempts=30
	attempt=0
	while ! curl -s http://localhost:11434/api/tags >/dev/null; do
		sleep 1
		attempt=$((attempt + 1))
		if [ "$attempt" -ge "$max_attempts" ]; then
			# Diagnostics go to stderr; non-zero exit stops the rest of the startup.
			echo "Ollama failed to start within ${max_attempts} seconds. Exiting." >&2
			exit 1
		fi
	done

	echo "Ollama is ready."

	# Pull each required model only if it is not already listed locally.
	# Note: this must be a real pipe (`|`); an escaped `\|` would be passed to
	# `ollama list` as a literal argument and grep would never run.
	# -F matches the model name as a fixed string, -q suppresses output.
	for model in deepseek-r1:7b nomic-embed-text; do
		if ! ollama list | grep -qF -- "$model"; then
			ollama pull "$model"
		fi
	done

	# Network settings shared by the two servers launched below.
	bind_host=0.0.0.0
	api_port=8000
	ui_port=7860

	# Startup banner, printed before either server is launched.
	# NOTE(review): the text says "API" but the port shown (7860) is the one
	# Streamlit binds to; uvicorn listens on 8000. Confirm which is intended.
	echo "API is running on: http://0.0.0.0:7860"

	# FastAPI backend: runs in the background so the script can go on to
	# launch the UI.
	uvicorn app:app --host "$bind_host" --port "$api_port" --workers 1 --limit-concurrency 20 &

	# Streamlit UI: runs in the foreground, so the script stays alive for as
	# long as Streamlit does.
	streamlit run streamlit_app.py --server.port "$ui_port" --server.address "$bind_host"