Spaces:

Lyte
/

DeepSeek-R1-Distill-Qwen-32B-Demo-GGUF

Running

Upload 4 files

45e65a9 verified 6 months ago

402 Bytes

	#!/bin/bash
	#
	# Entrypoint: launches llama-server in the background, blocks until its HTTP
	# API answers successfully, then runs the Gradio app in the foreground.
	# Exits with status 1 if a required directory is missing or if llama-server
	# terminates before it becomes ready.

	# Start llama-server in background
	cd /llama.cpp/build || { echo "Cannot cd to /llama.cpp/build" >&2; exit 1; }
	./bin/llama-server --host 0.0.0.0 --port 8080 --model /models/model.q2_k_l.gguf --ctx-size 16384 &
	# Remember the PID so the wait loop can detect an early crash.
	server_pid=$!

	# Wait for server to initialize
	echo "Waiting for server to start..."
	# -f makes curl fail on HTTP error statuses (>= 400), so an error response
	# (e.g. a 503 while the model is presumably still loading) does not count as
	# "ready"; only a successful response ends the loop.
	until curl -sf "http://localhost:8080/v1/models" >/dev/null; do
		# Without this check the loop would spin forever if llama-server failed
		# to start (missing model file, out of memory, bad binary, ...).
		if ! kill -0 "$server_pid" 2>/dev/null; then
			echo "llama-server exited before becoming ready." >&2
			exit 1
		fi
		sleep 1
	done

	echo "Server is ready. Starting Gradio app."

	# Start Gradio UI
	cd / || { echo "Cannot cd to /" >&2; exit 1; }
	python3 app.py