Spaces:

NitinBot001
/

llama3.2-api

Sleeping

App Files Files Community

llama3.2-api / app.py

NitinBot001

Create app.py

6cb858c verified 24 days ago

raw

history blame

3.25 kB

	import os
	import requests
	from flask import Flask, request, jsonify
	from llama_cpp import Llama
	import subprocess
	import time
	import json

	app = Flask(__name__)
	MODEL_PATH = "model/calme-3.3-llamaloi-3b.Q4_K_M.gguf"
	GH_PAT = os.getenv("GH_PAT","ghp_TGVMURDWG3HkLIfWUa4hyJUGYOYgXH1EljIi") # GitHub Personal Access Token
	REPO_URL = "https://github.com/NitinBot001/Audio-url-new-js.git"

	def download_model():
	os.makedirs("model", exist_ok=True)
	if not os.path.exists(MODEL_PATH):
	print("Downloading model...")
	r = requests.get(
	"https://huggingface.co/MaziyarPanahi/calme-3.3-llamaloi-3b-GGUF/resolve/main/calme-3.3-llamaloi-3b.Q4_K_M.gguf",
	stream=True,
	)
	with open(MODEL_PATH, "wb") as f:
	for chunk in r.iter_content(chunk_size=8192):
	f.write(chunk)

	def start_tunnel():
	# Start nport tunnel
	tunnel_process = subprocess.Popen(
	["npx", "nport", "-s", "ai-service", "-p", "5000"],
	stdout=subprocess.PIPE,
	stderr=subprocess.PIPE,
	)
	time.sleep(10) # Wait for tunnel to establish

	# Extract tunnel URL from logs
	tunnel_url = None
	for line in iter(tunnel_process.stdout.readline, b""):
	line = line.decode("utf-8").strip()
	if "your domain is:" in line:
	tunnel_url = line.split("your domain is: ")[1]
	break

	if not tunnel_url:
	raise Exception("Failed to extract tunnel URL")

	return tunnel_url

	def push_tunnel_url_to_repo(tunnel_url):
	# Create instance.json
	instance_data = {"tunnel_url": tunnel_url}
	with open("instance.json", "w") as f:
	json.dump(instance_data, f)

	# Clone the repository
	subprocess.run(
	["git", "clone", f"https://x-access-token:{GH_PAT}@{REPO_URL.split('https://')[1]}", "repo"],
	check=True,
	)
	os.chdir("repo")

	# Move instance.json to the repository
	subprocess.run(["mv", "../instance.json", "."], check=True)

	# Commit and push changes
	subprocess.run(["git", "config", "--global", "user.email", "[email protected]"], check=True)
	subprocess.run(["git", "config", "--global", "user.name", "github-actions"], check=True)
	subprocess.run(["git", "add", "instance.json"], check=True)
	subprocess.run(["git", "commit", "-m", f"Update tunnel URL to {tunnel_url}"], check=True)
	subprocess.run(["git", "push", "origin", "main"], check=True)

	@app.route("/chat", methods=["POST"])
	def chat():
	data = request.json
	prompt = f"<\|begin_of_text\|><\|start_header_id\|>user<\|end_header_id\|>\n{data.get('message','')}<\|eot_id\|>\n<\|start_header_id\|>assistant<\|end_header_id\|>\n"
	output = llm(prompt, max_tokens=2048, stop=["<\|eot_id\|>"], temperature=0.8, top_p=0.9)
	return jsonify({"response": output["choices"][0]["text"].strip()})

	if __name__ == "__main__":
	# Download the model
	download_model()

	# Initialize the LLM
	llm = Llama(
	model_path=MODEL_PATH,
	n_ctx=8192,
	n_threads=2,
	n_gpu_layers=0,
	verbose=False,
	)

	# Start the tunnel and push the URL
	tunnel_url = start_tunnel()
	push_tunnel_url_to_repo(tunnel_url)

	# Run the Flask app
	app.run(host="0.0.0.0", port=5000)