llama-cpp-agent

Paused

pabloce committed on May 21, 2024

Commit

0fd9e08

verified ·

1 Parent(s): 2bd7c02

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -7,7 +7,7 @@ from huggingface_hub import hf_hub_download
 subprocess.run('pip install llama-cpp-python==0.2.75 --extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cu124', shell=True)
 subprocess.run('pip install llama-cpp-agent==0.2.10', shell=True)
-hf_hub_download(repo_id="bartowski/Meta-Llama-3-70B-Instruct-GGUF", filename="Meta-Llama-3-70B-Instruct-Q4_K_M.gguf",  local_dir = "./models")
 @spaces.GPU(duration=120)
 def respond(
@@ -26,7 +26,7 @@ def respond(
     from llama_cpp_agent.chat_history.messages import Roles
     llm = Llama(
-        model_path="models/Meta-Llama-3-70B-Instruct-Q4_K_M.gguf",
         n_gpu_layers=81,
     )
     provider = LlamaCppPythonProvider(llm)

 subprocess.run('pip install llama-cpp-python==0.2.75 --extra-index-url https://abetlen.github.io/llama-cpp-python/whl/cu124', shell=True)
 subprocess.run('pip install llama-cpp-agent==0.2.10', shell=True)
+hf_hub_download(repo_id="bartowski/Meta-Llama-3-70B-Instruct-GGUF", filename="Meta-Llama-3-70B-Instruct-Q3_K_M.gguf",  local_dir = "./models")
 @spaces.GPU(duration=120)
 def respond(
     from llama_cpp_agent.chat_history.messages import Roles
     llm = Llama(
+        model_path="models/Meta-Llama-3-70B-Instruct-Q3_K_M.gguf",
         n_gpu_layers=81,
     )
     provider = LlamaCppPythonProvider(llm)