gdnartea committed on
Commit
a783284
·
verified ·
1 Parent(s): 0d9b453

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -4,7 +4,7 @@ from llama_cpp import Llama
4
 
5
 
6
  llm = Llama(
7
- model_path="./Phi-3-mini-4k-instruct-q4.gguf", # path to GGUF file
8
  n_ctx=2048, # The max sequence length to use - note that longer sequence lengths require much more resources
9
  n_threads=8, # The number of CPU threads to use, tailor to your system and the resulting performance
10
  n_gpu_layers=0, # The number of layers to offload to GPU, if you have GPU acceleration available. Set to 0 if no GPU acceleration is available on your system.
 
4
 
5
 
6
  llm = Llama(
7
+ model_path="microsoft/Phi-3-mini-4k-instruct-q4.gguf", # path to GGUF file
8
  n_ctx=2048, # The max sequence length to use - note that longer sequence lengths require much more resources
9
  n_threads=8, # The number of CPU threads to use, tailor to your system and the resulting performance
10
  n_gpu_layers=0, # The number of layers to offload to GPU, if you have GPU acceleration available. Set to 0 if no GPU acceleration is available on your system.