radames committed on
Commit
7794339
·
1 Parent(s): 26cd590

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -1
app.py CHANGED
@@ -12,7 +12,7 @@ llm = Llama(
12
  filename="llama-2-7b-chat.ggmlv3.q5_0.bin",
13
  ),
14
  n_ctx=2048,
15
- n_gpu_layers=1500, # change n_gpu_layers if you have more or less VRAM
16
  )
17
 
18
  history = []
@@ -61,6 +61,8 @@ demo = gr.ChatInterface(
61
  generate_text,
62
  title="llama-cpp-python on GPU",
63
  description="Running LLM with https://github.com/abetlen/llama-cpp-python",
 
 
64
  retry_btn=None,
65
  undo_btn="Delete Previous",
66
  clear_btn="Clear",
 
12
  filename="llama-2-7b-chat.ggmlv3.q5_0.bin",
13
  ),
14
  n_ctx=2048,
15
+ n_gpu_layers=5000, # change n_gpu_layers if you have more or less VRAM
16
  )
17
 
18
  history = []
 
61
  generate_text,
62
  title="llama-cpp-python on GPU",
63
  description="Running LLM with https://github.com/abetlen/llama-cpp-python",
64
+ examples=["tell me everything about llamas"],
65
+ cache_examples=True,
66
  retry_btn=None,
67
  undo_btn="Delete Previous",
68
  clear_btn="Clear",