Spaces:

joaogante
/

assisted_generation_demo

Running on Zero

joaogante committed on Aug 21, 2024

Commit

4b1483e

verified ·

1 Parent(s): 68ac19e

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,3 +1,4 @@
 from threading import Thread
 import torch
@@ -20,6 +21,7 @@ tokenizer = AutoTokenizer.from_pretrained(model_id)
 assistant_model = AutoModelForCausalLM.from_pretrained(assistant_id).to(torch_device)
 def run_generation(user_text, use_assistant, temperature, max_new_tokens):
     if temperature < 0.1:
         do_sample = False

+import spaces
 from threading import Thread
 import torch
 assistant_model = AutoModelForCausalLM.from_pretrained(assistant_id).to(torch_device)
+@spaces.GPU
 def run_generation(user_text, use_assistant, temperature, max_new_tokens):
     if temperature < 0.1:
         do_sample = False