Spaces:

He-Xingwei
/

llama2_test

Sleeping

He-Xingwei committed on Dec 4, 2023

Commit

bb86659

1 Parent(s): 4526b2c

first version

Files changed (1) hide show

app.py CHANGED Viewed

@@ -33,14 +33,14 @@ if not torch.cuda.is_available():
     DESCRIPTION += "\n<p>Running on CPU 🥶 This demo does not work on CPU.</p>"
-# if torch.cuda.is_available():
-model_id = "meta-llama/Llama-2-7b-chat-hf"
-model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.float16, device_map="auto")
-tokenizer = AutoTokenizer.from_pretrained(model_id)
-tokenizer.use_default_system_prompt = False
-# @spaces.GPU
 def generate(
     message: str,
     chat_history: list[tuple[str, str]],

     DESCRIPTION += "\n<p>Running on CPU 🥶 This demo does not work on CPU.</p>"
+if torch.cuda.is_available():
+    model_id = "meta-llama/Llama-2-7b-chat-hf"
+    model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.float16, device_map="auto")
+    tokenizer = AutoTokenizer.from_pretrained(model_id)
+    tokenizer.use_default_system_prompt = False
+@spaces.GPU
 def generate(
     message: str,
     chat_history: list[tuple[str, str]],