Spaces: Runtime error
Update app.py
Browse files
app.py
CHANGED
@@ -20,7 +20,7 @@ MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
 if torch.cuda.is_available():
     #model_id = "Qwen/Qwen2.5-7B-Instruct"
     model_id = "BenBranyon/sumbot7b"
-    model =
+    model = AutoPeftModelForCausalLM.from_pretrained(model_id, device_map="auto")
     tokenizer = AutoTokenizer.from_pretrained(model_id)
     tokenizer.use_default_system_prompt = False
 