eikarna
committed on
Commit
·
c376a77
1
Parent(s):
f858b89
Minor Update
Browse files
app.py
CHANGED
@@ -36,7 +36,7 @@ def load_model():
|
|
36 |
model = AutoModelForCausalLM.from_pretrained(
|
37 |
MODEL_NAME,
|
38 |
trust_remote_code=True,
|
39 |
-
torch_dtype=torch.
|
40 |
device_map="auto"
|
41 |
)
|
42 |
|
@@ -71,7 +71,6 @@ def generate_response(prompt: str, settings: Dict[str, Any]) -> str:
|
|
71 |
max_new_tokens=settings["max_tokens"],
|
72 |
temperature=settings["temperature"],
|
73 |
top_p=settings["top_p"],
|
74 |
-
do_sample=True,
|
75 |
pad_token_id=st.session_state.tokenizer.eos_token_id
|
76 |
)
|
77 |
|
|
|
36 |
model = AutoModelForCausalLM.from_pretrained(
|
37 |
MODEL_NAME,
|
38 |
trust_remote_code=True,
|
39 |
+
torch_dtype=torch.float16,
|
40 |
device_map="auto"
|
41 |
)
|
42 |
|
|
|
71 |
max_new_tokens=settings["max_tokens"],
|
72 |
temperature=settings["temperature"],
|
73 |
top_p=settings["top_p"],
|
|
|
74 |
pad_token_id=st.session_state.tokenizer.eos_token_id
|
75 |
)
|
76 |
|