michailroussos committed on
Commit
0556c99
·
1 Parent(s): 1188d49
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -37,10 +37,10 @@ def respond(message, history, system_message, max_tokens, temperature, top_p):
37
  ).to("cuda" if torch.cuda.is_available() else "cpu")
38
 
39
  # Generate the response
40
- attention_mask = inputs.ne(tokenizer.pad_token_id).long()
41
  generated_tokens = model.generate(
42
  input_ids=inputs,
43
- attention_mask=attention_mask,
44
  max_new_tokens=max_tokens,
45
  use_cache=True,
46
  temperature=temperature,
 
37
  ).to("cuda" if torch.cuda.is_available() else "cpu")
38
 
39
  # Generate the response
40
+ #attention_mask = inputs.ne(tokenizer.pad_token_id).long()
41
  generated_tokens = model.generate(
42
  input_ids=inputs,
43
+ #attention_mask=attention_mask,
44
  max_new_tokens=max_tokens,
45
  use_cache=True,
46
  temperature=temperature,