CreitinGameplays committed on
Commit
ea5e120
·
verified ·
1 Parent(s): c6eb853

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -15,7 +15,7 @@ if not torch.cuda.is_available():
15
  DESCRIPTION += "\n<p>Running on CPU 🥶 This demo does not work on CPU.</p>"
16
 
17
  MAX_MAX_NEW_TOKENS = 2048
18
- DEFAULT_MAX_NEW_TOKENS = 1024
19
  MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
20
 
21
  if torch.cuda.is_available():
@@ -62,6 +62,7 @@ def generate(
62
  outputs = []
63
  for text in streamer:
64
  outputs.append(text)
 
65
  yield "".join(outputs)
66
 
67
 
 
15
  DESCRIPTION += "\n<p>Running on CPU 🥶 This demo does not work on CPU.</p>"
16
 
17
  MAX_MAX_NEW_TOKENS = 2048
18
+ DEFAULT_MAX_NEW_TOKENS = 512
19
  MAX_INPUT_TOKEN_LENGTH = int(os.getenv("MAX_INPUT_TOKEN_LENGTH", "4096"))
20
 
21
  if torch.cuda.is_available():
 
62
  outputs = []
63
  for text in streamer:
64
  outputs.append(text)
65
+ outputs = outputs.replace("||assistant|>", "").strip()
66
  yield "".join(outputs)
67
 
68