lengyue233 committed on
Commit
58a44f9
·
verified ·
1 Parent(s): 5b8d983

Try compile on zero

Browse files
Files changed (1) hide show
  1. app.py +2 -0
app.py CHANGED
@@ -251,6 +251,7 @@ def build_app():
251
  # speaker,
252
  ],
253
  [audio, error],
 
254
  )
255
 
256
  return app
@@ -286,6 +287,7 @@ if __name__ == "__main__":
286
  args = parse_args()
287
 
288
  args.precision = torch.half if args.half else torch.bfloat16
 
289
 
290
  logger.info("Loading Llama model...")
291
  llama_model, decode_one_token = load_llama_model(
 
251
  # speaker,
252
  ],
253
  [audio, error],
254
+ concurrency_limit=1,
255
  )
256
 
257
  return app
 
287
  args = parse_args()
288
 
289
  args.precision = torch.half if args.half else torch.bfloat16
290
+ args.compile = True
291
 
292
  logger.info("Loading Llama model...")
293
  llama_model, decode_one_token = load_llama_model(