jonaschua committed on
Commit
2c71536
·
verified ·
1 Parent(s): a583c0c

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -9,7 +9,7 @@ import requests
9
  model = ""
10
  duration = 5
11
  token = os.getenv('deepseekv2')
12
- provider = 'together' #'fal-ai' #None #replicate # sambanova
13
 
14
  print(f"Is CUDA available: {torch.cuda.is_available()}")
15
  print(f"CUDA device: {torch.cuda.get_device_name(torch.cuda.current_device())}")
@@ -71,7 +71,7 @@ def respond(message, history: list[tuple[str, str]], model, system_message, max_
71
  print(model)
72
  model_name = choose_model(model)
73
 
74
- client = InferenceClient(model_name, provider="sambanova", token=os.getenv('deepseekv2'))
75
 
76
  messages = [{"role": "system", "content": system_message}]
77
 
 
9
  model = ""
10
  duration = 5
11
  token = os.getenv('deepseekv2')
12
+ provider = 'sambanova' #'fal-ai' #None #replicate # sambanova
13
 
14
  print(f"Is CUDA available: {torch.cuda.is_available()}")
15
  print(f"CUDA device: {torch.cuda.get_device_name(torch.cuda.current_device())}")
 
71
  print(model)
72
  model_name = choose_model(model)
73
 
74
+ client = InferenceClient(model_name, provider=provider, token=os.getenv('deepseekv2'))
75
 
76
  messages = [{"role": "system", "content": system_message}]
77