jonaschua committed on
Commit
cec57c9
·
verified ·
1 Parent(s): af89835

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +7 -0
app.py CHANGED
@@ -7,11 +7,18 @@ import gradio as gr
7
  from gradio import FileData
8
  import time
9
  import spaces
 
 
 
 
10
  ckpt = "meta-llama/Llama-3.2-11B-Vision-Instruct"
11
  model = MllamaForConditionalGeneration.from_pretrained(ckpt,
12
  torch_dtype=torch.bfloat16).to("cuda")
13
  processor = AutoProcessor.from_pretrained(ckpt)
14
 
 
 
 
15
 
16
  @spaces.GPU
17
  def bot_streaming(message, history, max_new_tokens=250):
 
7
  from gradio import FileData
8
  import time
9
  import spaces
10
+ import os
11
+ from huggingface_hub import InferenceClient
12
+
13
+
14
  ckpt = "meta-llama/Llama-3.2-11B-Vision-Instruct"
15
  model = MllamaForConditionalGeneration.from_pretrained(ckpt,
16
  torch_dtype=torch.bfloat16).to("cuda")
17
  processor = AutoProcessor.from_pretrained(ckpt)
18
 
19
+ token = os.getenv('deepseekv2')
20
+ client = InferenceClient(model, token=os.getenv('deepseekv2'))
21
+
22
 
23
  @spaces.GPU
24
  def bot_streaming(message, history, max_new_tokens=250):