SreyanG-NVIDIA committed on
Commit
d9be71a
·
verified ·
1 Parent(s): 94b4ec9

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +5 -4
app.py CHANGED
@@ -15,14 +15,15 @@ MODEL_BASE_THINK = os.path.join(MODEL_BASE_SINGLE, 'stage35')
15
  # model_single = llava.load(MODEL_BASE_SINGLE, model_base=None, devices=[0])
16
  model_single = llava.load(MODEL_BASE_SINGLE, model_base=None)
17
  model_single = model_single.to("cuda")
 
18
 
19
  generation_config_single = model_single.default_generation_config
20
 
21
  model_think = PeftModel.from_pretrained(
22
  model_single,
23
- MODEL_BASE_THINK,
24
- device_map="auto",
25
- torch_dtype=torch.float16,
26
  )
27
 
28
  # # ---------------------------------
@@ -40,7 +41,7 @@ def single_turn_infer(audio_file, prompt_text):
40
  try:
41
  sound = llava.Sound(audio_file)
42
  full_prompt = f"<sound>\n{prompt_text}"
43
- response = model_single.generate_content([sound, full_prompt], generation_config=generation_config_single)
44
  return response
45
  except Exception as e:
46
  return f"❌ Error: {str(e)}"
 
15
  # model_single = llava.load(MODEL_BASE_SINGLE, model_base=None, devices=[0])
16
  model_single = llava.load(MODEL_BASE_SINGLE, model_base=None)
17
  model_single = model_single.to("cuda")
18
+ model_single_copy = copy.deepcopy(model_single)
19
 
20
  generation_config_single = model_single.default_generation_config
21
 
22
  model_think = PeftModel.from_pretrained(
23
  model_single,
24
+ MODEL_BASE_THINK,
25
+ device_map="auto",
26
+ torch_dtype=torch.float16,
27
  )
28
 
29
  # # ---------------------------------
 
41
  try:
42
  sound = llava.Sound(audio_file)
43
  full_prompt = f"<sound>\n{prompt_text}"
44
+ response = model_single_copy.generate_content([sound, full_prompt], generation_config=generation_config_single)
45
  return response
46
  except Exception as e:
47
  return f"❌ Error: {str(e)}"