Update app.py
app.py CHANGED
@@ -1,13 +1,18 @@
 import gradio as gr
 from vllm import LLM
 from vllm.sampling_params import SamplingParams
+import torch
 import spaces
+
 # Define the model and sampling parameters
 model_name = "mistralai/Ministral-8B-Instruct-2410"
 sampling_params = SamplingParams(max_tokens=8192)
 
-#
-
+# Check if GPU is available
+device = "cuda" if torch.cuda.is_available() else "cpu"
+
+# Initialize the LLM model with the specified device
+llm = LLM(model=model_name, tokenizer_mode="mistral", config_format="mistral", load_format="mistral", device=device)
 
 @spaces.GPU
 # Define the chatbot function
@@ -46,4 +51,4 @@ with gr.Blocks() as demo:
 txt.submit(chatbot, [txt, chatbot], [chatbot, txt])
 
 # Launch the Gradio interface
-demo.launch()
+demo.launch()
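The hunks above never show the body of the chatbot function, but the context lines (`txt.submit(chatbot, [txt, chatbot], [chatbot, txt])` and the `@spaces.GPU` decorator) indicate how the module-level `llm` and `sampling_params` are meant to be used. A minimal sketch follows, assuming a vLLM version that provides `LLM.chat` and a Gradio tuple-style chat history; the function signature is inferred from the submit wiring, not taken from the diff:

```python
import spaces

@spaces.GPU
def chatbot(message, history):
    # Rebuild an OpenAI-style message list from the Gradio history
    messages = []
    for user_msg, bot_msg in history:
        messages.append({"role": "user", "content": user_msg})
        messages.append({"role": "assistant", "content": bot_msg})
    messages.append({"role": "user", "content": message})

    # llm.chat applies the model's chat template before generating
    outputs = llm.chat(messages, sampling_params=sampling_params)
    reply = outputs[0].outputs[0].text

    history.append((message, reply))
    return history, ""  # updated Chatbot history, cleared textbox
```

One caveat on the design: on ZeroGPU Spaces the GPU is only attached while a `@spaces.GPU`-decorated function is running, so a device probe executed at import time, as the new `torch.cuda.is_available()` check is, may not reflect the device the decorated function actually runs on. Whether that interacts with this Space's build error cannot be determined from the diff alone.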