import gradio as gr

# Load the hosted SmolLM2 instruct model; the returned object is invoked
# directly as a callable inside run_llm below.
this = gr.load("models/HuggingFaceTB/SmolLM2-1.7B-Instruct")

# Emit the loaded object's printed representation to stdout at startup.
print(this)


def run_llm(inp, history):
    """Yield the loaded model's result for one incoming message.

    This is a generator that produces exactly one item per call.

    Args:
        inp: Value forwarded unchanged as the only argument to ``this``.
        history: Unused by this function; it is part of the signature
            because the function is registered as the ``ChatInterface``
            callback.

    Yields:
        Whatever ``this(inp)`` returns.
    """
    reply = this(inp)
    yield reply


# Build the chat UI inside a Blocks context bound to ``app``.
with gr.Blocks() as app:
    chat = gr.ChatInterface(fn=run_llm)

# Start the app; this runs unconditionally when the module is executed.
app.launch()