"""Minimal Gradio chat app that forwards each message to SmolLM2-1.7B-Instruct."""

import gradio as gr

# Load the model once at import time; run_llm reuses this object on every call.
this = gr.load("models/HuggingFaceTB/SmolLM2-1.7B-Instruct")
print(this)  # startup diagnostic: show what gr.load returned


def run_llm(inp, history):
    """Produce a reply for the latest chat message.

    Args:
        inp: The message handed over by ``gr.ChatInterface`` (presumably the
            user's text -- confirm against the Gradio version in use).
        history: The conversation so far, as supplied by
            ``gr.ChatInterface``. It is accepted to satisfy the callback
            signature but is not used; only ``inp`` is passed to the model.

    Yields:
        The result of calling the loaded model with ``inp``, exactly once.
    """
    out = this(inp)
    print(out)  # echo the reply to stdout for debugging
    yield out


with gr.Blocks() as app:
    chat = gr.ChatInterface(
        fn=run_llm,
    )

app.launch()