"""Gradio app that serves the BSC-LT/salamandra-2b-instruct model."""

import gradio as gr

# Build the interface from the model identifier; inference is requested
# through the "hf-inference" provider rather than running locally
# (per the gr.load API -- confirm against the installed Gradio version).
demo = gr.load(
    "models/BSC-LT/salamandra-2b-instruct",
    provider="hf-inference",
)

# Launch at module level, exactly as the original script did, so running
# this file directly starts the web server.
demo.launch()