"""Gradio launcher for the ``fxmarty/tiny-doc-qa-vision-encoder-decoder`` model.

Executing this file calls ``gr.load`` on the model identifier below with the
``hf-inference`` provider and then calls ``launch()`` on the returned object.
"""

import gradio as gr

# Identifier handed to ``gr.load``; reproduced verbatim, "models/" prefix included.
MODEL_NAME = "models/fxmarty/tiny-doc-qa-vision-encoder-decoder"

# Bind the loaded app to a module-level name so it can be referenced after
# loading instead of being discarded once ``launch()`` is chained onto it.
demo = gr.load(
    MODEL_NAME,
    provider="hf-inference",
)

# Launch is kept at module level (no ``__main__`` guard) so that running or
# importing this file has the same side effect the original script had.
demo.launch()