# Minimal Gradio app: load a hosted model as a ready-made demo and serve it.
import gradio as gr

# The "models/" prefix names a Hugging Face Hub model (google/flan-t5-base);
# requests are routed through the "hf-inference" provider.
demo = gr.load(
    "models/google/flan-t5-base",
    provider="hf-inference",
)

# Start serving the loaded demo.
demo.launch()