"""Launch a Gradio app for the ``meta-llama/Llama-3.2-3B`` model.

The app is loaded from the ``models/meta-llama/Llama-3.2-3B`` repo name with
the ``hf-inference`` provider and launched as soon as this file is executed.
"""

import gradio as gr

# NOTE(review): this Hub repo may require authenticated access — confirm that
# a token is configured in the environment where this script runs.
demo = gr.load(
    "models/meta-llama/Llama-3.2-3B",
    provider="hf-inference",
)

# Launch at module level (no __main__ guard) so that executing the file starts
# the app exactly as the original single-expression form did.
demo.launch()