# Minimal Gradio launcher: builds a demo from a model identifier and serves it.
import gradio as gr

# Identifier passed to gr.load().
# NOTE(review): the "models/" prefix presumably selects a Hugging Face Hub
# model per Gradio's loader conventions -- confirm against the installed
# Gradio version.
demo = gr.load("models/unsloth/llama-3-8b-bnb-4bit")

# Start the web UI with default launch settings.
demo.launch()