"""Launch a Gradio web demo for the openbmb/MiniCPM-Llama3-V-2_5-int4 model."""

import gradio as gr

# Build the demo from the model identifier. The "models/" prefix is how
# gr.load is told to treat the remainder as a Hugging Face Hub model repo
# (per the Gradio docs; confirm against the installed Gradio version).
demo = gr.load("models/openbmb/MiniCPM-Llama3-V-2_5-int4")

# Start serving immediately at module level, exactly as the original one-liner
# did, so running this file as a script brings the app up.
demo.launch()