"""Serve the hosted StableCode instruct model through a Gradio interface.

Also provides ``generate_tokens``, a helper wrapping the sampling call that
was previously written as loose module-level statements referencing the
undefined names ``model`` and ``inputs``.
"""

import gradio as gr


def generate_tokens(
    model,
    inputs,
    *,
    max_new_tokens=480,
    temperature=0.2,
    do_sample=True,
):
    """Move *model* to the GPU and return the result of ``model.generate``.

    Args:
        model: Object exposing ``cuda()`` and ``generate(**kwargs)``;
            presumably a Hugging Face causal LM -- TODO confirm with caller.
        inputs: Mapping unpacked as keyword arguments into
            ``model.generate``; presumably tokenizer output that already
            lives on the same device as the model -- TODO confirm.
        max_new_tokens: Forwarded unchanged to ``model.generate``.
        temperature: Forwarded unchanged to ``model.generate``.
        do_sample: Forwarded unchanged to ``model.generate``.

    Returns:
        Whatever ``model.generate`` returns.
    """
    model.cuda()
    return model.generate(
        **inputs,
        max_new_tokens=max_new_tokens,
        temperature=temperature,
        do_sample=do_sample,
    )


# Kept as the last statement: nothing after launch() is expected to run while
# the app is being served.
# NOTE(review): newer Gradio releases appear to favour `gr.load(...)` over
# `gr.Interface.load(...)` -- confirm against the installed Gradio version.
gr.Interface.load("models/stabilityai/stablecode-instruct-alpha-3b").launch()