"""Gradio demo that answers free-text questions with Dolly v2 (3B)."""

import gradio as gr
import torch
from transformers import pipeline

# Instruction-following text-generation pipeline, built once at import time
# and reused for every request.
# NOTE(review): trust_remote_code=True runs the pipeline code shipped in the
# model repository; consider pinning a `revision` so that code cannot change
# underneath the app.
ans = pipeline(
    model="databricks/dolly-v2-3b",
    torch_dtype=torch.bfloat16,
    trust_remote_code=True,
    device_map="auto",
)


def answer(query: str) -> str:
    """Return the model's generated answer for *query* as plain text.

    Args:
        query: The question or instruction typed into the UI.

    Returns:
        The generated text of the first result, or an empty string when
        the query is blank or the pipeline produced no result.
    """
    # Skip inference entirely when there is no instruction to answer.
    if not query or not query.strip():
        return ""

    results = ans(query)
    if not results:
        return ""

    # The pipeline yields a list of {"generated_text": ...} dicts; returning
    # that list directly would make the text output show its repr instead of
    # the answer itself.
    return results[0]["generated_text"]


Demo = gr.Interface(
    fn=answer,
    inputs='text',
    outputs='text',
    examples=[['What is the capital of India ?']],
)

Demo.launch()