# Mistral-7B / app.py
import os
import torch
import gradio as gr
from transformers import AutoTokenizer, AutoModelForCausalLM, QuantoConfig
# Read the gated-repo access token from the Space's environment secrets
access_token = os.environ["GATED_ACCESS_TOKEN"]
# Quantize the model weights to int4 with Quanto to reduce memory use
quantization_config = QuantoConfig(weights="int4")
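# Alternative quantization path (a sketch, not part of the original app): on a
# CUDA-equipped runtime, bitsandbytes 4-bit loading could be swapped in for
# Quanto via a BitsAndBytesConfig:
#   from transformers import BitsAndBytesConfig
#   quantization_config = BitsAndBytesConfig(load_in_4bit=True)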
# Load the gated Mistral-7B-Instruct model and its tokenizer
model = AutoModelForCausalLM.from_pretrained(
    "mistralai/Mistral-7B-Instruct-v0.1",
    quantization_config=quantization_config,
    device_map="auto",
    token=access_token,
)
tokenizer = AutoTokenizer.from_pretrained("mistralai/Mistral-7B-Instruct-v0.1", token=access_token)
# Generate a completion for the given prompt
def generate_text(prompt):
    # Tokenize the prompt and move the tensors to the model's device,
    # which may be a GPU when device_map="auto" places it there
    inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
    outputs = model.generate(**inputs, max_new_tokens=512)
    return tokenizer.decode(outputs[0], skip_special_tokens=True)
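# Mistral-7B-Instruct is tuned on the [INST] chat format, which the raw prompt
# above does not apply. A minimal sketch of a variant (hypothetical helper, not
# in the original app) that wraps the prompt with the tokenizer's chat
# template, assuming a transformers version providing apply_chat_template:
def generate_chat_text(prompt):
    # Wrap the raw prompt as a single-turn user message
    messages = [{"role": "user", "content": prompt}]
    input_ids = tokenizer.apply_chat_template(messages, return_tensors="pt").to(model.device)
    outputs = model.generate(input_ids, max_new_tokens=512)
    return tokenizer.decode(outputs[0], skip_special_tokens=True)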
# Create the Gradio interface (gr.inputs/gr.outputs were removed in Gradio 3+)
iface = gr.Interface(
    fn=generate_text,
    inputs=gr.Textbox(lines=5, label="Input Prompt"),
    outputs=gr.Textbox(label="Generated Text"),
    title="Mistral-7B Text Generation",
    description="Use this interface to generate text with the Mistral-7B Instruct language model.",
)
# Launch the Gradio interface
iface.launch()