AnishHF committed on
Commit
a3606dd
1 Parent(s): 2bc1680

Update app.py

Files changed (1)
  1. app.py +8 -13
app.py CHANGED
@@ -2,22 +2,17 @@ import gradio as gr
 from transformers import AutoTokenizer, AutoModelForCausalLM
 
 # Load the tokenizer and model
-tokenizer = AutoTokenizer.from_pretrained("mistralai/Mistral-7B-v0.1")
-model = AutoModelForCausalLM.from_pretrained("mistralai/Mistral-7B-v0.1", device_map="auto")
+model_id = "mistralai/Mixtral-8x22B-v0.1"
+tokenizer = AutoTokenizer.from_pretrained(model_id)
+model = AutoModelForCausalLM.from_pretrained(model_id)
 
 # Function to generate text using the model
 def generate_text(prompt, max_length=500, temperature=0.7, top_k=50, top_p=0.95, num_return_sequences=1):
-    input_ids = tokenizer.encode(prompt, return_tensors="pt")
-    output = model.generate(
-        input_ids,
-        max_length=max_length,
-        temperature=temperature,
-        top_k=top_k,
-        top_p=top_p,
-        num_return_sequences=num_return_sequences,
-    )
-    generated_text = tokenizer.batch_decode(output, skip_special_tokens=True)[0]
-    return generated_text
+    text = prompt
+    inputs = tokenizer(text, return_tensors="pt")
+
+    outputs = model.generate(**inputs, max_new_tokens=20)
+    return tokenizer.decode(outputs[0], skip_special_tokens=True)
 
 # Create the Gradio interface
 iface = gr.Interface(
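
Note on the updated hunk (a reviewer's sketch, not part of the commit): generate_text() still accepts max_length, temperature, top_k, top_p, and num_return_sequences, but its new body calls model.generate(**inputs, max_new_tokens=20), so all of those arguments are silently ignored. If the previous sampling behavior is still wanted, the parameters could be forwarded explicitly, for example:

# Sketch only, assuming the tokenizer and model defined in app.py above
def generate_text(prompt, max_length=500, temperature=0.7, top_k=50, top_p=0.95, num_return_sequences=1):
    inputs = tokenizer(prompt, return_tensors="pt")
    outputs = model.generate(
        **inputs,
        max_length=max_length,
        temperature=temperature,
        top_k=top_k,
        top_p=top_p,
        num_return_sequences=num_return_sequences,
        do_sample=True,  # temperature/top_k/top_p only take effect when sampling is enabled
    )
    # Decode only the first returned sequence, matching the committed code
    return tokenizer.decode(outputs[0], skip_special_tokens=True)

The update also drops device_map="auto" from from_pretrained(). Without it, the full model is loaded into CPU memory, and Mixtral-8x22B has about 141B parameters (roughly 280 GB of weights in bfloat16 alone), so some form of device mapping, offloading, or quantization will likely still be needed to serve this Space.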