Silvers-145 committed · Commit d92103a · Parent(s): be91cb0

Update app.py
app.py CHANGED
```diff
@@ -1,12 +1,14 @@
 from huggingface_hub import InferenceClient
 import gradio as gr
+import random
+
+API_URL = "https://api-inference.huggingface.co/models/"
 
 client = InferenceClient(
-    # "mistralai/
+    # "mistralai/Mistral-7B-Instruct-v0.1"
     "Silvers-145/mistral_instruct_generation"
-)
 
-
+)
 
 def format_prompt(message, history):
     prompt = "<s>"
```
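The client now targets the fine-tuned Silvers-145/mistral_instruct_generation model, with the upstream Mistral-7B-Instruct-v0.1 ID left as a comment; note that the new API_URL constant is not referenced in any of the hunks shown. A minimal smoke test of this wiring (hypothetical, not part of the commit, and assuming the model is reachable through the serverless Inference API) might look like:

```python
# Hypothetical smoke test of the client wiring above; assumes the model
# is served via the Hugging Face serverless Inference API.
from huggingface_hub import InferenceClient

client = InferenceClient("Silvers-145/mistral_instruct_generation")
print(client.text_generation("<s>[INST] Say hello. [/INST]", max_new_tokens=32))
```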
```diff
@@ -16,9 +18,7 @@ def format_prompt(message, history):
     prompt += f"[INST] {message} [/INST]"
     return prompt
 
-def generate(
-    prompt, history, system_prompt, temperature=0.9, max_new_tokens=256, top_p=0.95, repetition_penalty=1.0,
-):
+def generate(prompt, history, temperature=0.9, max_new_tokens=512, top_p=0.95, repetition_penalty=1.0):
     temperature = float(temperature)
     if temperature < 1e-2:
         temperature = 1e-2
```
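The body of format_prompt sits outside the changed lines, so only its first and last statements appear as diff context. Judging from those lines it presumably follows the standard Mistral instruct template; a sketch consistent with the visible context (the history loop is an assumption, not part of this diff):

```python
# Sketch of the elided format_prompt body. Only the first and last lines are
# visible in the diff context; the loop over history is assumed from the
# standard Mistral [INST] chat template.
def format_prompt(message, history):
    prompt = "<s>"
    for user_prompt, bot_response in history:
        prompt += f"[INST] {user_prompt} [/INST]"
        prompt += f" {bot_response}</s> "
    prompt += f"[INST] {message} [/INST]"
    return prompt
```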
```diff
@@ -30,10 +30,11 @@ def generate(
         top_p=top_p,
         repetition_penalty=repetition_penalty,
         do_sample=True,
-        seed=
+        seed=random.randint(0, 10**7),
     )
 
-    formatted_prompt = format_prompt(
+    formatted_prompt = format_prompt(prompt, history)
+
     stream = client.text_generation(formatted_prompt, **generate_kwargs, stream=True, details=True, return_full_text=False)
     output = ""
 
```
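The assembly of generate_kwargs and the loop that drains the stream are both cut off by the hunk boundaries. Consistent with the visible keys and the stream=True, details=True call, the surrounding code inside generate() is presumably along these lines (a sketch, not the commit's exact text):

```python
# Sketch of the code the hunk boundaries elide, inside generate(): the dict
# keys match the visible context lines, and the streaming loop shape follows
# text_generation(stream=True, details=True), which yields token details.
generate_kwargs = dict(
    temperature=temperature,
    max_new_tokens=max_new_tokens,
    top_p=top_p,
    repetition_penalty=repetition_penalty,
    do_sample=True,
    seed=random.randint(0, 10**7),  # fresh seed per request: identical prompts can differ
)

output = ""
for response in stream:
    output += response.token.text
    yield output  # stream partial text back to the Gradio chat UI
```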
```diff
@@ -44,11 +45,6 @@ def generate(
 
 
 additional_inputs=[
-    gr.Textbox(
-        label="System Prompt",
-        max_lines=1,
-        interactive=True,
-    ),
     gr.Slider(
         label="Temperature",
         value=0.9,
@@ -60,9 +56,9 @@ additional_inputs=[
     ),
     gr.Slider(
         label="Max new tokens",
-        value=
-        minimum=
-        maximum=
+        value=512,
+        minimum=64,
+        maximum=1024,
         step=64,
         interactive=True,
         info="The maximum numbers of new tokens",
```
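With the System Prompt textbox removed, additional_inputs has to line up with the slimmer generate signature, because gr.ChatInterface passes these values positionally after (message, history). A hypothetical reconstruction of the list's shape (slider bounds other than Max new tokens are illustrative; the remaining entries are elided by the hunk):

```python
# Hypothetical reconstruction: list order must match
# generate(prompt, history, temperature, max_new_tokens, top_p, repetition_penalty).
additional_inputs = [
    gr.Slider(label="Temperature", value=0.9, minimum=0.0, maximum=1.0,
              step=0.05, interactive=True),   # -> temperature (bounds assumed)
    gr.Slider(label="Max new tokens", value=512, minimum=64, maximum=1024,
              step=64, interactive=True),     # -> max_new_tokens (as in the diff)
    # ...sliders for top_p and repetition_penalty presumably follow
    # in the lines the hunk does not show.
]
```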
```diff
@@ -87,19 +83,17 @@ additional_inputs=[
     )
 ]
 
-
-
-
-
-
-
-
+customCSS = """
+#component-7 { # this is the default element ID of the chat component
+    height: 800px; # adjust the height as needed
+    flex-grow: 1;
+}
+"""
+
+with gr.Blocks(css=customCSS) as demo:
+    gr.ChatInterface(
+        generate,
+        additional_inputs=additional_inputs,
+    )
 
-gr.ChatInterface(
-    fn=generate,
-    chatbot=gr.Chatbot(show_label=False, show_share_button=False, show_copy_button=True, likeable=True, layout="panel"),
-    additional_inputs=additional_inputs,
-    title="Mixtral 46.7B",
-    examples=examples,
-    concurrency_limit=20,
-).launch(show_api=False)
+demo.queue().launch(debug=True)
```
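Two notes on the new entry point. First, demo.queue() is what lets the generator-based generate stream into the chat UI. Second, #component-7 is an auto-generated element ID that can shift between Gradio versions, and CSS has no # line comments, so the inline # annotations are parsed as invalid declarations and may swallow the rule that follows. A hardened variant (a sketch, not the commit's code; the chat-panel ID is made up) could pin an explicit elem_id:

```python
# Suggested variant, not in the commit: /* */ CSS comments and a stable,
# explicit elem_id instead of the auto-generated #component-7.
# The "chat-panel" name is hypothetical.
customCSS = """
/* fix the chat area height */
#chat-panel { height: 800px; flex-grow: 1; }
"""

with gr.Blocks(css=customCSS) as demo:
    gr.ChatInterface(
        generate,
        chatbot=gr.Chatbot(elem_id="chat-panel"),
        additional_inputs=additional_inputs,
    )

demo.queue().launch(debug=True)
```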