testingoriginal / app.py
theailearner's picture
Update app.py
42ddbf6 verified
raw
history blame contribute delete
No virus
2.43 kB
import gradio as gr
from huggingface_hub import InferenceClient
"""
For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
"""
# Identifier of the hosted model that every chat completion request is sent to.
MODEL_ID = "unsloth/llama-3-8b-bnb-4bit"

# Single shared inference client, created once at import time.
client = InferenceClient(model=MODEL_ID)
def respond(
    message,
    history: list[tuple[str, str]],
    system_message,
    max_tokens,
    temperature,
    top_p,
):
    """Stream the assistant's reply to ``message``, yielding the text so far.

    Args:
        message: The user's newest message.
        history: Earlier turns as ``(user_text, assistant_text)`` pairs; a
            falsy entry on either side of a pair is left out of the prompt.
        system_message: Content of the leading ``system`` message.
        max_tokens: Forwarded to ``client.chat_completion`` as ``max_tokens``.
        temperature: Forwarded to ``client.chat_completion`` as ``temperature``.
        top_p: Forwarded to ``client.chat_completion`` as ``top_p``.

    Yields:
        The reply accumulated so far, once for each streamed chunk that
        carries at least one choice.
    """
    messages = [{"role": "system", "content": system_message}]
    for turn in history:
        user_text, assistant_text = turn[0], turn[1]
        if user_text:
            messages.append({"role": "user", "content": user_text})
        if assistant_text:
            messages.append({"role": "assistant", "content": assistant_text})
    messages.append({"role": "user", "content": message})

    response = ""
    # The loop variable is deliberately not called ``message`` so the
    # function parameter is not rebound while streaming.
    for chunk in client.chat_completion(
        messages,
        max_tokens=max_tokens,
        stream=True,
        temperature=temperature,
        top_p=top_p,
    ):
        if not chunk.choices:
            # Nothing to read from this chunk; indexing [0] would raise.
            continue
        token = chunk.choices[0].delta.content
        # A streamed delta may carry no text (content of None or "");
        # concatenating None onto a str would raise TypeError.
        if token:
            response += token
        yield response
"""
For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
"""
# Default text of the "System message" box; sent as the system prompt.
# NOTE(review): this prompt tells the model to give diagnoses and not to refer
# users to a doctor — confirm that is intended before exposing this publicly.
DEFAULT_SYSTEM_MESSAGE = (
    "You are the world's best doctor. "
    "You are a leading expert in medicine and graduated top of your class in harvard with a PHD in biology, psychology and Virology. "
    "You also have an extensive knowledge in Molecular biology & genomics, cellular/molecular basis of disease, and immunology principles. "
    "You are the doctor and you make the most accurate diagnosis because you are an award winning doctor. "
    "Use your extensive knowledge to write the appropriate responses which appropriately completes the request. "
    "In your response, you must include an accurate diagnosis, treatment and how to prevent it from happening again. "
    "Also since you are a doctor, you don't need to tell them to see a doctor. "
    "You are a friendly doctor chatbot who should act as a human."
)

# Extra controls, listed in the order `respond` receives them after
# (message, history): system_message, max_tokens, temperature, top_p.
system_message_box = gr.Textbox(value=DEFAULT_SYSTEM_MESSAGE, label="System message")
max_tokens_slider = gr.Slider(
    minimum=1,
    maximum=2048,
    value=512,
    step=1,
    label="Max new tokens",
)
temperature_slider = gr.Slider(
    minimum=0.1,
    maximum=4.0,
    value=0.7,
    step=0.1,
    label="Temperature",
)
top_p_slider = gr.Slider(
    minimum=0.1,
    maximum=1.0,
    value=0.95,
    step=0.05,
    label="Top-p (nucleus sampling)",
)

# Chat UI that calls `respond` for each user message.
demo = gr.ChatInterface(
    respond,
    additional_inputs=[
        system_message_box,
        max_tokens_slider,
        temperature_slider,
        top_p_slider,
    ],
)

# Launch the app only when this file is run as a script, not on import.
if __name__ == "__main__":
    demo.launch()