import streamlit as st
import chatbot as demo_chat
from transformers import pipeline

st.title("Hi, I am Chatbot Philio :mermaid:")
st.write("I am your hotel booking assistant for today.")

# Load the tokenizer and model from the companion chatbot module.
# tokenizer = AutoTokenizer.from_pretrained("KvrParaskevi/Hotel-Assistant-Attempt4-Llama-2-7b")
tokenizer, model = demo_chat.load_model()

model_identifier = "KvrParaskevi/Hotel-Assistant-Attempt4-Llama-2-7b"
task = "text-generation"  # Change this to your model's task

# Wrap the model in a pipeline (currently unused below; generation goes
# through model.generate() directly).
model_pipeline = pipeline(task, model=model, tokenizer=tokenizer)

# Application
with st.container():
    # The original inline HTML string passed here was lost during extraction;
    # a plain <div> stands in as a placeholder wrapper.
    st.markdown('<div>', unsafe_allow_html=True)

    # LangChain memory in session cache
    if 'memory' not in st.session_state:
        st.session_state.memory = demo_chat.demo_miny_memory(model)

    # Initialize the chat history if it does not exist in this session
    if 'chat_history' not in st.session_state:
        st.session_state.chat_history = [
            {
                "role": "system",
                "content": "You are a friendly chatbot who always helps the user book a hotel room "
                           "based on his/her needs. Based on the current social norms you wait for "
                           "the user's response to your proposals.",
            },
            {"role": "assistant", "content": "Hello, how can I help you today?"},
        ]

    # Cache the model in the session state
    if 'model' not in st.session_state:
        st.session_state.model = model

    # Render the chat history, skipping the system prompt
    for message in st.session_state.chat_history:
        if message["role"] != "system":
            with st.chat_message(message["role"]):
                st.write(message["content"])

    # Set up the input text field
    input_text = st.chat_input(placeholder="Here you can chat with our hotel booking model.")

    if input_text:
        with st.chat_message("user"):
            st.write(input_text)
        # Append the user message to the chat history
        st.session_state.chat_history.append({"role": "user", "content": input_text})

        # Earlier LangChain-based path, kept for reference:
        # chat_response = demo_chat.demo_chain(input_text=input_text, memory=st.session_state.memory, model=chat_model)
        # first_answer = chat_response.split("Human")[0]  # predict() returns the whole conversation, so keep only the first answer

        # Build the prompt from the full history and generate a reply.
        tokenized_chat = tokenizer.apply_chat_template(
            st.session_state.chat_history,
            tokenize=True,
            add_generation_prompt=True,
            return_tensors="pt",
        )
        # st.write(tokenizer.decode(tokenized_chat[0]))  # debug: inspect the rendered prompt
        outputs = model.generate(tokenized_chat, max_new_tokens=128)
        # Decode only the newly generated tokens, i.e. everything after the prompt.
        first_answer = tokenizer.decode(outputs[0][tokenized_chat.shape[1]:], skip_special_tokens=True)

        with st.chat_message("assistant"):
            st.write(first_answer)
        st.session_state.chat_history.append({"role": "assistant", "content": first_answer})

    st.markdown('</div>', unsafe_allow_html=True)
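
# ---------------------------------------------------------------------------
# For reference, a minimal sketch of the companion `chatbot.py` module that
# this app imports as `demo_chat`. The actual module is not part of this
# file, so the bodies below are assumptions inferred from how load_model()
# and demo_miny_memory() are called above, not the real implementation.
# ---------------------------------------------------------------------------
# import torch
# from transformers import AutoModelForCausalLM, AutoTokenizer
# from langchain.memory import ConversationBufferMemory
#
# MODEL_ID = "KvrParaskevi/Hotel-Assistant-Attempt4-Llama-2-7b"
#
# def load_model():
#     """Return a (tokenizer, model) pair for the hotel-assistant checkpoint."""
#     tokenizer = AutoTokenizer.from_pretrained(MODEL_ID)
#     model = AutoModelForCausalLM.from_pretrained(MODEL_ID, torch_dtype=torch.float16)
#     return tokenizer, model
#
# def demo_miny_memory(model):
#     """Return a small LangChain buffer memory for the session. The `model`
#     argument is accepted only to match the call site; this sketch ignores it."""
#     return ConversationBufferMemory(memory_key="chat_history", return_messages=True)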