Spaces:

Vishnu-add
/

chat-with-doc

Sleeping

App Files Files Community

chat-with-doc / chatbot.py

Vishnu-add

Upload 15 files

0b5fda4 11 months ago

raw

history blame contribute delete

3.02 kB

	import streamlit as st
	from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
	from transformers import pipeline
	import torch
	import base64
	import textwrap
	from langchain.embeddings import SentenceTransformerEmbeddings
	from langchain.vectorstores import Chroma
	from langchain.llms.huggingface_pipeline import HuggingFacePipeline
	from langchain.chains import RetrievalQA
	from streamlit_chat import message

	# device = torch.device('cpu')
	device = torch.device('cuda:0')


	checkpoint = "LaMini-T5-738M"
	tokenizer = AutoTokenizer.from_pretrained(checkpoint)
	base_model = AutoModelForSeq2SeqLM.from_pretrained(
	checkpoint,
	device_map=device,
	torch_dtype = torch.float32,
	# offload_folder= "/model_ck"
	)

	@st.cache_resource
	def llm_pipeline():
	pipe = pipeline(
	'text2text-generation',
	model = base_model,
	tokenizer=tokenizer,
	max_length = 256,
	do_sample = True,
	temperature = 0.3,
	top_p = 0.95,
	)

	local_llm = HuggingFacePipeline(pipeline = pipe)
	return local_llm

	@st.cache_resource
	def qa_llm():
	llm = llm_pipeline()
	embeddings = SentenceTransformerEmbeddings(model_name="all-MiniLM-L6-v2")
	db = Chroma(persist_directory="db", embedding_function = embeddings)
	retriever = db.as_retriever()
	qa = RetrievalQA.from_chain_type(
	llm=llm,
	chain_type = "stuff",
	retriever = retriever,
	return_source_documents=True
	)
	return qa


	def process_answer(instruction):
	response=''
	instruction = instruction
	qa = qa_llm()
	generated_text = qa(instruction)
	answer = generated_text['result']
	return answer, generated_text

	# Display conversation history using Streamlit messages
	def display_conversation(history):
	for i in range(len(history["generated"])):
	message(history["past"][i] , is_user=True, key= str(i) + "_user")
	message(history["generated"][i] , key= str(i))


	def main():
	st.title("Chat with your pdf📚")
	with st.expander("About the App"):
	st.markdown(
	"""
	This is a Generative AI powered Question and Answering app that responds to questions about your PDF file.
	"""
	)

	user_input = st.text_input("",key="input")

	# Initialize session state for generated responses and past messages
	if "generated" not in st.session_state:
	st.session_state["generated"] = ["I am ready to help you"]
	if "past" not in st.session_state:
	st.session_state["past"] = ["Hey There!"]

	# Search the database for a response based on user input and update session state
	if user_input:
	answer = process_answer({"query" : user_input})
	st.session_state["past"].append(user_input)
	response = answer
	st.session_state["generated"].append(response)

	# Display Conversation history using Streamlit messages
	if st.session_state["generated"]:
	display_conversation(st.session_state)



	if __name__ == "__main__":
	main()