-
Notifications
You must be signed in to change notification settings - Fork 7
/
app.py
118 lines (95 loc) · 3.96 KB
/
app.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
import streamlit as st
from dotenv import load_dotenv
import pickle
from PyPDF2 import PdfReader
from streamlit_extras.add_vertical_space import add_vertical_space
from langchain.text_splitter import RecursiveCharacterTextSplitter
from langchain.embeddings.openai import OpenAIEmbeddings
from langchain.vectorstores import FAISS
from langchain.llms import OpenAI
from langchain.chains.question_answering import load_qa_chain
from langchain.callbacks import get_openai_callback
import os
st.set_page_config(page_title='🤗💬 PDF Chat App - GPT')
# Sidebar contents
with st.sidebar:
st.title('🤗💬 PDF Chat App')
st.markdown('''
## About
This app is an LLM-powered chatbot built using:
- [Streamlit](https://streamlit.io/)
- [LangChain](https://python.langchain.com/)
- [OpenAI](https://platform.openai.com/docs/models) LLM model
''')
add_vertical_space(5)
st.write('Made with ❤️ by [Livia Ellen](https://liviaellen.com/portfolio)')
def main():
st.header("Talk to your PDF 💬")
st.write("This app uses OpenAI's LLM model to answer questions about your PDF file. Upload your PDF file and ask questions about it. The app will return the answer from your PDF file.")
st.header("1. Pass your OPEN AI API KEY here")
v='demo'
openai_key=st.text_input("**OPEN AI API KEY**", value=v)
st.write("You can get your OpenAI API key from [here](https://platform.openai.com/account/api-keys)")
if openai_key==v:
openai_key=st.secrets["OPENAI_API_KEY"]
# if openai_key=='':
# load_dotenv()
os.environ["OPENAI_API_KEY"] = openai_key
# upload a PDF file
st.header("2. Upload PDF")
pdf = st.file_uploader("**Upload your PDF**", type='pdf')
# st.write(pdf)
if pdf is not None:
pdf_reader = PdfReader(pdf)
text = ""
for page in pdf_reader.pages:
text += page.extract_text()
text_splitter = RecursiveCharacterTextSplitter(
chunk_size=1000,
chunk_overlap=200,
length_function=len
)
chunks = text_splitter.split_text(text=text)
# # embeddings
store_name = pdf.name[:-4]
st.write(f'{store_name}')
# st.write(chunks)
if os.path.exists(f"{store_name}.pkl"):
with open(f"{store_name}.pkl", "rb") as f:
VectorStore = pickle.load(f)
# st.write('Embeddings Loaded from the Disk')s
else:
embeddings = OpenAIEmbeddings()
VectorStore = FAISS.from_texts(chunks, embedding=embeddings)
with open(f"{store_name}.pkl", "wb") as f:
pickle.dump(VectorStore, f)
# embeddings = OpenAIEmbeddings()
# VectorStore = FAISS.from_texts(chunks, embedding=embeddings)
# st.header("or.. Try it with this The Alchaemist PDF book")
# if st.button('Ask The Alchemist Book Questions'):
# with open("The_Alchemist.pkl", "rb") as f:
# VectorStore = pickle.load(f)
# Accept user questions/query
st.header("3. Ask questions about your PDF file:")
q="Tell me about the content of the PDF"
query = st.text_input("Questions",value=q)
# st.write(query)
if st.button("Ask"):
# st.write(openai_key)
# os.environ["OPENAI_API_KEY"] = openai_key
if openai_key=='':
st.write('Warning: Please pass your OPEN AI API KEY on Step 1')
else:
docs = VectorStore.similarity_search(query=query, k=3)
llm = OpenAI()
chain = load_qa_chain(llm=llm, chain_type="stuff")
with get_openai_callback() as cb:
response = chain.run(input_documents=docs, question=query)
print(cb)
st.header("Answer:")
st.write(response)
st.write('--')
st.header("OpenAI API Usage:")
st.text(cb)
if __name__ == '__main__':
main()