|
import streamlit as st |
|
import tempfile |
|
import udfPreprocess.docPreprocessing as pre |
|
import udfPreprocess.cleaning as clean |
|
|
|
def _load_and_store(file_path, file_name):
    """Load a document, preprocess it and cache the results in session state.

    Calls ``pre.load_document(file_path, file_name)`` and feeds the result to
    ``clean.preprocessing``. The loaded documents are stored under
    ``st.session_state['docs']`` and the paragraph list under
    ``st.session_state['paraList']``.

    Args:
        file_path: Path handed to ``pre.load_document`` as the file location.
        file_name: Name handed to ``pre.load_document`` alongside the path
            (presumably used to detect the file type -- confirm against
            ``udfPreprocess.docPreprocessing``).
    """
    docs = pre.load_document(file_path, file_name)
    # ``clean.preprocessing`` yields four values; only the last one (the
    # paragraph list) is kept, the others are intentionally discarded.
    _haystack_doc, _dataframe_doc, _text_data, para_list = clean.preprocessing(docs)
    st.session_state['docs'] = docs
    st.session_state['paraList'] = para_list


def add_upload(choice):
    """Render the sidebar document picker and load the selected document.

    When ``choice`` is ``'Upload Document'`` a sidebar file uploader (pdf,
    docx, txt) is shown; an uploaded file is written to a temporary file and
    processed from there. For any other ``choice`` a sidebar select box offers
    two bundled sample documents and the selected sample is processed.

    Side effects (all on ``st.session_state``):
        * ``'filename'`` -- the uploaded file's name, or the sample file path.
        * ``'docs'`` and ``'paraList'`` -- set once a document has been loaded
          and preprocessed.

    Args:
        choice: The mode selected by the caller; only the exact value
            ``'Upload Document'`` enables the upload widget.

    Returns:
        None.
    """
    if choice == 'Upload Document':
        uploaded_file = st.sidebar.file_uploader(
            'Upload the File', type=['pdf', 'docx', 'txt'])
        if uploaded_file is None:
            # Nothing uploaded yet: leave the session state untouched.
            return

        with tempfile.NamedTemporaryFile(mode="wb") as temp:
            temp.write(uploaded_file.getvalue())
            # The loader re-opens the file by path, so buffered bytes must be
            # pushed to disk first; otherwise it may read a truncated file.
            temp.flush()
            st.session_state['filename'] = uploaded_file.name
            # Processing stays inside the ``with`` block because the temporary
            # file is deleted as soon as the block exits.
            _load_and_store(temp.name, uploaded_file.name)
        return

    option = st.sidebar.selectbox(
        'Select the example document',
        ('South Africa:Low Emission strategy',
         'Ethiopia: 10 Year Development Plan'))

    # Compare by value (``==``); identity comparison (``is``) against a string
    # literal is implementation-dependent and must not be used here.
    if option == 'South Africa:Low Emission strategy':
        file_name = file_path = 'sample/South Africa_s Low Emission Development Strategy.txt'
    else:
        file_name = file_path = 'sample/Ethiopia_s_2021_10 Year Development Plan.txt'
    st.session_state['filename'] = file_name

    if option is not None:
        _load_and_store(file_path, file_name)
|
|
|
|