Spaces:

Daoneeee
/

task_Chatbot

Sleeping

Daoneeee committed on Nov 21, 2023

Commit

62f948e

1 Parent(s): 0db9945

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -125,25 +125,36 @@ def main():
         st.subheader("Your documents")
         docs = st.file_uploader(
             "Upload your PDFs here and click on 'Process'", accept_multiple_files=True)
-        # 'Process' 버튼 블록 내에서
         if st.button("Process"):
             with st.spinner("Processing"):
                 doc_list = []
                 for file in docs:
                     if file.type == 'text/plain':
                         doc_list.extend(get_text_file(file))
                     elif file.type in ['application/octet-stream', 'application/pdf']:
                         doc_list.extend(get_pdf_text(file))
                     elif file.type == 'text/csv':
                         doc_list.extend(get_csv_file(file))
                     elif file.type == 'application/json':
                         doc_list.extend(get_json_file(file))
                 text_chunks = get_text_chunks(doc_list)
                 vectorstore = get_vectorstore(text_chunks)
-                st.session_state.conversation = get_conversation_chain(vectorstore)
 if __name__ == '__main__':
-    main()

         st.subheader("Your documents")
         docs = st.file_uploader(
             "Upload your PDFs here and click on 'Process'", accept_multiple_files=True)
         if st.button("Process"):
             with st.spinner("Processing"):
+                # get pdf text
                 doc_list = []
                 for file in docs:
+                    print('file - type : ', file.type)
                     if file.type == 'text/plain':
+                        # file is .txt
                         doc_list.extend(get_text_file(file))
                     elif file.type in ['application/octet-stream', 'application/pdf']:
+                        # file is .pdf
                         doc_list.extend(get_pdf_text(file))
                     elif file.type == 'text/csv':
+                        # file is .csv
                         doc_list.extend(get_csv_file(file))
                     elif file.type == 'application/json':
+                        # file is .json
                         doc_list.extend(get_json_file(file))
+                # get the text chunks
                 text_chunks = get_text_chunks(doc_list)
+                # create vector store
                 vectorstore = get_vectorstore(text_chunks)
+                # create conversation chain
+                st.session_state.conversation = get_conversation_chain(
+                    vectorstore)
 if __name__ == '__main__':
+    main()