Spaces:

Effyis
/

AGDS-UI

Sleeping

App Files Files Community

Nechba committed on Jun 21, 2024

Commit

c1903e3

1 Parent(s): f31bfcd

add text area option

Browse files

Files changed (4) hide show

app.py +38 -20
utlis/__pycache__/constant.cpython-39.pyc +0 -0
utlis/__pycache__/helper.cpython-39.pyc +0 -0
utlis/helper.py +27 -0

app.py CHANGED Viewed

@@ -33,11 +33,21 @@ with st.sidebar:
         if len(services)>0:
-            st.session_state.uploaded_files = st.file_uploader("Upload PDF file",  type=["pdf","txt"], accept_multiple_files=False)
-            if st.session_state.uploaded_files:
-                st.session_state.process = st.button('Process')
-                if st.session_state.process:
-                    add_document(st.session_state.token,st.session_state.service)
     elif st.session_state.genre=="Select document":
         st.title('Scrape Document')
@@ -69,7 +79,8 @@ with st.sidebar:
                 st.session_state.method = st.selectbox("Chunking Method", ["chunk_per_page", "personalize_chunking"])
                 if st.session_state.method=="personalize_chunking":
                     st.session_state.split_token = st.text_area("Split Token")
-            elif st.session_state.doument_slected_to_chat.split("_")[-1]=="txt":
                 st.session_state.method = st.selectbox("Chunking Method", ["personalize_chunking"])
                 st.session_state.split_token = st.text_area("Split Token")
         else:
@@ -160,6 +171,12 @@ st.markdown(css_style, unsafe_allow_html=True)
 with st.container():
     st.markdown('<h1 class="title">Augmented Generative Document Scraper</h1>', unsafe_allow_html=True)
     if st.session_state.genre=="Select document" and st.session_state.service_slected_to_chat:
         schema = display_and_validate_schema()
         comments = None
@@ -182,7 +199,8 @@ with st.container():
                 headers = {'Content-Type': 'application/json'}
                 response  = requests.get(RESPONSE_API,data=json_data, headers=headers)
                 response_data = json.loads(response.text)
-            elif st.session_state.doument_slected_to_chat.split("_")[-1]=="txt":
                 data = {"token": st.session_state.token,
                 "service_name": st.session_state.service_slected_to_chat,
                 "document_name": st.session_state.doument_slected_to_chat,
@@ -195,18 +213,18 @@ with st.container():
                 headers = {'Content-Type': 'application/json'}
                 response  = requests.get(RESPONSE_TXT_API,data=json_data, headers=headers)
                 response_data = json.loads(response.text)
-            if response_data.get('status')=='success':
-                json_str =response_data.get("json")
-                json_str_formatted = json.dumps(json_str)
-                # Encode this JSON string to bytes, which is required for the download
-                json_bytes = json_str_formatted.encode('utf-8')
-                st.download_button(
-                    label="Download JSON",
-                    data=json_bytes,
-                    file_name="results.json",
-                    mime="application/json"
-                )
-            else:
-                st.error("Error in processing document")

         if len(services)>0:
+            st.session_state.doc_ortext = st.radio("Choose option",["Documnt", "Text area"])
+            if st.session_state.doc_ortext=="Documnt":
+                st.session_state.uploaded_files = st.file_uploader("Upload PDF file",  type=["pdf","txt"], accept_multiple_files=False)
+                if st.session_state.uploaded_files:
+                    st.session_state.process = st.button('Process')
+                    if st.session_state.process:
+                        add_document(st.session_state.token,st.session_state.service)
+            # elif st.session_state.doc_ortext=="Text area":
+            #     st.session_state.name_text_area = st.container().text_area("Enter name of the text area")
+            #     st.session_state.text_area = st.container().text_area("Enter text")
+            #     if st.session_state.text_area:
+            #         st.session_state.process = st.container().button('Process')
+            #         if st.session_state.process:
+            #             add_text_document(st.session_state.token,st.session_state.service)
     elif st.session_state.genre=="Select document":
         st.title('Scrape Document')
                 st.session_state.method = st.selectbox("Chunking Method", ["chunk_per_page", "personalize_chunking"])
                 if st.session_state.method=="personalize_chunking":
                     st.session_state.split_token = st.text_area("Split Token")
+            #elif st.session_state.doument_slected_to_chat.split("_")[-1]=="txt":
+            else:
                 st.session_state.method = st.selectbox("Chunking Method", ["personalize_chunking"])
                 st.session_state.split_token = st.text_area("Split Token")
         else:
 with st.container():
     st.markdown('<h1 class="title">Augmented Generative Document Scraper</h1>', unsafe_allow_html=True)
+    if st.session_state.genre=="Add document(s)" and st.session_state.doc_ortext == "Text area":
+                st.session_state.name_text_area = st.text_input("Enter name of the text area:")
+                st.session_state.text_area = st.text_area("Enter text:")
+                if st.session_state.text_area:
+                    if st.button('Process Text'):
+                        add_text_document(st.session_state.token, st.session_state.service)
     if st.session_state.genre=="Select document" and st.session_state.service_slected_to_chat:
         schema = display_and_validate_schema()
         comments = None
                 headers = {'Content-Type': 'application/json'}
                 response  = requests.get(RESPONSE_API,data=json_data, headers=headers)
                 response_data = json.loads(response.text)
+            #elif st.session_state.doument_slected_to_chat.split("_")[-1]=="txt":
+            else:
                 data = {"token": st.session_state.token,
                 "service_name": st.session_state.service_slected_to_chat,
                 "document_name": st.session_state.doument_slected_to_chat,
                 headers = {'Content-Type': 'application/json'}
                 response  = requests.get(RESPONSE_TXT_API,data=json_data, headers=headers)
                 response_data = json.loads(response.text)
+                if response_data.get('status')=='success':
+                    json_str =response_data.get("json")
+                    json_str_formatted = json.dumps(json_str)
+                    # Encode this JSON string to bytes, which is required for the download
+                    json_bytes = json_str_formatted.encode('utf-8')
+                    st.download_button(
+                        label="Download JSON",
+                        data=json_bytes,
+                        file_name="results.json",
+                        mime="application/json"
+                    )
+                else:
+                    st.error("Error in processing document")

utlis/__pycache__/constant.cpython-39.pyc CHANGED Viewed

Binary files a/utlis/__pycache__/constant.cpython-39.pyc and b/utlis/__pycache__/constant.cpython-39.pyc differ

utlis/__pycache__/helper.cpython-39.pyc CHANGED Viewed

Binary files a/utlis/__pycache__/helper.cpython-39.pyc and b/utlis/__pycache__/helper.cpython-39.pyc differ

utlis/helper.py CHANGED Viewed

@@ -117,6 +117,33 @@ def add_service(token,servicename):
         st.success(f"{servicename} added successfully")
     else:
         st.error(response.text)
 def add_document(token,servicename):

         st.success(f"{servicename} added successfully")
     else:
         st.error(response.text)
+def add_text_document(token, servicename):
+    # Retrieve text and document name from session state
+    document_text = st.session_state.text_area
+    document_name = st.session_state.name_text_area.replace(" ", "_").replace("(", "_").replace(")", "_").replace("-", "_").replace(".", "_")
+    # Encode the document text as Base64
+    encoded_text = base64.b64encode(document_text.encode('utf-8')).decode('utf-8')
+    url = ADD_STORE_DOCUMENT
+    # Prepare the JSON payload
+    data = {
+        "token": token,
+        "service_name": servicename,
+        "document_name": document_name,
+        "file": encoded_text  # Assuming the API can handle Base64 encoded text under the 'file' key
+    }
+    # Convert the dictionary to a JSON formatted string and send the POST request
+    headers = {'Content-Type': 'application/json'}
+    response = requests.post(url, data=json.dumps(data), headers=headers)
+    status = json.loads(response.text).get("status")
+    if status == "success":
+        st.success(f"{document_name} uploaded successfully as text")
+    else:
+        st.error(f"{document_name} not uploaded successfully")
 def add_document(token,servicename):