Zamanonymize3

Build error

App Files Community

OthmaneLKH committed on Sep 28, 2024

Commit

9023283

verified ·

1 Parent(s): 0ca0215

Update app.py

Browse files

Files changed (1) hide show

app.py +21 -55

app.py CHANGED Viewed

@@ -418,70 +418,36 @@ def anonymization_with_fn(selected_sentences, query):
         identified_words_output_df: gr.update(value=identified_df, visible=False),
     }
-def query_chatgpt_fn(anonymized_query, anonymized_document):
-    print("------------ Step 5: ChatGPT communication")
-    if not (KEYS_DIR / f"{USER_ID}/evaluation_key").is_file():
-        error_message = "Error ❌: Please generate the key first!"
-        return {chatgpt_response_anonymized: gr.update(value=error_message)}
-    if not (CLIENT_DIR / f"{USER_ID}_encrypted_output").is_file():
-        error_message = "Error ❌: Please encrypt your query first!"
-        return {chatgpt_response_anonymized: gr.update(value=error_message)}
-    context_prompt = read_txt(PROMPT_PATH)
-    # Prepare prompt
-    query = (
-        "Document content:\n```\n"
-        + anonymized_document
-        + "\n\n```"
-        + "Query:\n```\n"
-        + anonymized_query
-        + "\n```"
-    )
-    print(f'Prompt of CHATGPT:\n{query}')
-    completion = client.chat.completions.create(
-        model="gpt-4-1106-preview",  # Replace with "gpt-4" if available
-        messages=[
-            {"role": "system", "content": context_prompt},
-            {"role": "user", "content": query},
-        ],
-    )
-    anonymized_response = completion.choices[0].message.content
-    uuid_map = read_json(MAPPING_UUID_PATH)
-    inverse_uuid_map = {
-        v: k for k, v in uuid_map.items()
-    }  # TODO load the inverse mapping from disk for efficiency
-    # Pattern to identify words and non-words (including punctuation, spaces, etc.)
-    tokens = re.findall(r"(\b[\w\.\/\-@]+\b|[\s,.!?;:'\"-]+)", anonymized_response)
-    processed_tokens = []
-    for token in tokens:
-        # Directly append non-word tokens or whitespace to processed_tokens
-        if not token.strip() or not re.match(r"\w+", token):
-            processed_tokens.append(token)
-            continue
-        if token in inverse_uuid_map:
-            processed_tokens.append(inverse_uuid_map[token])
-        else:
-            processed_tokens.append(token)
-    deanonymized_response = "".join(processed_tokens)
-    return {chatgpt_response_anonymized: gr.update(value=anonymized_response),
-            chatgpt_response_deanonymized: gr.update(value=deanonymized_response)}
 demo = gr.Blocks(css=".markdown-body { font-size: 18px; }")
 with demo:
     gr.Markdown(
         """
         <p align="center">

         identified_words_output_df: gr.update(value=identified_df, visible=False),
     }
+# Define the folder path containing audio files
+AUDIO_FOLDER_PATH = "./files/"
+# Function to list available audio files in the folder
+def get_audio_files():
+    files = [f for f in os.listdir(AUDIO_FOLDER_PATH) if f.endswith(('.wav', '.mp3'))]
+    return files
+# Step 1: Load and display audio file
+def load_audio_file(selected_audio):
+    file_path = os.path.join(AUDIO_FOLDER_PATH, selected_audio)
+    return file_path
 demo = gr.Blocks(css=".markdown-body { font-size: 18px; }")
 with demo:
+    # Step 1: Add an audio file
+    gr.Markdown("## Step 1: Add an Audio File")
+    audio_files = get_audio_files()
+    with gr.Row():
+        audio_file_dropdown = gr.Dropdown(audio_files, label="Select an Audio File", interactive=True)
+        audio_output = gr.Audio(label="Selected Audio", type="filepath")
+    # When an audio file is selected, it will display the file path
+    audio_file_dropdown.change(fn=load_audio_file, inputs=[audio_file_dropdown], outputs=[audio_output])
     gr.Markdown(
         """
         <p align="center">