Spaces:

jingxiangmo
/

Azza

Runtime error

App Files Files Community

Jingxiang Mo committed on Mar 26, 2023

Commit

d4e5967

1 Parent(s): 77e7345

Code optimization and response wrap

Browse files

Files changed (3) hide show

.env +1 -0
__pycache__/app.cpython-39.pyc +0 -0
app.py +32 -9

.env ADDED Viewed

	@@ -0,0 +1 @@


1	+ OPENAI_API_KEY="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"

__pycache__/app.cpython-39.pyc CHANGED Viewed

Binary files a/__pycache__/app.cpython-39.pyc and b/__pycache__/app.cpython-39.pyc differ

app.py CHANGED Viewed

@@ -13,6 +13,7 @@ from transformers import (
 )
 from transformers.pipelines import AggregationStrategy
 import torch
 # =====[ DEFINE PIPELINE ]===== #
@@ -33,6 +34,9 @@ class KeyphraseExtractionPipeline(TokenClassificationPipeline):
         return np.unique([result.get("word").strip() for result in results])
 # =====[ LOAD PIPELINE ]===== #
 keyPhraseExtractionModel = "ml6team/keyphrase-extraction-kbir-inspec"
 extractor = KeyphraseExtractionPipeline(model=keyPhraseExtractionModel)
@@ -44,14 +48,18 @@ tokenizer = BertTokenizer.from_pretrained(
 )
-def keyphrases_extraction(text: str) -> str:
-    keyphrases = extractor(text)
-    return keyphrases
-def wikipedia_search(input: str) -> str:
     input = input.replace("\n", " ")
-    keyphrases = keyphrases_extraction(input)
     wiki = wk.Wikipedia("en")
@@ -78,15 +86,23 @@ def wikipedia_search(input: str) -> str:
         return "I cannot answer this question"
-def answer_question(question):
     context = wikipedia_search(question)
     if (context == "I cannot answer this question") or (
         context == "Can you add more details to your question?"
     ):
         return context
-    # Tokenize
-    # Apply the tokenizer to the input text, treating them as a text-pair.
     input_ids = tokenizer.encode(question, context)
     question_ids = input_ids[: input_ids.index(tokenizer.sep_token_id) + 1]
@@ -157,7 +173,14 @@ def answer_question(question):
         scores.append((max_start_score, max_end_score, answer))
     # Compare scores for answers found and each paragraph and pick the most relevant.
-    return max(scores, key=lambda x: x[0] + x[1])[2]
 # =====[ DEFINE INTERFACE ]===== #'

 )
 from transformers.pipelines import AggregationStrategy
 import torch
+from dotenv import load_dotenv
 # =====[ DEFINE PIPELINE ]===== #
         return np.unique([result.get("word").strip() for result in results])
+load_dotenv()
+openai.api_key = os.getenv("OPENAI_API_KEY")
 # =====[ LOAD PIPELINE ]===== #
 keyPhraseExtractionModel = "ml6team/keyphrase-extraction-kbir-inspec"
 extractor = KeyphraseExtractionPipeline(model=keyPhraseExtractionModel)
 )
+def wikipedia_search(input: str) -> str:
+    """Perform a Wikipedia search using keyphrases.
+    Args:
+        input (str): The input text.
+    Returns:
+        str: The summary of the Wikipedia page.
+    """
     input = input.replace("\n", " ")
+    keyphrases = extractor(input)
     wiki = wk.Wikipedia("en")
         return "I cannot answer this question"
+def answer_question(question: str) -> str:
+    """Answer the question using the context from the Wikipedia search.
+    Args:
+        question (str): The input question.
+    Returns:
+        str: The answer to the question.
+    """
     context = wikipedia_search(question)
     if (context == "I cannot answer this question") or (
         context == "Can you add more details to your question?"
     ):
         return context
+    # Tokenize and split input
     input_ids = tokenizer.encode(question, context)
     question_ids = input_ids[: input_ids.index(tokenizer.sep_token_id) + 1]
         scores.append((max_start_score, max_end_score, answer))
     # Compare scores for answers found and each paragraph and pick the most relevant.
+    answer = max(scores, key=lambda x: x[0] + x[1])[2]
+    response = openai.Completion.create(
+        model="text-davinci-003",
+        prompt="Answer the question " + question + "using this answer: " + answer,
+        max_tokens=3000,
+    )
+    return response.choices[0].text.replace("\n\n", " ")
 # =====[ DEFINE INTERFACE ]===== #'