Spaces:

robjm16
/

domain_specific_ChatGPT

Runtime error

robjm16 committed on Jan 16, 2023

Commit

275329e

1 Parent(s): d456449

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -13,12 +13,12 @@ Far more robust domain-specific responses are possible by further customizing/re
 ################################# LOAD LIBRARIES/IMPORTS #########################################
-! pip install openai --quiet
-! pip install transformers --quiet
-! pip install gradio --quiet
-! pip install PyPDF2 --quiet
-! pip install python-docx --quiet
-! pip install pandas --quiet
 import docx
@@ -45,7 +45,7 @@ openai.api_key = os.environ["API_KEY"]
 MODEL_NAME = "curie"
 DOC_EMBEDDINGS_MODEL = f"text-search-{MODEL_NAME}-doc-001"
 QUERY_EMBEDDINGS_MODEL = f"text-search-{MODEL_NAME}-query-001"
-MAX_SECTION_LEN =1100  # The API limits total tokens -- for the prompt containing the wuestion and domain-specific content and the answer -- to 2048 tokens, or about 1500 words.
 SEPARATOR = "\n* "  # A string called SEPARATOR is defined as the newline character followed by an asterisk and a space. This string will be used as a separator between different pieces of text.
 tokenizer = GPT2TokenizerFast.from_pretrained("gpt2")
 separator_len = len(tokenizer.tokenize(SEPARATOR))

 ################################# LOAD LIBRARIES/IMPORTS #########################################
+pip install openai --quiet
+pip install transformers --quiet
+pip install gradio --quiet
+pip install PyPDF2 --quiet
+pip install python-docx --quiet
+pip install pandas --quiet
 import docx
 MODEL_NAME = "curie"
 DOC_EMBEDDINGS_MODEL = f"text-search-{MODEL_NAME}-doc-001"
 QUERY_EMBEDDINGS_MODEL = f"text-search-{MODEL_NAME}-query-001"
+MAX_SECTION_LEN =1100  # The API limits total tokens -- for the prompt containing the question and domain-specific content and the answer -- to 2048 tokens, or about 1500 words.
 SEPARATOR = "\n* "  # A string called SEPARATOR is defined as the newline character followed by an asterisk and a space. This string will be used as a separator between different pieces of text.
 tokenizer = GPT2TokenizerFast.from_pretrained("gpt2")
 separator_len = len(tokenizer.tokenize(SEPARATOR))