Spaces:

igrisds
/

AskDS

Runtime error

App Files Community

igrisds committed on Apr 25, 2024

Commit

48ee539

verified ·

1 Parent(s): 0428aad

Update app.py

Browse files

Files changed (1) hide show

app.py +8 -4

app.py CHANGED Viewed

@@ -29,9 +29,9 @@ def create_bedrock_client():
         aws_session_token=AWS_SESSION
     )
 def create_s3_client():
-    # Create an S3 client
     return boto3.client(
         's3',
         aws_access_key_id=AWS_ACCESS_KEY_ID,
@@ -39,6 +39,7 @@ def create_s3_client():
         aws_session_token=AWS_SESSION
     )
 def read_json_from_s3():
     response = s3_client.get_object(Bucket=BUCKET_NAME, Key=EXTRACTIONS_PATH)
@@ -47,6 +48,7 @@ def read_json_from_s3():
     return json_content
 def get_titan_embedding(bedrock_client, doc_name, text, attempt=0, cutoff=10000):
     """
     Retrieves a text embedding for a given document using the Amazon Titan Embedding model.
@@ -87,9 +89,9 @@ def get_titan_embedding(bedrock_client, doc_name, text, attempt=0, cutoff=10000)
     response_body = json.loads(response['body'].read())
     return response_body.get('embedding')
 def ask_ds(message, history):
     if len(message) == 0:
         return
@@ -110,7 +112,6 @@ def ask_ds(message, history):
     for file, _ in top_3:
         similar_content += extractions[file]['content'] + '\n'
     # Invoke
     response = bedrock_client.invoke_model_with_response_stream(
         modelId="anthropic.claude-3-sonnet-20240229-v1:0",
@@ -145,6 +146,7 @@ def ask_ds(message, history):
         ),
     )
     all_text = ''
     stream = response.get('body')
     if stream:
@@ -159,13 +161,15 @@ def ask_ds(message, history):
                 except:
                     pass
     output = '\n\nCheck out the following documents for more information:\n'
     for file, sim in top_3:
-        output += f"\n{file.replace('.txt', '.pdf')} ({(1-sim) * 100}%)"
     yield all_text + output
 bedrock_client = create_bedrock_client()
 s3_client = create_s3_client()
 extractions = read_json_from_s3()

         aws_session_token=AWS_SESSION
     )
+# Create AWS S3 client using environment variables
 def create_s3_client():
     return boto3.client(
         's3',
         aws_access_key_id=AWS_ACCESS_KEY_ID,
         aws_session_token=AWS_SESSION
     )
+# Read JSON directly into mem from S3
 def read_json_from_s3():
     response = s3_client.get_object(Bucket=BUCKET_NAME, Key=EXTRACTIONS_PATH)
     return json_content
+# Get AWS Titan embedding of text
 def get_titan_embedding(bedrock_client, doc_name, text, attempt=0, cutoff=10000):
     """
     Retrieves a text embedding for a given document using the Amazon Titan Embedding model.
     response_body = json.loads(response['body'].read())
     return response_body.get('embedding')
+# Main Chat
 def ask_ds(message, history):
     if len(message) == 0:
         return
     for file, _ in top_3:
         similar_content += extractions[file]['content'] + '\n'
     # Invoke
     response = bedrock_client.invoke_model_with_response_stream(
         modelId="anthropic.claude-3-sonnet-20240229-v1:0",
         ),
     )
+    # Stream the response
     all_text = ''
     stream = response.get('body')
     if stream:
                 except:
                     pass
+    # Print relevant files
     output = '\n\nCheck out the following documents for more information:\n'
     for file, sim in top_3:
+        output += f"\n{file.replace('.txt', '.pdf')}"
     yield all_text + output
+# Create necessary services and collect data
 bedrock_client = create_bedrock_client()
 s3_client = create_s3_client()
 extractions = read_json_from_s3()