Spaces:

ProjectFrozone
/

Site

Paused

App Files Files Community

riderle committed on Mar 23

Commit

4dde0fb

verified ·

1 Parent(s): ac9a89a

Remove trailing punctuation 80% of the time

Browse files

Files changed (1) hide show

chat_application/main.py +14 -8

chat_application/main.py CHANGED Viewed

@@ -62,6 +62,7 @@ class datasetHandler():
 CHAT_CONTEXT = 20 #how many messages from chat history to append to inference prompt
 #minimum number of chars where we start checking for duplicate messages
 DUP_LEN = 25 #since short messages may reasonably be the same
 # Directory alignment
 BASE_DIR = Path(__file__).resolve().parent
@@ -368,8 +369,10 @@ def ask_bot(room_id, bot, bot_display_name, initial_prompt, instruct_prompt):
         print("PASSED")
         return True # a pass is still recorded in the database, but not sent to the client
     #remove encapsulating quotes
-    no_quotes = remove_quotes(parsed_response)
     #humanize the response (remove obvious AI formatting styles)
     humanized_response = humanize(no_quotes)
     #replace most semicolons
@@ -378,11 +381,14 @@ def ask_bot(room_id, bot, bot_display_name, initial_prompt, instruct_prompt):
     corrupted_response = corrupt(less_semicolons_response, misspell_aug_p=0.01, typo_aug_p=0.005)
     #remove weird chars
     no_weird_chars = remove_weird_characters(corrupted_response)
-    #sub letters for names, so if the bot addressed A -> Apple
-    named_response = let_to_name(room_id, no_weird_chars)
     #check that there are no recent duplicate messages
-    if len(named_response) > DUP_LEN and duplicate_check(named_response, context):
         print("****DUPLICATE MESSAGE DETECTED")
         print("Treating this bot's response as a pass.")
         # Do not store/send messages if the chat has ended
@@ -392,7 +398,7 @@ def ask_bot(room_id, bot, bot_display_name, initial_prompt, instruct_prompt):
         # Store the error response in the database
         bot_message = {
             "sender": bot_display_name,
-            "message": f"DUPLICATE message detected - treated as a (pass) : {named_response}",
             "timestamp": datetime.utcnow()
         }
         rooms_collection.update_one(
@@ -407,7 +413,7 @@ def ask_bot(room_id, bot, bot_display_name, initial_prompt, instruct_prompt):
     print(corrupted_response)
     # Add latency/wait time for bot responses
-    delay = get_response_delay(named_response);
     print(delay)
     time.sleep(delay)
@@ -419,7 +425,7 @@ def ask_bot(room_id, bot, bot_display_name, initial_prompt, instruct_prompt):
     # Store the response in the database
     bot_message = {
         "sender": bot_display_name,
-        "message": named_response, #save fruits in db so page reload shows proper names
         "timestamp": datetime.utcnow()
     }
     rooms_collection.update_one(
@@ -428,7 +434,7 @@ def ask_bot(room_id, bot, bot_display_name, initial_prompt, instruct_prompt):
     )
     # Send the bot's response to the client
-    socketio.emit("message", {"sender": bot_display_name, "message": named_response}, to=room_id)
     return False
 def ask_bot_round(room_id):

 CHAT_CONTEXT = 20 #how many messages from chat history to append to inference prompt
 #minimum number of chars where we start checking for duplicate messages
 DUP_LEN = 25 #since short messages may reasonably be the same
+REMOVE_PUNC_RATE = .8 #how often to remove final punctuation
 # Directory alignment
 BASE_DIR = Path(__file__).resolve().parent
         print("PASSED")
         return True # a pass is still recorded in the database, but not sent to the client
+    #sub letters for names, so if the bot addressed A -> Apple
+    named_response = let_to_name(room_id, parsed_response)
     #remove encapsulating quotes
+    no_quotes = remove_quotes(named_response)
     #humanize the response (remove obvious AI formatting styles)
     humanized_response = humanize(no_quotes)
     #replace most semicolons
     corrupted_response = corrupt(less_semicolons_response, misspell_aug_p=0.01, typo_aug_p=0.005)
     #remove weird chars
     no_weird_chars = remove_weird_characters(corrupted_response)
+    #remove trailing punctuation % of the time
+    if random.random() < REMOVE_PUNC_RATE:
+        no_weird_chars = re.sub(r'[^\w\s]+$', '', no_weird_chars)
+    final_response = no_weird_chars
     #check that there are no recent duplicate messages
+    if len(final_response) > DUP_LEN and duplicate_check(final_response, context):
         print("****DUPLICATE MESSAGE DETECTED")
         print("Treating this bot's response as a pass.")
         # Do not store/send messages if the chat has ended
         # Store the error response in the database
         bot_message = {
             "sender": bot_display_name,
+            "message": f"DUPLICATE message detected - treated as a (pass) : {final_response}",
             "timestamp": datetime.utcnow()
         }
         rooms_collection.update_one(
     print(corrupted_response)
     # Add latency/wait time for bot responses
+    delay = get_response_delay(final_response);
     print(delay)
     time.sleep(delay)
     # Store the response in the database
     bot_message = {
         "sender": bot_display_name,
+        "message": final_response, #save fruits in db so page reload shows proper names
         "timestamp": datetime.utcnow()
     }
     rooms_collection.update_one(
     )
     # Send the bot's response to the client
+    socketio.emit("message", {"sender": bot_display_name, "message": final_response}, to=room_id)
     return False
 def ask_bot_round(room_id):