Spaces:

AllenChai
/

EEP596_MiniProject1_StarGroup

Sleeping

yuanjunchai committed on Jan 27, 2025

Commit

8249632

1 Parent(s): 7e1eff0

add application files

Files changed (1) hide show

app.py CHANGED Viewed

@@ -263,23 +263,39 @@ def averaged_glove_embeddings_gdrive(sentence, word_index_dict, embeddings, mode
     5. Return averaged embeddings
     (30 pts)
     """
-    embedding = np.zeros(int(model_type.split("d")[0]))
-    # Split sentence into words
     words = sentence.split()
-    valid_words = 0
     for word in words:
-        # Check if the word is in the word_index_dict
-        if word in word_index_dict:
-            word_idx = word_index_dict[word]
-            embedding += embeddings[word_idx]
-            valid_words += 1
-    if valid_words > 0:
-        raise ValueError("No valid words in sentence")
-    embedding /= valid_words
     return embedding

     5. Return averaged embeddings
     (30 pts)
     """
+    # embedding = np.zeros(int(model_type.split("d")[0]))
+    # # Split sentence into words
+    # words = sentence.split()
+    # valid_words = 0
+    # for word in words:
+    #     # Check if the word is in the word_index_dict
+    #     if word in word_index_dict:
+    #         word_idx = word_index_dict[word]
+    #         embedding += embeddings[word_idx]
+    #         valid_words += 1
+    # if valid_words > 0:
+    #     raise ValueError("No valid words in sentence")
+    # embedding /= valid_words
+    # return embedding
+    embedding_dim = np.zeros(int(model_type.split("d")[0]))
+    embedding = np.zeros(embedding_dim)
     words = sentence.split()
+    valid_word_count = 0
     for word in words:
+        if word.lower() in word_index_dict:
+            embedding += embeddings[word_index_dict[word.lower()]]
+            valid_word_count += 1
+    if valid_word_count > 0:
+        embedding /= valid_word_count
     return embedding