Spaces:

AllenChai
/

EEP596_MiniProject1_StarGroup

Sleeping

yuanjunchai committed on Jan 27, 2025

Commit

05fff77

1 Parent(s): 170c474

add application files

Files changed (1) hide show

app.py CHANGED Viewed

@@ -24,8 +24,7 @@ import os
 import gdown
 from sentence_transformers import SentenceTransformer
 import matplotlib.pyplot as plt
-import math
 ### Some predefined utility functions for you to load the text embeddings
@@ -53,20 +52,24 @@ def get_model_id_gdrive(model_type):
 def download_glove_embeddings_gdrive(model_type):
-    # Get glove embeddings from google drive
-    word_index_id, embeddings_id = get_model_id_gdrive(model_type)
     # Use gdown to get files from google drive
     embeddings_temp = "embeddings_" + str(model_type) + "_temp.npy"
     word_index_temp = "word_index_dict_" + str(model_type) + "_temp.pkl"
-    # Download word_index pickle file
-    print("Downloading word index dictionary....\n")
-    gdown.download(id=word_index_id, output=word_index_temp, quiet=False)
-    # Download embeddings numpy file
-    print("Donwloading embedings...\n\n")
-    gdown.download(id=embeddings_id, output=embeddings_temp, quiet=False)
 # @st.cache_data()

 import gdown
 from sentence_transformers import SentenceTransformer
 import matplotlib.pyplot as plt
+from huggingface_hub import hf_hub_download
 ### Some predefined utility functions for you to load the text embeddings
 def download_glove_embeddings_gdrive(model_type):
     """Download the GloVe embeddings and word-index files for ``model_type``.

     Both files are written to the current working directory as
     ``embeddings_<model_type>_temp.npy`` and
     ``word_index_dict_<model_type>_temp.pkl``.

     Args:
         model_type: Embedding variant label. ``"100d"`` is fetched from the
             Hugging Face Hub repo ``AveMujica/glove-twitter-100d``; any other
             value is fetched from Google Drive using the ids returned by
             ``get_model_id_gdrive``.
     """
     # Local file names both download paths must produce.
     embeddings_temp = "embeddings_" + str(model_type) + "_temp.npy"
     word_index_temp = "word_index_dict_" + str(model_type) + "_temp.pkl"

     # 100d download
     if model_type == "100d":
         # hf_hub_download stores files in the Hugging Face cache unless
         # local_dir is given; local_dir="." places them at the temp paths
         # above instead of leaving them reachable only via the returned path.
         repo_id = "AveMujica/glove-twitter-100d"
         hf_hub_download(repo_id=repo_id, filename=embeddings_temp, local_dir=".")
         hf_hub_download(repo_id=repo_id, filename=word_index_temp, local_dir=".")
     else:
         # Get glove embeddings from google drive
         word_index_id, embeddings_id = get_model_id_gdrive(model_type)
         # Download word_index pickle file
         print("Downloading word index dictionary....\n")
         gdown.download(id=word_index_id, output=word_index_temp, quiet=False)
         # Download embeddings numpy file
         print("Donwloading embedings...\n\n")
         gdown.download(id=embeddings_id, output=embeddings_temp, quiet=False)
 # @st.cache_data()