Blessmore committed on
Commit
aff0f0f
·
verified ·
1 Parent(s): ceee85a

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +0 -104
app.py CHANGED
@@ -173,107 +173,3 @@ def main():
173
  epochs=100,
174
  bucket=2000000,
175
  min_n=3,
176
- max_n=6
177
- )
178
- end_time = time.time()
179
-
180
- # Calculate the elapsed time
181
- elapsed_time = end_time - start_time
182
- st.write("Time taken: {:.2f} minutes".format(elapsed_time / 60))
183
-
184
- st.write("Model trained successfully!")
185
-
186
- # Zip the model files in memory
187
- zip_buffer = zip_model(model)
188
-
189
- # Provide download link
190
- st.download_button(
191
- label="Download Model",
192
- data=zip_buffer,
193
- file_name="fasttext_model.zip",
194
- mime="application/zip"
195
- )
196
- except Exception as e:
197
- st.error(f"An error occurred: {str(e)}")
198
- st.error("Check the server logs for more details.")
199
-
200
- elif option == "Generate Embeddings":
201
- st.header("Generate Embeddings with Pretrained FastText Model")
202
-
203
- # Specify the path to the model folder
204
- model_folder = "Fast_text_50_dim"
205
-
206
- # Load the model from the specified folder
207
- model = load_fasttext_model(model_folder)
208
-
209
- st.subheader("Generate Word Embedding")
210
- word = st.text_input("Enter a word:")
211
- if word:
212
- embedding = generate_word_embedding(word, model)
213
- if embedding is not None:
214
- st.write(f"Embedding for '{word}':", embedding)
215
- else:
216
- st.write(f"'{word}' not in vocabulary")
217
-
218
- st.subheader("Find Similar Words")
219
- word_for_similar = st.text_input("Enter a word to find similar words:")
220
- if word_for_similar:
221
- similar_words = find_similar_words(word_for_similar, model)
222
- if similar_words:
223
- st.write("Similar words:")
224
- for word, similarity in similar_words:
225
- st.write(f"{word}: {similarity}")
226
- else:
227
- st.write(f"No similar words found for '{word_for_similar}'")
228
-
229
- st.subheader("Generate Embeddings for Words in a Sentence")
230
- sentence = st.text_input("Enter a sentence:")
231
- if sentence:
232
- word_embeddings = generate_embeddings_for_sentence(sentence, model, r'\b\w+\b')
233
- if word_embeddings:
234
- for idx, embedding in enumerate(word_embeddings):
235
- st.write(f"Word {idx+1} embedding:", embedding)
236
- else:
237
- st.write("No embeddings could be generated for the words in the sentence.")
238
-
239
- st.subheader("Generate Embedding for a Sentence")
240
- sentence_for_embedding = st.text_input("Enter a sentence to generate its embedding:")
241
- if sentence_for_embedding:
242
- sentence_embedding = generate_sentence_embedding(sentence_for_embedding, model, r'\b\w+\b')
243
- if sentence_embedding is not None:
244
- st.write("Sentence embedding:", sentence_embedding)
245
- else:
246
- st.write("No embedding could be generated for the sentence.")
247
-
248
- st.subheader("Find Most Similar Sentence Pairs")
249
- uploaded_sentences_file = st.file_uploader("Upload a text file with sentences (one per line)", type=["txt"])
250
- if uploaded_sentences_file:
251
- sentences = uploaded_sentences_file.read().decode('utf-8').splitlines()
252
- sentence_embeddings = generate_sentence_embeddings(sentences, model, r'\b\w+\b')
253
- sentence_pairs = []
254
- for i in range(len(sentences)):
255
- for j in range(i + 1, len(sentences)):
256
- if sentence_embeddings[i] is not None and sentence_embeddings[j] is not None:
257
- similarity = cosine_similarity([sentence_embeddings[i]], [sentence_embeddings[j]])[0][0]
258
- sentence_pairs.append((sentences[i], sentences[j], similarity))
259
- sentence_pairs = sorted(sentence_pairs, key=lambda x: x[2], reverse=True)
260
- st.write("Most similar sentence pairs:")
261
- for sent1, sent2, sim in sentence_pairs[:5]:
262
- st.write(f"Sentence 1: {sent1}")
263
- st.write(f"Sentence 2: {sent2}")
264
- st.write(f"Similarity: {sim}")
265
- st.write("-----")
266
-
267
- # Sub-sidebar under "Generate Embeddings" option
268
- if option == "Generate Embeddings":
269
- st.sidebar.title("Embeddings Operations")
270
- operation = st.sidebar.radio("Select an operation", ("Operation 1", "Operation 2", "Operation 3"))
271
- if operation == "Operation 1":
272
- st.write("You selected Operation 1")
273
- elif operation == "Operation 2":
274
- st.write("You selected Operation 2")
275
- elif operation == "Operation 3":
276
- st.write("You selected Operation 3")
277
-
278
- if __name__ == "__main__":
279
- main()
 
173
  epochs=100,
174
  bucket=2000000,
175
  min_n=3,