Update app.py
Browse files
app.py
CHANGED
|
@@ -91,8 +91,6 @@ We'll use regex and basic string methods.
|
|
| 91 |
Normalize the text: remove URLs, HTML tags, Reddit-specific formatting, etc.
|
| 92 |
"""
|
| 93 |
|
| 94 |
-
!pip install gensim tqdm
|
| 95 |
-
|
| 96 |
from gensim.models import Word2Vec
|
| 97 |
from tqdm import tqdm
|
| 98 |
import re
|
|
@@ -172,7 +170,6 @@ chunk_embeddings = [get_chunk_embedding(tokens, model) for tokens in tokenized_c
|
|
| 172 |
|
| 173 |
"""Converting variable-length chunks to fixed-length embeddings"""
|
| 174 |
|
| 175 |
-
!pip install faiss-cpu
|
| 176 |
|
| 177 |
import faiss
|
| 178 |
|
|
|
|
| 91 |
Normalize the text: remove URLs, HTML tags, Reddit-specific formatting, etc.
|
| 92 |
"""
|
| 93 |
|
|
|
|
|
|
|
| 94 |
from gensim.models import Word2Vec
|
| 95 |
from tqdm import tqdm
|
| 96 |
import re
|
|
|
|
| 170 |
|
| 171 |
"""Converting variable-length chunks to fixed-length embeddings"""
|
| 172 |
|
|
|
|
| 173 |
|
| 174 |
import faiss
|
| 175 |
|