Spaces:
Sleeping
Sleeping
Ilyas KHIAT committed on
Commit ·
62a5ad1
1
Parent(s): e1bcbc6
more details content
Browse files
- requirements.txt +0 -1
- utils/audit/audit_doc.py +1 -1
requirements.txt
CHANGED
|
@@ -10,5 +10,4 @@ openai
|
|
| 10 |
nltk
|
| 11 |
rake_nltk
|
| 12 |
python-docx
|
| 13 |
-
io
|
| 14 |
pillow
|
|
|
|
| 10 |
nltk
|
| 11 |
rake_nltk
|
| 12 |
python-docx
|
|
|
|
| 13 |
pillow
|
utils/audit/audit_doc.py
CHANGED
|
@@ -56,7 +56,7 @@ def evaluate_text_quality(text: str) -> dict:
|
|
| 56 |
def extract_keywords(text):
|
| 57 |
rake = Rake(stopwords.words('english'))
|
| 58 |
rake.extract_keywords_from_text(text)
|
| 59 |
-
return rake.
|
| 60 |
|
| 61 |
def count_tokens(input_string: str) -> int:
|
| 62 |
tokenizer = tiktoken.get_encoding("cl100k_base")
|
|
|
|
| 56 |
def extract_keywords(text):
|
| 57 |
rake = Rake(stopwords.words('english'))
|
| 58 |
rake.extract_keywords_from_text(text)
|
| 59 |
+
return rake.get_ranked_phrases()
|
| 60 |
|
| 61 |
def count_tokens(input_string: str) -> int:
|
| 62 |
tokenizer = tiktoken.get_encoding("cl100k_base")
|