Update app.py
Browse files
app.py
CHANGED
|
@@ -25,7 +25,7 @@ def extract_english_paragraphs(text):
|
|
| 25 |
"""
|
| 26 |
Extract paragraphs that contain only English text
|
| 27 |
"""
|
| 28 |
-
paragraphs = text.split('
|
| 29 |
english_paragraphs = [paragraphs[0]]
|
| 30 |
|
| 31 |
#for para in paragraphs:
|
|
@@ -36,7 +36,7 @@ def extract_english_paragraphs(text):
|
|
| 36 |
return '\n\n'.join(english_paragraphs)
|
| 37 |
|
| 38 |
def extract_native_text(text):
|
| 39 |
-
paragraphs = text.split('
|
| 40 |
nativelang_paragraphs = paragraphs[1]
|
| 41 |
#pattern = r'[^\x00-\x7F]'
|
| 42 |
|
|
|
|
| 25 |
"""
|
| 26 |
Extract paragraphs that contain only English text
|
| 27 |
"""
|
| 28 |
+
paragraphs = text.split('\n\n')
|
| 29 |
english_paragraphs = [paragraphs[0]]
|
| 30 |
|
| 31 |
#for para in paragraphs:
|
|
|
|
| 36 |
return '\n\n'.join(english_paragraphs)
|
| 37 |
|
| 38 |
def extract_native_text(text):
|
| 39 |
+
paragraphs = text.split('\n\n')
|
| 40 |
nativelang_paragraphs = paragraphs[1]
|
| 41 |
#pattern = r'[^\x00-\x7F]'
|
| 42 |
|