Spaces:
Running
Running
letters
Browse files
- app.py +1 -1
- textual.py +1 -2
app.py
CHANGED
|
@@ -90,7 +90,7 @@ def audionar_tts(text=None,
|
|
| 90 |
tokenizer = cached_tokenizer
|
| 91 |
text = only_greek_or_only_latin(text, lang=lang_code)
|
| 92 |
text = transliterate_number(text, lang=lang_code)
|
| 93 |
-
text = fix_vocals(text, lang=lang_code)
|
| 94 |
|
| 95 |
|
| 96 |
sentences = textwrap.wrap(text, width=439)
|
|
|
|
| 90 |
tokenizer = cached_tokenizer
|
| 91 |
text = only_greek_or_only_latin(text, lang=lang_code)
|
| 92 |
text = transliterate_number(text, lang=lang_code)
|
| 93 |
+
text = fix_vocals(text, lang=lang_code) + '!' # assures the text has at least 1 character that has token emb
|
| 94 |
|
| 95 |
|
| 96 |
sentences = textwrap.wrap(text, width=439)
|
textual.py
CHANGED
|
@@ -45,7 +45,7 @@ def only_greek_or_only_latin(text, lang='grc'):
|
|
| 45 |
'а': 'a', 'б': 'b', 'в': 'v', 'г': 'g', 'д': 'd', 'е': 'e', 'ж': 'z',
|
| 46 |
'з': 'z', 'и': 'i', 'ј': 'j', 'к': 'k', 'л': 'l', 'м': 'm', 'н': 'n',
|
| 47 |
'о': 'o', 'п': 'p', 'р': 'r', 'с': 's', 'т': 't', 'у': 'u', 'ф': 'f',
|
| 48 |
-
'х': 'h', 'ц': 'c', 'ч': 'c', 'ш': 's',
|
| 49 |
'ђ': 'dzi', 'љ': 'li', 'њ': 'ni', 'ћ': 'c', 'џ': 'dz',
|
| 50 |
'ё': 'e', 'й': 'i', 'щ': 's', 'ъ': '', 'ы': 'y', 'ь': '',
|
| 51 |
'э': 'e', 'ю': 'io', 'я': 'a',
|
|
@@ -287,7 +287,6 @@ def fix_vocals(text, lang='ron'):
|
|
| 287 |
# "đ": "ď",
|
| 288 |
# "lj": "ľ",
|
| 289 |
# "nj": "ň",
|
| 290 |
-
"ž": "z",
|
| 291 |
# "c": "č"
|
| 292 |
}
|
| 293 |
|
|
|
|
| 45 |
'а': 'a', 'б': 'b', 'в': 'v', 'г': 'g', 'д': 'd', 'е': 'e', 'ж': 'z',
|
| 46 |
'з': 'z', 'и': 'i', 'ј': 'j', 'к': 'k', 'л': 'l', 'м': 'm', 'н': 'n',
|
| 47 |
'о': 'o', 'п': 'p', 'р': 'r', 'с': 's', 'т': 't', 'у': 'u', 'ф': 'f',
|
| 48 |
+
'х': 'h', 'ц': 'c', 'ч': 'c', 'ш': 's', "ž": "z",
|
| 49 |
'ђ': 'dzi', 'љ': 'li', 'њ': 'ni', 'ћ': 'c', 'џ': 'dz',
|
| 50 |
'ё': 'e', 'й': 'i', 'щ': 's', 'ъ': '', 'ы': 'y', 'ь': '',
|
| 51 |
'э': 'e', 'ю': 'io', 'я': 'a',
|
|
|
|
| 287 |
# "đ": "ď",
|
| 288 |
# "lj": "ľ",
|
| 289 |
# "nj": "ň",
|
|
|
|
| 290 |
# "c": "č"
|
| 291 |
}
|
| 292 |
|