Spaces:
Sleeping
Sleeping
Return None if no text in xml, due to no subtitle and automatic_captions with gibberish except xml(xml format text part is empty) in this video https://youtu.be/LI0mzC6sl7w
Browse files- fetchYoutubeSubtitle.py +4 -1
fetchYoutubeSubtitle.py
CHANGED
|
@@ -227,6 +227,8 @@ def xml_caption_to_srt(xml_captions: str) -> str:
|
|
| 227 |
caption = unescape(
|
| 228 |
text.replace("\n", " ").replace(" ", " "),
|
| 229 |
)
|
|
|
|
|
|
|
| 230 |
try:
|
| 231 |
duration = float(child.attrib["dur"])
|
| 232 |
except KeyError:
|
|
@@ -241,7 +243,8 @@ def xml_caption_to_srt(xml_captions: str) -> str:
|
|
| 241 |
text=caption,
|
| 242 |
)
|
| 243 |
segments.append(line)
|
| 244 |
-
return
|
|
|
|
| 245 |
|
| 246 |
|
| 247 |
async def fetchSubtitleUrls(url: str, proxy: Optional[str] = None) -> json:
|
|
|
|
| 227 |
caption = unescape(
|
| 228 |
text.replace("\n", " ").replace(" ", " "),
|
| 229 |
)
|
| 230 |
+
if len(caption) == 0:
|
| 231 |
+
continue
|
| 232 |
try:
|
| 233 |
duration = float(child.attrib["dur"])
|
| 234 |
except KeyError:
|
|
|
|
| 243 |
text=caption,
|
| 244 |
)
|
| 245 |
segments.append(line)
|
| 246 |
+
# return None if no text in xml
|
| 247 |
+
return "\n".join(segments).strip() if len(segments) > 0 else None
|
| 248 |
|
| 249 |
|
| 250 |
async def fetchSubtitleUrls(url: str, proxy: Optional[str] = None) -> json:
|