Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -79,7 +79,7 @@ def trace_origins(description_html, max_depth=2):
|
|
| 79 |
seeds = [a["href"] for a in soup_desc.find_all("a", href=True) if a["href"].startswith("http")]
|
| 80 |
# include any URLs in text
|
| 81 |
text = soup_desc.get_text(separator=' ')
|
| 82 |
-
seeds += re.findall(r"https?://[^\s"']+", text)
|
| 83 |
seen = set()
|
| 84 |
def recurse(url, depth):
|
| 85 |
if depth > max_depth or url in seen:
|
|
|
|
| 79 |
seeds = [a["href"] for a in soup_desc.find_all("a", href=True) if a["href"].startswith("http")]
|
| 80 |
# include any URLs in text
|
| 81 |
text = soup_desc.get_text(separator=' ')
|
| 82 |
+
seeds += re.findall(r"https?://[^\s\"']+", text)
|
| 83 |
seen = set()
|
| 84 |
def recurse(url, depth):
|
| 85 |
if depth > max_depth or url in seen:
|