wuhp committed on
Commit
ada90f3
·
verified ·
1 Parent(s): 7ca9c00

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -1
app.py CHANGED
@@ -79,7 +79,7 @@ def trace_origins(description_html, max_depth=2):
79
  seeds = [a["href"] for a in soup_desc.find_all("a", href=True) if a["href"].startswith("http")]
80
  # include any URLs in text
81
  text = soup_desc.get_text(separator=' ')
82
- seeds += re.findall(r"https?://[^\s"']+", text)
83
  seen = set()
84
  def recurse(url, depth):
85
  if depth > max_depth or url in seen:
 
79
  seeds = [a["href"] for a in soup_desc.find_all("a", href=True) if a["href"].startswith("http")]
80
  # include any URLs in text
81
  text = soup_desc.get_text(separator=' ')
82
+ seeds += re.findall(r"https?://[^\s\"']+", text)
83
  seen = set()
84
  def recurse(url, depth):
85
  if depth > max_depth or url in seen: