Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -39,7 +39,7 @@ def download_file(url, local_filename):
| 39 |   |
| 40 |   | def download_html_and_files(url, subdir):
| 41 |   |     html_content = requests.get(url).text
| 42 | - |     soup = BeautifulSoup(html_content, 'html.parser',
| 43 |   |     base_url = urllib.parse.urlunparse(urllib.parse.urlparse(url)._replace(path='', params='', query='', fragment=''))
| 44 |   |
| 45 |   |     for link in soup.find_all('a'):
| 39 |   |
| 40 |   | def download_html_and_files(url, subdir):
| 41 |   |     html_content = requests.get(url).text
| 42 | + |     soup = BeautifulSoup(html_content, 'html.parser', 'lxml-xml')
| 43 |   |     base_url = urllib.parse.urlunparse(urllib.parse.urlparse(url)._replace(path='', params='', query='', fragment=''))
| 44 |   |
| 45 |   |     for link in soup.find_all('a'):