Spaces:
Sleeping
Sleeping
meirk-brd
committed on
Commit
·
87f5e0a
1
Parent(s):
1711f91
add url validation
Browse files
tool.py
CHANGED
|
@@ -216,16 +216,18 @@ class BrightDataDatasetTool(Tool):
|
|
| 216 |
return self._ensure_scheme(raw)
|
| 217 |
|
| 218 |
if isinstance(raw, dict):
|
|
|
|
|
|
|
|
|
|
|
|
|
| 219 |
orig_name = raw.get("orig_name")
|
| 220 |
-
if
|
|
|
|
|
|
|
|
|
|
|
|
|
| 221 |
return self._ensure_scheme(orig_name)
|
| 222 |
|
| 223 |
-
url_value = raw.get("url")
|
| 224 |
-
if isinstance(url_value, str):
|
| 225 |
-
if url_value.startswith(("http://", "https://")):
|
| 226 |
-
return url_value
|
| 227 |
-
return None
|
| 228 |
-
|
| 229 |
return None
|
| 230 |
|
| 231 |
def _ensure_scheme(self, url: str) -> str:
|
|
|
|
| 216 |
return self._ensure_scheme(raw)
|
| 217 |
|
| 218 |
if isinstance(raw, dict):
|
| 219 |
+
url_value = raw.get("url")
|
| 220 |
+
if isinstance(url_value, str) and url_value.startswith(("http://", "https://")):
|
| 221 |
+
return url_value
|
| 222 |
+
|
| 223 |
orig_name = raw.get("orig_name")
|
| 224 |
+
if (
|
| 225 |
+
isinstance(orig_name, str)
|
| 226 |
+
and orig_name
|
| 227 |
+
and (orig_name.startswith(("http://", "https://")) or "." in orig_name)
|
| 228 |
+
):
|
| 229 |
return self._ensure_scheme(orig_name)
|
| 230 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 231 |
return None
|
| 232 |
|
| 233 |
def _ensure_scheme(self, url: str) -> str:
|