Spaces:
Sleeping
Sleeping
File size: 1,096 Bytes
19a3093 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 | """Probe for section-level parquet files on Lex CDN."""
import httpx
base = "https://lexdownloads.blob.core.windows.net/downloads/latest"
patterns = [
"legislation_section.parquet",
"legislation_sections.parquet",
"legislation_section_1983.parquet",
"legislation_section/1983.parquet",
"sections/1983.parquet",
"legislation_sections/1983.parquet",
"legislation_section_2005.parquet",
"legislation_section_2014.parquet",
"sections_1983.parquet",
"legislation-section.parquet",
"legislation-sections.parquet",
"explanatory_note.parquet",
"amendment.parquet",
]
for p in patterns:
url = f"{base}/{p}"
try:
r = httpx.head(url, timeout=10, follow_redirects=True)
size = r.headers.get("content-length", "?")
mb = int(size) // 1024 // 1024 if size.isdigit() else "?"
status = "FOUND" if r.status_code == 200 else str(r.status_code)
print(f"{status}: {p} ({mb} MB)" if r.status_code == 200 else f" {r.status_code}: {p}")
except Exception as e:
print(f" ERROR: {p} -> {type(e).__name__}")
|