Spaces:
Running
Running
from __future__ import annotations

from dataclasses import dataclass
@dataclass
class FetchResult:
    """Plain record holding the outcome of fetching a single URL.

    Declared as a dataclass so that instances can be built with keyword
    arguments and get a generated ``__repr__`` and field-wise ``__eq__``.
    All fields are required; none has a default.
    """

    # Address the result belongs to.
    url: str
    # Numeric status of the fetch (presumably the HTTP status code --
    # TODO confirm against the code that builds this record).
    status: int
    # When the fetch happened, stored as text; the exact timestamp format
    # is not visible in this part of the file.
    fetched_at: str
    # Content type reported for the response, kept as a raw string.
    content_type: str
    # Page body as text.
    html: str
@dataclass
class CrawlStats:
    """Mutable set of integer counters, every one starting at zero.

    Declared as a dataclass so each instance gets its own copy of the
    counters and can be created with ``CrawlStats()`` or with keyword
    overrides.  The field names suggest they track successive stages of a
    crawl pipeline; the code that increments them is not part of this
    section, so the per-group notes below are inferred from names only.
    """

    # Queueing / fetching (meaning inferred from names -- verify at call sites).
    queued_urls: int = 0
    fetch_reserved: int = 0
    fetch_succeeded: int = 0
    fetch_failed: int = 0

    # Parsing and link handling.
    parsed_pages: int = 0
    parse_failed: int = 0
    extracted_links: int = 0
    dropped_urls: int = 0
    robots_blocked: int = 0

    # Storage and shard output.
    stored_rows: int = 0
    written_shards: int = 0
    uploaded_shards: int = 0

    # Tokenization.
    tokenized_shards: int = 0
    tokenized_rows: int = 0
    tokenized_tokens: int = 0