File size: 340 Bytes
bb0b469
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
import requests
from bs4 import BeautifulSoup

# Headers that fetch() passes to requests.get; the User-Agent string
# identifies this client to the server being queried.
HEADERS = {"User-Agent": "FOIA-Federated-Search/1.0 (public, non-crawling)"}

def fetch(url, params=None, *, timeout=10):
    """Issue an HTTP GET for *url* and return the response body as text.

    Args:
        url: Address to request.
        params: Optional query-string parameters, forwarded unchanged to
            ``requests.get``.
        timeout: Timeout forwarded to ``requests.get``. Defaults to 10,
            the value that used to be hard-coded, so existing callers
            behave exactly as before.

    Returns:
        The decoded response body (``Response.text``).

    Raises:
        requests.HTTPError: Raised by ``raise_for_status()`` when the
            server answers with an error status.
        Any other exception raised by ``requests.get`` propagates
        unchanged.
    """
    response = requests.get(
        url,
        params=params,
        headers=HEADERS,
        timeout=timeout,
    )
    # Surface error statuses as exceptions rather than handing the caller
    # an error page disguised as a successful result.
    response.raise_for_status()
    return response.text

def clean(text):
    """Collapse every run of whitespace in *text* to a single space.

    Leading and trailing whitespace is dropped. A falsy *text* (for
    example ``None`` or ``""``) yields an empty string.
    """
    if not text:
        return ""
    words = text.split()
    return " ".join(words)