Spaces:
Sleeping
Sleeping
Commit
·
2f59867
1
Parent(s):
d4ff3d2
Update app.py
Browse files
app.py
CHANGED
|
@@ -21,6 +21,7 @@ def extract_website_domain(url):
|
|
| 21 |
def google_address(address):
|
| 22 |
|
| 23 |
address_number = re.findall(r'\b\d+\b', address)[0]
|
|
|
|
| 24 |
|
| 25 |
search_query = quote(address)
|
| 26 |
url=f'https://www.google.com/search?q={search_query}'
|
|
@@ -55,16 +56,17 @@ def google_address(address):
|
|
| 55 |
|
| 56 |
df['Square Footage']=df['Description'].str.extract(r"((\d+) Square Feet|(\d+) sq. ft.|(\d+) sqft|(\d+) Sq. Ft.|(\d+) sq|(\d+(?:,\d+)?) Sq\. Ft\.|(\d+(?:,\d+)?) sq)")[0]
|
| 57 |
df['Square Footage']=df['Square Footage'].replace({',':''},regex=True).str.replace(r'\D', '')
|
| 58 |
-
|
| 59 |
df['Beds']=df['Description'].replace({'-':' ','total':''},regex=True).str.extract(r"(\d+) bed")
|
| 60 |
|
|
|
|
| 61 |
df['Baths']=df['Description'].replace({'-':' ','total':''},regex=True).str.extract(r"((\d+) bath|(\d+(?:\.\d+)?) bath)")[0]
|
| 62 |
df['Baths']=df['Baths'].str.extract(r'([\d.]+)').astype(float)
|
| 63 |
|
| 64 |
df['Year Built']=df['Description'].str.extract(r"built in (\d{4})")
|
| 65 |
|
| 66 |
df_final=df[df['Address'].notnull()]
|
| 67 |
-
df_final=df_final[df_final['Address'].str.contains(str(address_number))]
|
| 68 |
df_final.insert(0,'Address Input',address)
|
| 69 |
return df_final
|
| 70 |
|
|
|
|
| 21 |
def google_address(address):
|
| 22 |
|
| 23 |
address_number = re.findall(r'\b\d+\b', address)[0]
|
| 24 |
+
address_zip =re.search(r'(\d{5})$', address).group()
|
| 25 |
|
| 26 |
search_query = quote(address)
|
| 27 |
url=f'https://www.google.com/search?q={search_query}'
|
|
|
|
| 56 |
|
| 57 |
df['Square Footage']=df['Description'].str.extract(r"((\d+) Square Feet|(\d+) sq. ft.|(\d+) sqft|(\d+) Sq. Ft.|(\d+) sq|(\d+(?:,\d+)?) Sq\. Ft\.|(\d+(?:,\d+)?) sq)")[0]
|
| 58 |
df['Square Footage']=df['Square Footage'].replace({',':''},regex=True).str.replace(r'\D', '')
|
| 59 |
+
|
| 60 |
df['Beds']=df['Description'].replace({'-':' ','total':''},regex=True).str.extract(r"(\d+) bed")
|
| 61 |
|
| 62 |
+
|
| 63 |
df['Baths']=df['Description'].replace({'-':' ','total':''},regex=True).str.extract(r"((\d+) bath|(\d+(?:\.\d+)?) bath)")[0]
|
| 64 |
df['Baths']=df['Baths'].str.extract(r'([\d.]+)').astype(float)
|
| 65 |
|
| 66 |
df['Year Built']=df['Description'].str.extract(r"built in (\d{4})")
|
| 67 |
|
| 68 |
df_final=df[df['Address'].notnull()]
|
| 69 |
+
df_final=df_final[(df_final['Address'].str.contains(str(address_number))| df_final['Address'].str.contains(str(address_zip)))]
|
| 70 |
df_final.insert(0,'Address Input',address)
|
| 71 |
return df_final
|
| 72 |
|