Spaces:
Sleeping
Sleeping
Commit
·
2f59867
1
Parent(s):
d4ff3d2
Update app.py
Browse files
app.py
CHANGED
@@ -21,6 +21,7 @@ def extract_website_domain(url):
|
|
21 |
def google_address(address):
|
22 |
|
23 |
address_number = re.findall(r'\b\d+\b', address)[0]
|
|
|
24 |
|
25 |
search_query = quote(address)
|
26 |
url=f'https://www.google.com/search?q={search_query}'
|
@@ -55,16 +56,17 @@ def google_address(address):
|
|
55 |
|
56 |
df['Square Footage']=df['Description'].str.extract(r"((\d+) Square Feet|(\d+) sq. ft.|(\d+) sqft|(\d+) Sq. Ft.|(\d+) sq|(\d+(?:,\d+)?) Sq\. Ft\.|(\d+(?:,\d+)?) sq)")[0]
|
57 |
df['Square Footage']=df['Square Footage'].replace({',':''},regex=True).str.replace(r'\D', '')
|
58 |
-
|
59 |
df['Beds']=df['Description'].replace({'-':' ','total':''},regex=True).str.extract(r"(\d+) bed")
|
60 |
|
|
|
61 |
df['Baths']=df['Description'].replace({'-':' ','total':''},regex=True).str.extract(r"((\d+) bath|(\d+(?:\.\d+)?) bath)")[0]
|
62 |
df['Baths']=df['Baths'].str.extract(r'([\d.]+)').astype(float)
|
63 |
|
64 |
df['Year Built']=df['Description'].str.extract(r"built in (\d{4})")
|
65 |
|
66 |
df_final=df[df['Address'].notnull()]
|
67 |
-
df_final=df_final[df_final['Address'].str.contains(str(address_number))]
|
68 |
df_final.insert(0,'Address Input',address)
|
69 |
return df_final
|
70 |
|
|
|
21 |
def google_address(address):
|
22 |
|
23 |
address_number = re.findall(r'\b\d+\b', address)[0]
|
24 |
+
address_zip =re.search(r'(\d{5})$', address).group()
|
25 |
|
26 |
search_query = quote(address)
|
27 |
url=f'https://www.google.com/search?q={search_query}'
|
|
|
56 |
|
57 |
df['Square Footage']=df['Description'].str.extract(r"((\d+) Square Feet|(\d+) sq. ft.|(\d+) sqft|(\d+) Sq. Ft.|(\d+) sq|(\d+(?:,\d+)?) Sq\. Ft\.|(\d+(?:,\d+)?) sq)")[0]
|
58 |
df['Square Footage']=df['Square Footage'].replace({',':''},regex=True).str.replace(r'\D', '')
|
59 |
+
|
60 |
df['Beds']=df['Description'].replace({'-':' ','total':''},regex=True).str.extract(r"(\d+) bed")
|
61 |
|
62 |
+
|
63 |
df['Baths']=df['Description'].replace({'-':' ','total':''},regex=True).str.extract(r"((\d+) bath|(\d+(?:\.\d+)?) bath)")[0]
|
64 |
df['Baths']=df['Baths'].str.extract(r'([\d.]+)').astype(float)
|
65 |
|
66 |
df['Year Built']=df['Description'].str.extract(r"built in (\d{4})")
|
67 |
|
68 |
df_final=df[df['Address'].notnull()]
|
69 |
+
df_final=df_final[(df_final['Address'].str.contains(str(address_number))| df_final['Address'].str.contains(str(address_zip)))]
|
70 |
df_final.insert(0,'Address Input',address)
|
71 |
return df_final
|
72 |
|