mattritchey committed on
Commit
2f59867
·
1 Parent(s): d4ff3d2

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -2
app.py CHANGED
@@ -21,6 +21,7 @@ def extract_website_domain(url):
21
  def google_address(address):
22
 
23
  address_number = re.findall(r'\b\d+\b', address)[0]
 
24
 
25
  search_query = quote(address)
26
  url=f'https://www.google.com/search?q={search_query}'
@@ -55,16 +56,17 @@ def google_address(address):
55
 
56
  df['Square Footage']=df['Description'].str.extract(r"((\d+) Square Feet|(\d+) sq. ft.|(\d+) sqft|(\d+) Sq. Ft.|(\d+) sq|(\d+(?:,\d+)?) Sq\. Ft\.|(\d+(?:,\d+)?) sq)")[0]
57
  df['Square Footage']=df['Square Footage'].replace({',':''},regex=True).str.replace(r'\D', '')
58
-
59
  df['Beds']=df['Description'].replace({'-':' ','total':''},regex=True).str.extract(r"(\d+) bed")
60
 
 
61
  df['Baths']=df['Description'].replace({'-':' ','total':''},regex=True).str.extract(r"((\d+) bath|(\d+(?:\.\d+)?) bath)")[0]
62
  df['Baths']=df['Baths'].str.extract(r'([\d.]+)').astype(float)
63
 
64
  df['Year Built']=df['Description'].str.extract(r"built in (\d{4})")
65
 
66
  df_final=df[df['Address'].notnull()]
67
- df_final=df_final[df_final['Address'].str.contains(str(address_number))]
68
  df_final.insert(0,'Address Input',address)
69
  return df_final
70
 
 
21
  def google_address(address):
22
 
23
  address_number = re.findall(r'\b\d+\b', address)[0]
24
+ address_zip =re.search(r'(\d{5})$', address).group()
25
 
26
  search_query = quote(address)
27
  url=f'https://www.google.com/search?q={search_query}'
 
56
 
57
  df['Square Footage']=df['Description'].str.extract(r"((\d+) Square Feet|(\d+) sq. ft.|(\d+) sqft|(\d+) Sq. Ft.|(\d+) sq|(\d+(?:,\d+)?) Sq\. Ft\.|(\d+(?:,\d+)?) sq)")[0]
58
  df['Square Footage']=df['Square Footage'].replace({',':''},regex=True).str.replace(r'\D', '')
59
+
60
  df['Beds']=df['Description'].replace({'-':' ','total':''},regex=True).str.extract(r"(\d+) bed")
61
 
62
+
63
  df['Baths']=df['Description'].replace({'-':' ','total':''},regex=True).str.extract(r"((\d+) bath|(\d+(?:\.\d+)?) bath)")[0]
64
  df['Baths']=df['Baths'].str.extract(r'([\d.]+)').astype(float)
65
 
66
  df['Year Built']=df['Description'].str.extract(r"built in (\d{4})")
67
 
68
  df_final=df[df['Address'].notnull()]
69
+ df_final=df_final[(df_final['Address'].str.contains(str(address_number))| df_final['Address'].str.contains(str(address_zip)))]
70
  df_final.insert(0,'Address Input',address)
71
  return df_final
72