48 lines
1.3 KiB
Python
48 lines
1.3 KiB
Python
import re
|
|
|
|
|
|
def parse_address_two(street_address: str) -> tuple:
|
|
if not street_address:
|
|
return street_address, None
|
|
|
|
apt_match = re.search(
|
|
r"(APT\s*[\dA-Z]+|#[\dA-Z]+|UNIT\s*[\dA-Z]+|LOT\s*[\dA-Z]+)$",
|
|
street_address,
|
|
re.I,
|
|
)
|
|
|
|
if apt_match:
|
|
apt_str = apt_match.group().strip()
|
|
cleaned_apt_str = re.sub(r"(APT\s*|UNIT\s*|LOT\s*)", "#", apt_str, flags=re.I)
|
|
|
|
main_address = street_address.replace(
|
|
apt_str, ""
|
|
).strip() # Remove the matched part from the original address
|
|
return main_address, cleaned_apt_str
|
|
else:
|
|
return street_address, None
|
|
|
|
|
|
def parse_unit(street_address: str):
|
|
if not street_address:
|
|
return None
|
|
apt_match = re.search(
|
|
r"(APT\s*[\dA-Z]+|#[\dA-Z]+|UNIT\s*[\dA-Z]+|LOT\s*[\dA-Z]+)$",
|
|
street_address,
|
|
re.I,
|
|
)
|
|
|
|
if apt_match:
|
|
apt_str = apt_match.group().strip()
|
|
apt_str = re.sub(r"(APT\s*|UNIT\s*|LOT\s*)", "#", apt_str, flags=re.I)
|
|
return apt_str
|
|
else:
|
|
return None
|
|
|
|
|
|
if __name__ == "__main__":
|
|
print(parse_address_two("4303 E Cactus Rd Apt 126"))
|
|
print(parse_address_two("1234 Elm Street apt 2B"))
|
|
print(parse_address_two("1234 Elm Street UNIT 3A"))
|
|
print(parse_address_two("1234 Elm Street unit 3A"))
|