HomeHarvest/homeharvest/__init__.py

from .core.scrapers.redfin import RedfinScraper
from .core.scrapers.realtor import RealtorScraper
from .core.scrapers.types import ListingType, Home
from .core.scrapers import ScraperInput
from .exceptions import InvalidSite, InvalidListingType


# Registry mapping a lowercase site name to the scraper class that handles it.
# scrape_property() lowercases the caller-supplied site name before looking it
# up here, so keys must be stored in lowercase.
_scrapers = {
    "redfin": RedfinScraper,
    "realtor.com": RealtorScraper
}


def scrape_property(
        location: str,
        site_name: str,
        listing_type: str = "for_sale",  #: for_sale, for_rent, sold
) -> list[Home]:  #: eventually, return pandas dataframe
    """Search a supported site for properties at *location*.

    Args:
        location: Passed through unchanged to ``ScraperInput``.
        site_name: Name of the site to scrape. It is lowercased and must
            match a key of the module-level ``_scrapers`` registry.
        listing_type: Name of a ``ListingType`` member. It is uppercased
            before being looked up, so the match is case-insensitive.

    Returns:
        Whatever the selected scraper's ``search()`` method returns
        (annotated as a list of ``Home``).

    Raises:
        InvalidSite: If the lowercased ``site_name`` is not registered.
        InvalidListingType: If the uppercased ``listing_type`` is not a
            member name of ``ListingType``.
    """
    # Normalise once so the membership test and the later lookup share a key.
    site_key = site_name.lower()
    if site_key not in _scrapers:
        raise InvalidSite(f"Provided site, '{site_name}', does not exist.")

    # The site is validated first; the listing type is only checked afterwards.
    type_key = listing_type.upper()
    if type_key not in ListingType.__members__:
        raise InvalidListingType(f"Provided listing type, '{listing_type}', does not exist.")

    request = ScraperInput(
        location=location,
        listing_type=ListingType[type_key],
    )

    # Instantiate the registered scraper class with the request and run it.
    return _scrapers[site_key](request).search()
- base 2023-09-15 15:17:37 -07:00			`from .core.scrapers.redfin import RedfinScraper`
- realtor init 2023-09-15 20:58:54 -07:00			`from .core.scrapers.realtor import RealtorScraper`
- base 2023-09-15 15:17:37 -07:00			`from .core.scrapers.types import ListingType, Home`
			`from .core.scrapers import ScraperInput`
			`from .exceptions import InvalidSite, InvalidListingType`


			`_scrapers = {`
			`"redfin": RedfinScraper,`
- realtor init 2023-09-15 20:58:54 -07:00			`"realtor.com": RealtorScraper`
- base 2023-09-15 15:17:37 -07:00			`}`


			`def scrape_property(`
			`location: str,`
- realtor init 2023-09-15 20:58:54 -07:00			`site_name: str,`
- base 2023-09-15 15:17:37 -07:00			`listing_type: str = "for_sale", #: for_sale, for_rent, sold`
			`) -> list[Home]: #: eventually, return pandas dataframe`
- housekeeping 2023-09-15 15:21:29 -07:00			`if site_name.lower() not in _scrapers:`
- base 2023-09-15 15:17:37 -07:00			`raise InvalidSite(f"Provided site, '{site_name}', does not exist.")`

			`if listing_type.upper() not in ListingType.__members__:`
			`raise InvalidListingType(f"Provided listing type, '{listing_type}', does not exist.")`

			`scraper_input = ScraperInput(`
			`location=location,`
			`listing_type=ListingType[listing_type.upper()],`
			`)`

- housekeeping 2023-09-15 15:21:29 -07:00			`site = _scrapers[site_name.lower()](scraper_input)`
- base 2023-09-15 15:17:37 -07:00
			`return site.search()`