feat: Add ability to filter jobs by time posted for LinkedIn, Indeed, Glassdoor, and ZipRecruiter (#103)

This commit is contained in:
VitaminB16
2024-02-09 20:02:03 +00:00
committed by GitHub
parent 2563c5ca08
commit 91b137ef86
7 changed files with 53 additions and 23 deletions

View File

@@ -42,6 +42,8 @@ def scrape_jobs(
full_description: bool | None = False,
linkedin_company_ids: list[int] | None = None,
offset: int | None = 0,
hours_old: int = None,
**kwargs,
) -> pd.DataFrame:
"""
Simultaneously scrapes job data from multiple job sites.
@@ -84,6 +86,7 @@ def scrape_jobs(
results_wanted=results_wanted,
linkedin_company_ids=linkedin_company_ids,
offset=offset,
hours_old=hours_old
)
def scrape_site(site: Site) -> Tuple[str, JobResponse]:
@@ -189,4 +192,4 @@ def scrape_jobs(
else:
jobs_formatted_df = pd.DataFrame()
return jobs_formatted_df
return jobs_formatted_df.sort_values(by='date_posted', ascending=False)