fix(zr): date posted (#98)

2024-02-03 07:20:53 -06:00 · 2024-02-03 07:20:53 -06:00 · 02caf1b38d
parent 8e2ab277da
commit 02caf1b38d
3 changed files with 5 additions and 14 deletions
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "python-jobspy"
-version = "1.1.40"
+version = "1.1.41"
 description = "Job scraper for LinkedIn, Indeed, Glassdoor & ZipRecruiter"
 authors = ["Zachary Hampton <zachary@bunsly.com>", "Cullen Watson <cullen@bunsly.com>"]
 homepage = "https://github.com/Bunsly/JobSpy"
--- a/src/jobspy/scrapers/glassdoor/__init__.py
+++ b/src/jobspy/scrapers/glassdoor/__init__.py
@@ -246,6 +246,8 @@ class GlassdoorScraper(Scraper):
            location_type = "CITY"
        elif location_type == "S":
            location_type = "STATE"
+        elif location_type == 'N':
+            location_type = "COUNTRY"
        return int(items[0]["locationId"]), location_type
    @staticmethod
--- a/src/jobspy/scrapers/ziprecruiter/__init__.py
+++ b/src/jobspy/scrapers/ziprecruiter/__init__.py
@@ -6,8 +6,7 @@ This module contains routines to scrape ZipRecruiter.
 """
 import math
 import time
-import re
+from datetime import datetime, timezone
-from datetime import datetime, date
 from typing import Optional, Tuple, Any
 from bs4 import BeautifulSoup
@@ -119,17 +118,7 @@ class ZipRecruiterScraper(Scraper):
        job_type = ZipRecruiterScraper.get_job_type_enum(
            job.get("employment_type", "").replace("_", "").lower()
        )
-
+        date_posted = datetime.fromisoformat(job['posted_time'].rstrip("Z")).date()
-        save_job_url = job.get("SaveJobURL", "")
-        posted_time_match = re.search(
-            r"posted_time=(\d{4}-\d{2}-\d{2}T\d{2}:\d{2}:\d{2}Z)", save_job_url
-        )
-        if posted_time_match:
-            date_time_str = posted_time_match.group(1)
-            date_posted_obj = datetime.strptime(date_time_str, "%Y-%m-%dT%H:%M:%SZ")
-            date_posted = date_posted_obj.date()
-        else:
-            date_posted = date.today()
        return JobPost(
            title=title,