From 6330c148797fdda3e1f61591734d8ac4bde77a39 Mon Sep 17 00:00:00 2001 From: Cullen Watson Date: Mon, 15 Jul 2024 21:19:01 -0500 Subject: [PATCH] minor fix --- src/jobspy/__init__.py | 2 +- src/jobspy/scrapers/indeed/__init__.py | 1 + src/jobspy/scrapers/linkedin/__init__.py | 6 +++--- 3 files changed, 5 insertions(+), 4 deletions(-) diff --git a/src/jobspy/__init__.py b/src/jobspy/__init__.py index a29f571..3e69a60 100644 --- a/src/jobspy/__init__.py +++ b/src/jobspy/__init__.py @@ -210,13 +210,13 @@ def scrape_jobs( "is_remote", "job_level", "job_function", + "company_industry", "listing_type", "emails", "description", "company_url", "company_url_direct", "company_addresses", - "company_industry", "company_num_employees", "company_revenue", "company_description", diff --git a/src/jobspy/scrapers/indeed/__init__.py b/src/jobspy/scrapers/indeed/__init__.py index 252d7de..21ad103 100644 --- a/src/jobspy/scrapers/indeed/__init__.py +++ b/src/jobspy/scrapers/indeed/__init__.py @@ -244,6 +244,7 @@ class IndeedScraper(Scraper): .replace("Iv1", "") .replace("_", " ") .title() + .strip() if employer_details.get("industry") else None ), diff --git a/src/jobspy/scrapers/linkedin/__init__.py b/src/jobspy/scrapers/linkedin/__init__.py index 45bf31a..6f301ef 100644 --- a/src/jobspy/scrapers/linkedin/__init__.py +++ b/src/jobspy/scrapers/linkedin/__init__.py @@ -219,7 +219,7 @@ class LinkedInScraper(Scraper): job_url=f"{self.base_url}/jobs/view/{job_id}", compensation=compensation, job_type=job_details.get("job_type"), - job_level=job_details.get("job_level"), + job_level=job_details.get("job_level", "").lower(), company_industry=job_details.get("company_industry"), description=job_details.get("description"), job_url_direct=job_details.get("job_url_direct"), @@ -351,7 +351,7 @@ class LinkedInScraper(Scraper): job_level = job_level_span.get_text(strip=True) return job_level - + @staticmethod def _parse_company_industry(soup_industry: BeautifulSoup) -> str | None: """ @@ -373,7 +373,7 @@ class LinkedInScraper(Scraper): if industry_span: industry = industry_span.get_text(strip=True) - return industry + return industry def _parse_job_url_direct(self, soup: BeautifulSoup) -> str | None: """