mirror of
https://github.com/Bunsly/JobSpy.git
synced 2026-03-06 04:24:30 -08:00
Compare commits
3 Commits
v1.1.79
...
94d413bad1
| Author | SHA1 | Date | |
|---|---|---|---|
| | 94d413bad1 | | |
| | 61205bcc77 | | |
| | f1602eca70 | | |
@@ -3,7 +3,7 @@ from __future__ import annotations
|
|||||||
import math
|
import math
|
||||||
import random
|
import random
|
||||||
import time
|
import time
|
||||||
from datetime import datetime, date
|
from datetime import datetime, date, timedelta
|
||||||
from typing import Optional
|
from typing import Optional
|
||||||
|
|
||||||
import regex as re
|
import regex as re
|
||||||
@@ -277,7 +277,7 @@ class Naukri(Scraper):
|
|||||||
match = re.search(r"(\d+)\s*day", label)
|
match = re.search(r"(\d+)\s*day", label)
|
||||||
if match:
|
if match:
|
||||||
days = int(match.group(1))
|
days = int(match.group(1))
|
||||||
parsed_date = today.replace(day=today.day - days).date()
|
parsed_date = (today - timedelta(days = days)).date()
|
||||||
log.debug(f"Date parsed: {days} days ago -> {parsed_date}")
|
log.debug(f"Date parsed: {days} days ago -> {parsed_date}")
|
||||||
return parsed_date
|
return parsed_date
|
||||||
elif created_date:
|
elif created_date:
|
||||||
|
|||||||
@@ -47,11 +47,12 @@ class RotatingProxySession:
|
|||||||
"""Utility method to format a proxy string into a dictionary."""
|
"""Utility method to format a proxy string into a dictionary."""
|
||||||
if proxy.startswith("http://") or proxy.startswith("https://"):
|
if proxy.startswith("http://") or proxy.startswith("https://"):
|
||||||
return {"http": proxy, "https": proxy}
|
return {"http": proxy, "https": proxy}
|
||||||
|
if proxy.startswith("socks5://"):
|
||||||
|
return {"http": proxy, "https": proxy}
|
||||||
return {"http": f"http://{proxy}", "https": f"http://{proxy}"}
|
return {"http": f"http://{proxy}", "https": f"http://{proxy}"}
|
||||||
|
|
||||||
|
|
||||||
class RequestsRotating(RotatingProxySession, requests.Session):
|
class RequestsRotating(RotatingProxySession, requests.Session):
|
||||||
|
|
||||||
def __init__(self, proxies=None, has_retry=False, delay=1, clear_cookies=False):
|
def __init__(self, proxies=None, has_retry=False, delay=1, clear_cookies=False):
|
||||||
RotatingProxySession.__init__(self, proxies=proxies)
|
RotatingProxySession.__init__(self, proxies=proxies)
|
||||||
requests.Session.__init__(self)
|
requests.Session.__init__(self)
|
||||||
@@ -86,7 +87,6 @@ class RequestsRotating(RotatingProxySession, requests.Session):
|
|||||||
|
|
||||||
|
|
||||||
class TLSRotating(RotatingProxySession, tls_client.Session):
|
class TLSRotating(RotatingProxySession, tls_client.Session):
|
||||||
|
|
||||||
def __init__(self, proxies=None):
|
def __init__(self, proxies=None):
|
||||||
RotatingProxySession.__init__(self, proxies=proxies)
|
RotatingProxySession.__init__(self, proxies=proxies)
|
||||||
tls_client.Session.__init__(self, random_tls_extension_order=True)
|
tls_client.Session.__init__(self, random_tls_extension_order=True)
|
||||||
@@ -344,7 +344,7 @@ desired_order = [
|
|||||||
"company_num_employees",
|
"company_num_employees",
|
||||||
"company_revenue",
|
"company_revenue",
|
||||||
"company_description",
|
"company_description",
|
||||||
#naukri-specific fields
|
# naukri-specific fields
|
||||||
"skills",
|
"skills",
|
||||||
"experience_range",
|
"experience_range",
|
||||||
"company_rating",
|
"company_rating",
|
||||||
|
|||||||
@@ -4,7 +4,7 @@ build-backend = "poetry.core.masonry.api"
|
|||||||
|
|
||||||
[tool.poetry]
|
[tool.poetry]
|
||||||
name = "python-jobspy"
|
name = "python-jobspy"
|
||||||
version = "1.1.79"
|
version = "1.1.80"
|
||||||
description = "Job scraper for LinkedIn, Indeed, Glassdoor, ZipRecruiter & Bayt"
|
description = "Job scraper for LinkedIn, Indeed, Glassdoor, ZipRecruiter & Bayt"
|
||||||
authors = ["Cullen Watson <cullen@cullenwatson.com>", "Zachary Hampton <zachary@zacharysproducts.com>"]
|
authors = ["Cullen Watson <cullen@cullenwatson.com>", "Zachary Hampton <zachary@zacharysproducts.com>"]
|
||||||
homepage = "https://github.com/cullenwatson/JobSpy"
|
homepage = "https://github.com/cullenwatson/JobSpy"
|
||||||
|
|||||||
Reference in New Issue
Block a user