mirror of https://github.com/Bunsly/JobSpy
set proxy
parent
2e59ab03e3
commit
4ae48d83c4
|
@ -2,13 +2,15 @@ from jobspy import scrape_jobs
|
||||||
import pandas as pd
|
import pandas as pd
|
||||||
|
|
||||||
jobs: pd.DataFrame = scrape_jobs(
|
jobs: pd.DataFrame = scrape_jobs(
|
||||||
site_name=["indeed", "linkedin", "zip_recruiter"],
|
# site_name=["indeed", "linkedin", "zip_recruiter"],
|
||||||
|
site_name=["indeed"],
|
||||||
search_term="software engineer",
|
search_term="software engineer",
|
||||||
location="Dallas, TX",
|
location="Dallas, TX",
|
||||||
results_wanted=50, # be wary: the higher it is, the more likely you'll get blocked (a rotating proxy should work though)
|
results_wanted=20, # be wary: the higher it is, the more likely you'll get blocked (a rotating proxy should work though)
|
||||||
country_indeed='USA',
|
country_indeed='USA',
|
||||||
offset=25 # start jobs from an offset (use if search failed and want to continue)
|
# offset=25 # start jobs from an offset (use if search failed and want to continue)
|
||||||
# proxy="http://jobspy:5a4vpWtj8EeJ2hoYzk@ca.smartproxy.com:20001",
|
# proxy="http://34.120.172.140:8123",
|
||||||
|
proxy="http://crawler-gost-proxy.jobright-internal.com:8080",
|
||||||
)
|
)
|
||||||
|
|
||||||
# formatting for pandas
|
# formatting for pandas
|
||||||
|
|
Loading…
Reference in New Issue