mirror of https://github.com/Bunsly/JobSpy
Fix Google job search (#223)
The previous regex did not capture all expected matches in the returned content
main
parent
e44d13e1cf
commit
4e7ac9a583
|
@@ -232,7 +232,7 @@ class GoogleJobsScraper(Scraper):
|
||||||
def _find_job_info_initial_page(html_text: str):
|
def _find_job_info_initial_page(html_text: str):
|
||||||
pattern = (
|
pattern = (
|
||||||
f'520084652":('
|
f'520084652":('
|
||||||
+ r"\[(?:[^\[\]]|\[(?:[^\[\]]|\[(?:[^\[\]]|\[[^\[\]]*\])*\])*\])*\])"
|
+ r"\[.*?\]\s*])\s*}\s*]\s*]\s*]\s*]\s*]"
|
||||||
)
|
)
|
||||||
results = []
|
results = []
|
||||||
matches = re.finditer(pattern, html_text)
|
matches = re.finditer(pattern, html_text)
|
||||||
|
|
Loading…
Reference in New Issue