Fix Google job search (#223)

The previous regex did not capture all expected matches in the returned content.
main
Jason Geffner 2024-12-04 14:45:59 -08:00 committed by GitHub
parent e44d13e1cf
commit 4e7ac9a583
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
1 changed file with 1 addition and 1 deletion

View File

@@ -232,7 +232,7 @@ class GoogleJobsScraper(Scraper):
def _find_job_info_initial_page(html_text: str):
pattern = (
f'520084652":('
+ r"\[(?:[^\[\]]|\[(?:[^\[\]]|\[(?:[^\[\]]|\[[^\[\]]*\])*\])*\])*\])"
+ r"\[.*?\]\s*])\s*}\s*]\s*]\s*]\s*]\s*]"
)
results = []
matches = re.finditer(pattern, html_text)