JobSpy/.github/workflows/job_scraper_dynamic.yml

87 lines
2.7 KiB
YAML

name: JobSpy Scraper Dynamic Workflow
on:
workflow_dispatch:
inputs:
user_email:
description: 'User email for the scraper'
required: true
default: 'branden@autoemployme.onmicrosoft.com'
search_terms:
description: 'Comma-separated list of search terms'
required: true
default: 'IT Support,CRM,Automation'
results_wanted:
description: 'Number of results to fetch'
required: true
default: '100'
max_days_old:
description: 'Fetch jobs posted in the last n days'
required: true
default: '2'
target_state:
description: 'Target state (e.g. NY)'
required: true
default: 'NY'
permissions:
actions: read
contents: read
id-token: write
jobs:
scrape_jobs:
runs-on: ubuntu-latest
steps:
- name: Checkout repository
uses: actions/checkout@v3
- name: Set up Python
uses: actions/setup-python@v4
with:
python-version: '3.10'
- name: Install dependencies
run: |
python -m pip install --upgrade pip
pip install -r requirements.txt
- name: Set environment variables
run: |
echo "USER_EMAIL=${{ github.event.inputs.user_email }}" >> $GITHUB_ENV
echo "SEARCH_TERMS=${{ github.event.inputs.search_terms }}" >> $GITHUB_ENV
echo "RESULTS_WANTED=${{ github.event.inputs.results_wanted }}" >> $GITHUB_ENV
echo "MAX_DAYS_OLD=${{ github.event.inputs.max_days_old }}" >> $GITHUB_ENV
echo "TARGET_STATE=${{ github.event.inputs.target_state }}" >> $GITHUB_ENV
- name: Sanitize email for filename
id: sanitize
run: |
safe_name=$(echo "${{ github.event.inputs.user_email }}" | sed 's/@/_at_/g; s/\./_/g')
echo "safe_name=$safe_name" >> $GITHUB_OUTPUT
- name: Run JobSpy Scraper Dynamic
run: |
python job_scraper_dynamic.py \
"${{ env.SEARCH_TERMS }}" \
"${{ env.RESULTS_WANTED }}" \
"${{ env.MAX_DAYS_OLD }}" \
"${{ env.TARGET_STATE }}" \
"${{ steps.sanitize.outputs.safe_name }}"
- name: Verify jobspy_output_dynamic file exists
run: |
file="jobspy_output_dynamic_${{ steps.sanitize.outputs.safe_name }}.csv"
if [ ! -f "$file" ]; then
echo "❌ ERROR: $file not found!"
exit 1
else
echo "✅ Output found: $file"
fi
- name: Upload JobSpy Output as Artifact
uses: actions/upload-artifact@v4
with:
name: jobspy-results-dynamic-${{ steps.sanitize.outputs.safe_name }}
path: jobspy_output_dynamic_${{ steps.sanitize.outputs.safe_name }}.csv