# - Scrapes job listings from the Greenhouse, Lever, and Ashby platforms
# - Tracks 14 companies (1Password, DuckDuckGo, GitLab, etc.)
# - Uses a SQLite database for change detection
# - Filters by engineering job titles and location preferences
# - Generates a static HTML dashboard with search/filter
# - Includes Docker support for deployment to a Debian server
116 lines
2.4 KiB
YAML
116 lines
2.4 KiB
YAML
# Job Scraper Configuration
# ===========================

# Location filters - jobs matching these locations will be highlighted
location_filters:
  - remote
  - canada
  - toronto
  - vancouver
  - berlin
  - germany

# Job title filters - only jobs containing these keywords will be tracked
# Leave empty or remove to track all jobs
title_filters:
  - engineer
  - developer
  - software
  - sre
  - devops
  - infrastructure
  - platform
  - backend
  - frontend
  - fullstack
  - full-stack
  - security

# Companies to monitor
# Each company needs: name, platform, and platform-specific config
# Platform-specific key used by the entries below:
#   lever      -> lever_company
#   ashby      -> ashby_company
#   greenhouse -> board_token
companies:
  # Privacy & Security Focused
  - name: Signal
    platform: lever
    lever_company: signal

  - name: DuckDuckGo
    platform: ashby
    ashby_company: duck-duck-go

  - name: 1Password
    platform: ashby
    ashby_company: 1password

  - name: Bitwarden
    platform: greenhouse
    board_token: bitwarden

  # Open Source Infrastructure & DevTools
  - name: GrafanaLabs
    platform: greenhouse
    board_token: grafanalabs

  - name: GitLab
    platform: greenhouse
    board_token: gitlab

  - name: Sourcegraph
    platform: greenhouse
    board_token: sourcegraph91

  - name: Supabase
    platform: ashby
    ashby_company: supabase

  - name: Tailscale
    platform: greenhouse
    board_token: tailscale

  - name: HashiCorp
    platform: greenhouse
    board_token: hashicorp

  # Developer Tools & Platforms
  - name: Automattic
    platform: greenhouse
    board_token: automatticcareers

  - name: Canonical
    platform: greenhouse
    board_token: canonical

  - name: ClickHouse
    platform: greenhouse
    board_token: clickhouse

  - name: Cloudflare
    platform: greenhouse
    board_token: cloudflare

# Notification settings (optional - configure as needed)
notifications:
  # Console output is always enabled
  console: true

  # Uncomment and configure for email notifications
  # (the commented keys keep their nesting so they can be uncommented as-is;
  # avoid committing a real password to version control)
  # email:
  #   smtp_host: smtp.gmail.com
  #   smtp_port: 587
  #   username: your-email@gmail.com
  #   password: your-app-password
  #   from_addr: your-email@gmail.com
  #   to_addr: your-email@gmail.com

  # Uncomment for Slack webhook
  # slack:
  #   webhook_url: https://hooks.slack.com/services/YOUR/WEBHOOK/URL

# Scraper settings
scraper:
  # Delay between requests in seconds (be respectful!)
  request_delay: 2
  # Timeout for requests in seconds
  timeout: 30
  # Number of retries on failure
  retries: 3