# File: job-scraper/config.yaml

# Job Scraper Configuration
# ===========================
# Location filters: postings whose location matches one of these entries
# will be highlighted.
location_filters:
  - remote
  - canada
  - toronto
  - vancouver
  - berlin
  - germany
# Job title filters: only postings whose title contains one of these
# keywords will be tracked.
# Leave the list empty, or remove the key, to track all jobs.
title_filters:
  - engineer
  - developer
  - software
  - sre
  - devops
  - infrastructure
  - platform
  - backend
  - frontend
  - fullstack
  - full-stack
  - security
# Companies to monitor.
# Each entry needs a display `name`, the `platform` that hosts its job board,
# and the identifier key that goes with that platform:
#   lever      -> lever_company
#   ashby      -> ashby_company
#   greenhouse -> board_token
companies:
  # Privacy & Security Focused
  - name: Signal
    platform: lever
    lever_company: signal
  - name: DuckDuckGo
    platform: ashby
    ashby_company: duck-duck-go
  - name: 1Password
    platform: ashby
    ashby_company: 1password
  - name: Bitwarden
    platform: greenhouse
    board_token: bitwarden

  # Open Source Infrastructure & DevTools
  - name: GrafanaLabs
    platform: greenhouse
    board_token: grafanalabs
  - name: GitLab
    platform: greenhouse
    board_token: gitlab
  - name: Sourcegraph
    platform: greenhouse
    board_token: sourcegraph91
  - name: Supabase
    platform: ashby
    ashby_company: supabase
  - name: Tailscale
    platform: greenhouse
    board_token: tailscale

  # Developer Tools & Platforms
  - name: Automattic
    platform: greenhouse
    board_token: automatticcareers
  - name: Canonical
    platform: greenhouse
    board_token: canonical
  - name: ClickHouse
    platform: greenhouse
    board_token: clickhouse
  - name: Cloudflare
    platform: greenhouse
    board_token: cloudflare
  - name: Fastly
    platform: greenhouse
    board_token: fastly

  # Database & Data Infrastructure
  - name: Materialize
    platform: greenhouse
    board_token: materialize
  - name: PingCAP
    platform: greenhouse
    board_token: pingcap
  - name: CockroachLabs
    platform: greenhouse
    board_token: cockroachlabs
  - name: TigerData
    platform: ashby
    ashby_company: tigerdata

  # Observability & Monitoring
  - name: Honeycomb
    platform: greenhouse
    board_token: honeycomb
  - name: Datadog
    platform: greenhouse
    board_token: datadog
  - name: Sentry
    platform: ashby
    ashby_company: sentry

  # Cloud & Developer Platforms
  - name: Render
    platform: ashby
    ashby_company: render
  - name: Railway
    platform: ashby
    # NOTE(review): this slug is capitalized, unlike the other lowercase
    # ashby_company values - confirm the casing is intentional.
    ashby_company: Railway
  - name: Stripe
    platform: greenhouse
    board_token: stripe
  - name: JetBrains
    platform: greenhouse
    board_token: jetbrains

  # Rust-heavy / Visualization
  - name: Rerun
    platform: ashby
    ashby_company: rerun

  # Big Tech (Selective)
  - name: Discord
    platform: greenhouse
    board_token: discord
  - name: Dropbox
    platform: greenhouse
    board_token: dropbox
# Notification settings (optional - configure as needed)
notifications:
  # Console output is always enabled
  console: true

  # Uncomment and configure for email notifications.
  # Replace the placeholders with your own values; avoid committing real
  # credentials to version control.
  # email:
  #   smtp_host: smtp.gmail.com
  #   smtp_port: 587
  #   username: your-email@gmail.com
  #   password: your-app-password
  #   from_addr: your-email@gmail.com
  #   to_addr: your-email@gmail.com

  # Uncomment for Slack webhook
  # slack:
  #   webhook_url: https://hooks.slack.com/services/YOUR/WEBHOOK/URL
# Scraper settings
scraper:
  # Delay between requests in seconds (be respectful!)
  request_delay: 2
  # Timeout for requests in seconds
  timeout: 30
  # Number of retries on failure
  retries: 3