Skip to content

Scrape

Scrape #81

Workflow file for this run

name: Scrape
on:
push:
branches:
- 'main'
paths:
- 'scraper/**/*'
- '.github/workflows/scrape.yml'
schedule:
- cron: '0 12 * * 0'
workflow_dispatch:
jobs:
ualberta:
runs-on: ubuntu-latest
steps:
- uses: actions/checkout@v3
- name: Use Node.js 18.x
uses: actions/setup-node@v3
with:
node-version: 18.x
cache: 'npm'
- name: Install npm dependencies
run: npm ci
- name: Rename old data
run: mv data/ualberta.ca.json data/ualberta.ca.old.json || true
- name: Scrape data
run: npm run scrape
- name: Run diff
run: |
./node_modules/.bin/json-diff data/ualberta.ca.old.json data/ualberta.ca.json > data/ualberta.ca.json.patch || true
cat data/ualberta.ca.json.patch
- name: Update data
run: |
git config --global user.name 'Steven Tang'
git config --global user.email '[email protected]'
git add data
git diff-index --quiet HEAD || git commit -m "Update UAlberta data"
git push
- uses: actions/upload-artifact@v3
with:
name: log
path: |
log.txt
data/ualberta.ca.json.patch