# Scrape: run "Scrape #7"
# Workflow file for this run

# Scrape workflow: downloads and transforms data with the project's Python
# modules, then commits the refreshed ./data directory back to the repository.
name: Scrape

on:
  # Allow manual runs from the Actions tab.
  workflow_dispatch:
  # Scheduled runs at minute 0 of hours 0 and 12 (GitHub evaluates cron in UTC).
  schedule:
    - cron: '0 0,12 * * *'

# The final step pushes a commit, so the job token needs write access.
permissions:
  contents: write

jobs:
  scrape:
    name: Scrape
    runs-on: ubuntu-latest
    steps:
      - id: checkout
        name: Checkout
        uses: actions/checkout@v4

      # Quote the version so it is never parsed as a float (e.g. 3.10 -> 3.1).
      - uses: actions/setup-python@v5
        with:
          python-version: '3.11'
          cache: 'pipenv'

      # Install from PyPI with the interpreter set up above rather than piping
      # an unpinned script from a remote branch into python.
      - name: Install pipenv
        run: python -m pip install --upgrade pipenv
        shell: bash

      # `pipenv sync` installs the versions recorded in Pipfile.lock.
      - id: install-python-dependencies
        name: Install Python dependencies
        run: pipenv sync
        shell: bash

      - name: Run scrape command
        run: pipenv run python -m src.download
        shell: bash

      - name: Run transform command
        run: pipenv run python -m src.transform
        shell: bash

      # Record when this run produced its data.
      - name: Datestamp
        run: date > data/timestamp.txt
        shell: bash

      - name: Commit results
        run: |
          git config --global user.name "github-actions[bot]"
          git config --global user.email "actions@github.com"
          # Merge (not rebase) when the remote moved during the run.
          git config pull.rebase false
          git status
          git pull origin "$GITHUB_REF"
          git add ./data
          # Nothing staged is the only benign reason to skip the commit; any
          # other commit or push failure should fail the job visibly.
          if git diff --cached --quiet; then
            echo "No changes to commit"
            exit 0
          fi
          git commit -m "Scrape" --author="palewire <palewire@users.noreply.github.com>"
          git push
        shell: bash