# etl-extract-lighthouse.yaml
# Scheduled workflow that extracts a recent sample of Lighthouse results into
# a CSV, stores it as a workflow artifact, and uploads it to archive.org.
name: 'Scheduled ETL: Extract Lighthouse sample'

on:
  schedule:
    # Every day at 00:30 (GitHub evaluates cron schedules in UTC).
    - cron: '30 0 * * *'
  # Also allow manual runs from the Actions tab.
  workflow_dispatch:

# Only one extract may run at a time; a newly started run cancels any run
# in the same group that is still in progress.
concurrency:
  group: extract-lighthouse
  cancel-in-progress: true

jobs:
  download-lighthouse:
    name: Download Lighthouse
    runs-on: ubuntu-latest
    steps:
      - id: checkout
        name: Checkout
        uses: actions/checkout@v4

      # Repository-local action; see ./.github/actions/install for details.
      - id: install
        name: Install
        uses: ./.github/actions/install

      # The key embeds the run id, so it is unique per run and an exact hit
      # never occurs; restore-keys falls back to the most recent cache whose
      # key starts with the prefix, and a fresh entry is saved after the job.
      - id: cache
        name: Update cache
        uses: actions/cache@v4
        with:
          path: ~/.cache
          key: extract-lighthouse-${{ github.run_id }}
          restore-keys: |
            extract-lighthouse

      # Folded scalar: the lines below are joined with spaces into a single
      # command line before being handed to bash.
      - id: download-lighthouse
        name: Download Lighthouse files
        run: >-
          pipenv run newshomepages-extract lighthouse
          --days=7
          --output-path=./lighthouse-sample.csv
        shell: bash

      # Fail the job if the extract did not produce the CSV.
      - id: save
        name: Save artifact
        uses: actions/upload-artifact@v4
        with:
          name: extracts
          path: ./lighthouse-sample.csv
          if-no-files-found: error

      # Credentials come from repository secrets.
      - id: upload-to-internet-archive
        name: Upload files to archive.org
        uses: palewire/internet-archive-upload@v1
        with:
          access-key: ${{ secrets.IA_ACCESS_KEY }}
          secret-key: ${{ secrets.IA_SECRET_KEY }}
          identifier: news-homepages-extracts
          files: lighthouse-sample.csv