Skip to content

Fetch Data

Fetch Data #56

Workflow file for this run

name: Fetch Data
on:
schedule:
# at 01:15 on days 1-20 in first month of each quarter
- cron: '15 1 1-20 1,4,7,10 *'
workflow_dispatch:
jobs:
fetch:
runs-on: ubuntu-latest
env:
GCS_DEVELOPER_KEY: ${{ secrets.GCS_DEVELOPER_KEY }}
GCS_CX: ${{ secrets.GCS_CX }}
# CC Technology team members:
# See cc-quantifying-bot GitHub entry in Bitwarden for information on
# BOT_ secrets
steps:
- name: Checkout repository
uses: actions/checkout@v4
with:
token: ${{ secrets.BOT_TOKEN }}
- name: Configure git
run: |
git config user.name "${{ secrets.BOT_NAME }}"
git config user.email "${{ secrets.BOT_EMAIL }}"
- name: Set up Python
uses: actions/setup-python@v5
with:
python-version: '3.11'
- name: Install dependencies
run: |
pip install --upgrade pip
pip install pipenv
pipenv sync --system
- name: Set PYTHONPATH
run: echo "PYTHONPATH=./scripts" >> $GITHUB_ENV
- name: Run fetch script
run:
# ./scripts/1-fetch/deviantart_fetched.py
# ./scripts/1-fetch/flickr_fetched.py
# ./scripts/1-fetch/github_fetched.py
# ./scripts/1-fetch/internetarchive_fetched.py
# ./scripts/1-fetch/metmuseum_fetched.py
# ./scripts/1-fetch/vimeo_fetched.py
# ./scripts/1-fetch/wikicommons_fetched.py
# ./scripts/1-fetch/wikipedia_fetched.py
# ./scripts/1-fetch/youtube_fetched.py
./scripts/1-fetch/gcs_fetched.py