Skip to content

Update GitHub Repo Languages Data #30

Update GitHub Repo Languages Data

Update GitHub Repo Languages Data #30

name: Update GitHub Repo Languages Data
on:
schedule:
- cron: '0 0 * * *' # Runs every day at midnight
workflow_dispatch: # Allows manual triggering
jobs:
fetch-and-save-data:
runs-on: ubuntu-latest
steps:
# Step 1: Checkout the repository
- name: Checkout Repository
uses: actions/checkout@v3
# Step 2: Set up Node.js
- name: Set up Node.js
uses: actions/setup-node@v3
with:
node-version: '16'
# Step 3: Fetch the repository data from GitHub API and extract languages
- name: Fetch Repo Languages Data
env:
STATS_API_TOKEN: ${{ secrets.STATS_API_TOKEN }}
run: |
echo "Fetching repository languages data..."
REPOS=$(curl -s -H "Authorization: token $STATS_API_TOKEN" https://api.github.com/user/repos?type=all&per_page=100)
# Log the fetched data for verification
echo "Fetched repository data for verification:"
echo "${REPOS}" | jq '.'
# This is where the fetched data stops and we start dealing with it.
# The fetching and logging are working well.
# Step 4: Write the JSON data (this is the step that requires improvements)
- name: Write JSON File
run: |
echo "Writing fetched data to JSON file..."
# Initialize an empty JSON array
echo "[]" > repo_data.json
# Iterate over each repository and fetch languages, then write to JSON
echo "${REPOS}" | jq -c '.[]' | while read -r row; do
REPO_NAME=$(echo "${row}" | jq -r '.name')
REPO_OWNER=$(echo "${row}" | jq -r '.owner.login')
LANGUAGES=$(curl -s -H "Authorization: token $STATS_API_TOKEN" "https://api.github.com/repos/${REPO_OWNER}/${REPO_NAME}/languages")
# Check if the languages request succeeded and if there are languages in the response
if [[ "${LANGUAGES}" == "{}" || -z "${LANGUAGES}" ]]; then
echo "No languages found or error fetching languages for ${REPO_NAME}. Skipping..."
continue
fi
# Only append languages to the JSON file
jq --arg repo "${REPO_NAME}" --argjson languages "${LANGUAGES}" \
'. += [{"repo": $repo, "languages": $languages}]' repo_data.json > tmp.json && mv tmp.json repo_data.json
done
# Output the content for verification
echo "Fetched languages saved to JSON file:"
cat repo_data.json
# Step 5: Remove the untracked JSON file if it exists
- name: Remove Untracked JSON File
run: |
if [ -f repo_data.json ]; then
echo "Removing existing repo_data.json to avoid conflicts when switching branches."
rm repo_data.json
fi
# Step 6: Checkout gh-pages branch
- name: Checkout gh-pages Branch
run: |
git fetch
git checkout gh-pages
# Step 7: Commit the JSON file to gh-pages branch
- name: Commit JSON File
run: |
git add repo_data.json
git config user.name "github-actions[bot]"
git config user.email "github-actions[bot]@users.noreply.github.com"
git commit -m "Update repository languages data [skip ci]" || echo "No changes to commit"
git push origin gh-pages