Skip to content

.github/workflows/gtn-news.yml #2767

.github/workflows/gtn-news.yml

.github/workflows/gtn-news.yml #2767

Workflow file for this run

---
# Pull news from the Galaxy Training Network's RSS feed and add them as
# Galaxy Hub posts.
name: Galaxy Training Network news
env:
base: master
branch: gtn-news
github_api_version: "2022-11-28"
on:
workflow_dispatch:
schedule:
- cron: 0 * * * *
jobs:
collect:
name: Collect news from the Galaxy Training Network
runs-on: ubuntu-latest
steps:
- name: Install feedparser.
run: pip install feedparser~=6.0
- name: Parse GTN RSS feed.
id: parse
shell: python -u {0}
run: |
import json
import os
from datetime import datetime, timedelta, timezone
import feedparser
feedparser.sanitizer._HTMLSanitizer.acceptable_elements.remove("a")
feedparser.sanitizer._HTMLSanitizer.acceptable_elements.remove("img")
feed = feedparser.parse("https://training.galaxyproject.org/training-material/feed.xml")
posts = {}
oldest = datetime.now().astimezone()
for entry in feed.entries:
feed_title = f"[GTN news] {entry['title']}"
feed_link = entry["link"]
feed_blurb = entry["summary"]
feed_published = entry["published"].split("T")[0]
feed_name = feed_link.split("/")[-1].replace(".html", "")
feed_author = entry["author"]
posts[f"{feed_published}-{feed_name}"] = {
"title": feed_title,
"link": feed_link,
"blurb": feed_blurb,
"published": feed_published,
"name": feed_name,
"author": feed_author,
}
feed_published_dt = datetime.fromisoformat(entry["published"])
oldest = feed_published_dt if feed_published_dt < oldest else oldest
oldest = (oldest - timedelta(days=1)).astimezone(timezone.utc).date()
# reverse ordering (sort by ascending date)
posts = {
post: posts[post]
for post in tuple(posts)[::-1]
}
with open(os.environ["GITHUB_OUTPUT"], 'w') as file:
print("posts=%s" % json.dumps(posts), file=file)
print(
"matrix=%s" % f"{json.dumps({'name': list(posts)})}",
file=file
)
# Not strictly necessary but produces a workflow with less jobs.
- name: Filter out already published posts.
id: filter
env:
GH_TOKEN: ${{ github.token }}
run: |
readarray -t all_posts <<< $(jq -r 'keys_unsorted | .[]' <<< '${{ steps.parse.outputs.posts }}')
posts=()
set +e
for post in "${all_posts[@]}"; do
# check in the base branch
gh api \
-H "Accept: application/vnd.github+json" \
-H "X-GitHub-Api-Version: ${{ env.github_api_version }}" \
/repos/${{ github.repository }}/contents/content/news/"$post"/index.md?ref=${{ env.base }}
test $? -ne 0 || continue
# check in the target branch
gh api \
-H "Accept: application/vnd.github+json" \
-H "X-GitHub-Api-Version: ${{ env.github_api_version }}" \
/repos/${{ github.repository }}/contents/content/news/"$post"/index.md?ref=${{ env.branch }}
test $? -ne 0 || continue
posts+=("$post")
done
set -e
json=$(printf '%s\n' "${posts[@]}" | jq -R . | jq -s --compact-output .)
matrix=$(jq -n --compact-output --argjson v "$json" '{"name": $v}')
echo matrix="$matrix" >> $GITHUB_OUTPUT
outputs:
posts: ${{ steps.parse.outputs.posts }}
matrix: ${{ steps.filter.outputs.matrix }}
commit:
name: Create commits
runs-on: ubuntu-latest
needs: collect
if: ${{ needs.collect.outputs.matrix != '{"name":[""]}' }}
strategy:
max-parallel: 1
fail-fast: false
matrix: ${{fromJson(needs.collect.outputs.matrix)}}
steps:
- name: Create the Galaxy Hub post.
shell: python -u {0}
run: |
import json
import textwrap
post = json.loads("""
${{ needs.collect.outputs.posts }}
""")["${{ matrix.name }}"]
post = textwrap.dedent(f"""
---
subsites: [all]
main_subsite: global
date: "{post['published']}"
tags: [training, gtn-news]
title: "{post['title']}"
authors: "{post['author']}"
external_url: '{post["link"]}'
---
{post["blurb"]}
""")[1:]
with open("index.md", "w") as file:
file.write(post)
- name: Create the PR branch.
env:
GH_TOKEN: ${{ github.token }}
run: |
# Check if the PR branch exists.
set +e
gh api \
-H "Accept: application/vnd.github+json" \
-H "X-GitHub-Api-Version: ${{ env.github_api_version }}" \
/repos/${{ github.repository }}/git/ref/heads/${{ env.branch }}
test $? -ne 0 || exit 0
set -e
# Get commit sha of the tip of the base branch.
sha=$(\
gh api \
-H "Accept: application/vnd.github+json" \
-H "X-GitHub-Api-Version: ${{ env.github_api_version }}" \
/repos/${{ github.repository }}/git/ref/heads/${{ env.base }} \
| jq -r '.object.sha' \
)
# Create the PR branch.
gh api \
--method POST \
-H "Accept: application/vnd.github.v3+json" \
-H "X-GitHub-Api-Version: ${{ env.github_api_version }}" \
/repos/${{ github.repository }}/git/refs \
-f ref='refs/heads/${{ env.branch }}' \
-f sha=$sha
- name: Commit the Galaxy Hub post.
run: |
base64=$(base64 --wrap=0 < index.md)
commit='{
"message": "Post ${{ matrix.name }} from GTN",
"author": {
"name": "GitHub",
"email": "[email protected]"
},
"branch": "${{ env.branch }}",
"content": "'$base64'"
}'
echo $commit > data.json
curl -L \
-X PUT \
-H "Accept: application/vnd.github+json" \
-H "Authorization: Bearer ${{ github.token }}" \
-H "X-GitHub-Api-Version: ${{ env.github_api_version }}" \
https://api.github.com/repos/${{ github.repository }}/contents/content/news/${{ matrix.name }}/index.md \
-d @data.json
pull_request:
name: Create pull request
runs-on: ubuntu-latest
needs: commit
if: always()
steps:
- name: Create a pull request.
env:
GH_TOKEN: ${{ github.token }}
run: |
# Check if an open pull request already exists.
exists=$(gh pr list \
--repo ${{ github.repository }} \
--head ${{ env.branch }} \
--state open \
--limit 1 \
--json number \
| jq '.[].number' | wc -l)
test $exists -ne 1 || exit 0
set +e
gh pr create \
--repo ${{ github.repository }} \
--base "${{ env.base }}" \
--head "${{ env.branch }}" \
--title "Publish latest news from the Galaxy Training Network" \
--body "Publish the latest news from the Galaxy Training Network."
true