Dump Baserow tables and create ARCHE turtle files #5
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
name: Dump Baserow tables and create ARCHE turtle files | |
on: | |
workflow_dispatch: | |
inputs: | |
database_id: | |
type: number | |
description: '(Required) Database ID as number' | |
required: true | |
default: 0 | |
project_name: | |
type: string | |
description: '(Required) Project Name as string' | |
required: true | |
default: '' | |
resource_files_url: | |
type: string | |
description: '(Optional) Latest Release of Resource Files as URL' | |
required: false | |
default: '' | |
primary_data_directory: | |
type: string | |
description: '(Optional) Primary Data Directory Path as string' | |
required: false | |
default: '' | |
primary_file_format: | |
type: string | |
description: '(Optional) Primary File Format as string' | |
required: false | |
default: 'xml' | |
resource_files_url_2: | |
type: string | |
description: '(Optional) Latest Release of Additional Resource Files as URL' | |
required: false | |
default: '' | |
secondary_data_directory: | |
type: string | |
description: '(Optional) Secondary Data Directory Path as string' | |
required: false | |
default: '' | |
secondary_file_format: | |
type: string | |
description: '(Optional) Secondary File Format as string' | |
required: false | |
default: 'xml' | |
jobs: | |
update_baserow: | |
name: Uploading Arche Schema to Baserow | |
runs-on: ubuntu-latest | |
env: | |
PRIMARY_FILE_FORMAT: ${{ github.event.inputs.primary_file_format }} | |
LATEST_RELEASE: ${{ github.event.inputs.resource_files_url }} | |
PRIMARY_DATA_DIRECTORY: ${{ github.event.inputs.primary_data_directory }} | |
ADDITIONAL_FILE_FORMAT: ${{ github.event.inputs.secondary_file_format }} | |
ADDITIONAL_RESOURCES: ${{ github.event.inputs.resource_files_url_2 }} | |
ADDITIONAL_DATA_DIRECTORY: ${{ github.event.inputs.secondary_data_directory }} | |
PROJECT_NAME: ${{ github.event.inputs.project_name }} | |
BASEROW_TOKEN: ${{ secrets.BASEROW_TOKEN }} | |
BASEROW_DB_ID: ${{ github.event.inputs.database_id }} | |
BASEROW_USER: ${{ secrets.BASEROW_USER }} | |
BASEROW_PW: ${{ secrets.BASEROW_PW }} | |
steps: | |
- name: Check out source repository | |
uses: actions/checkout@v3 | |
- name: Set up Python environment | |
uses: actions/setup-python@v4 | |
with: | |
python-version: "3.10" | |
- name: Install dependencies | |
run: | | |
python -m pip install --upgrade pip | |
pip install -r requirements.txt | |
- name: Baserow Dump and TEI/XML Download | |
run: | | |
python scripts/baserow_dump.py | |
- name: Adding attributes to TEI root node | |
run: | | |
./shellscripts/add_attributes.sh | |
- name: Run ant to add xml-model schema | |
run: | | |
apt-get update && apt-get install openjdk-11-jre-headless ant -y --no-install-recommend | |
./shellscripts/dl_saxon.sh | |
ant | |
- name: Creating ARCHE constants ttl file | |
run: | | |
python scripts/arche_constants.py | |
- name: cache AV database | |
id: avdb | |
uses: actions/cache@v3 | |
with: | |
path: ~/.cvdupdate | |
key: constant | |
- name: refresh AV database | |
run: | | |
python3 -m pip install --user cvdupdate && cvd update | |
- name: Verify RDF Metadata with metadata-crawler | |
run: | | |
./shellscripts/filechecker.sh | |
- name: Verify RDF Metadata with metadata-crawler | |
run: | | |
composer require "acdh-oeaw/arche-metadata-crawler:^0.5.0" | |
./shellscripts/crawler.sh | |
- name: Commit data | |
uses: stefanzweifel/git-auto-commit-action@v4 | |
with: | |
commit_message: Downloaded/Updated Data |