Skip to content

Download and process #60

Download and process

Download and process #60

name: Download and process
on:
workflow_dispatch:
inputs:
colId:
description: 'Collection ID'
required: true
default: '162553'
jobs:
build_pages:
name: Download METS files from Transkribus and convert them to TEIs
runs-on: ubuntu-latest
env:
ANT_OPTS: -Xmx5g
TR_USER: ${{ secrets.TR_USER }}
TR_PW: ${{ secrets.TR_PW}}
COL_ID: ${{ github.event.inputs.colId }}
steps:
- name: Perform Checkout
uses: actions/checkout@v2
- name: Install Saxon and Ant
run: |
mkdir -p mets
mkdir -p tei
apt-get update && apt-get install openjdk-11-jre-headless ant -y --no-install-recommend
pip install acdh-transkribus-utils
wget https://sourceforge.net/projects/saxon/files/Saxon-HE/9.9/SaxonHE9-9-1-7J.zip/download && unzip download -d saxon && rm -rf download
git clone --depth=1 --branch skurzinz-patch-1 --single-branch https://github.com/skurzinz/page2tei.git
- name: Download METS Files
run: |
python ./scripts/fetch_mets.py
- name: Transform to TEI
run: |
ant -DCOL_ID=${COL_ID} -f ./build_tei.xml
- uses: stefanzweifel/git-auto-commit-action@v4
with:
commit_message: Exported and Transformed ColId ${{ github.event.inputs.colId }}