diff --git a/scripts/generateRvkConcordance.sh b/scripts/generateRvkConcordance.sh new file mode 100644 index 000000000..62848d5fa --- /dev/null +++ b/scripts/generateRvkConcordance.sh @@ -0,0 +1,22 @@ +#!/bin/bash +# Date: 2024-08 +# Description: gets the monthly generated aggregated data from culturegraph +# Is called from crontab every second Wednesday of the month. +# Takes 5.5h, single process on quaoar. +# Generated tsv: ~ 257 MB +# See https://github.com/hbz/lobid-resources/issues/1058. + +URL_ROOT="https://data.dnb.de/culturegraph/" +TARGET_FNAME="/data/other/cg/aggregate.marcxml.gz" + +FNAME=$(curl $URL_ROOT | grep '