X-Git-Url: https://code.communitydata.science/covid19.git/blobdiff_plain/34f8b9a23ee8dba8300d610c3aa88e86f7c5347b..ff96d52cb92966dd0c487e6452aeab70773cf3e6:/cron-wikipedia_revisions.sh
diff --git a/cron-wikipedia_revisions.sh b/cron-wikipedia_revisions.sh
new file mode 100644
index 0000000..a53bc3f
--- /dev/null
+++ b/cron-wikipedia_revisions.sh
@@ -0,0 +1,28 @@
+#!/bin/bash -x
+#
+# Cron job: run wikiproject_scraper.py and fetch_enwiki_revisions.py, capture
+# their stderr in date-stamped logs, then move the revisions log and the
+# date-stamped data files under /var/www/covid19/wikipedia.
+
+# TZ must be exported: a plain assignment is not passed on to child processes,
+# so the external date command below would not see it (unless TZ was already
+# in the environment) and the date stamp would follow the host's local zone.
+export TZ="UTC"
+date_string=$(date +%Y%m%d)
+
+# Scraper stderr is piped through tee into a dated log; tee also echoes it on stdout.
+./wikipedia/scripts/wikiproject_scraper.py 2> >(tee "wikipedia/logs/enwp-wikiproject_scraper-${date_string}.log")
+
+# Same stderr capture for the revision fetcher, then publish its log.
+revs_log="enwp-revisions-${date_string}.log"
+./wikipedia/scripts/fetch_enwiki_revisions.py 2> >(tee "wikipedia/logs/${revs_log}")
+mv "wikipedia/logs/${revs_log}" /var/www/covid19/wikipedia/logs/
+
+# NOTE(review): the dated .tsv/.json files are presumably written by fetch_enwiki_revisions.py - confirm its naming.
+revs_tsv="digobs_covid19-wikipedia-enwiki_revisions-${date_string}.tsv"
+mv "wikipedia/data/${revs_tsv}" /var/www/covid19/wikipedia
+
+# Compress the JSON first: xz replaces the input file with <name>.xz, which is what gets published.
+revs_json="digobs_covid19-wikipedia-enwiki_revisions-${date_string}.json"
+xz "wikipedia/data/${revs_json}"
+mv "wikipedia/data/${revs_json}.xz" /var/www/covid19/wikipedia