code.communitydata.science - covid19.git/blob - transliterations/src/compile_transliterated_phrases.sh
Loading data directly from github URL. Commenting out commands that assume cloned...
[covid19.git] / transliterations / src / compile_transliterated_phrases.sh
#!/bin/bash
#
# Runs the transliteration pipeline end to end:
#   1. collect_trends.py             - "Reading Google trends"
#   2. wikidata_search.py            - search Wikidata using base_terms.txt
#   3. wikidata_search.py            - search Wikidata using the Google trends CSVs
#   4. wikidata_transliterations.py  - find transliterations via SPARQL and write
#                                      a date-stamped entity-labels CSV
#
# Usage: ./compile_transliterated_phrases.sh
#
# For now these scripts don't accept command line arguments. It's an MVP

# Stop at the first failing command, unset variable, or failed pipeline stage.
# Step 4 reads the CSVs that steps 2 and 3 write, so continuing after a failure
# would silently process stale or missing files.
set -euo pipefail

# Every path below is relative to the directory holding this script, so switch
# there first; this lets the script be launched from any working directory.
cd -- "$(dirname -- "${BASH_SOURCE[0]}")"

readonly INPUT_DIR=../data/input
readonly OUTPUT_DIR=../data/output

# Compute the date stamp once so the output filename cannot change mid-run.
run_date=$(date '+%Y-%m-%d')
readonly run_date

echo "Reading Google trends"
# NOTE(review): presumably this writes the related_searches_*.csv files read
# in step 3 -- confirm against collect_trends.py.
python3 collect_trends.py

echo "Searching for Wikidata entities using base_terms.txt"
python3 wikidata_search.py "${INPUT_DIR}/base_terms.txt" \
  --output "${OUTPUT_DIR}/wikidata_search_results.csv"

echo "Searching for Wikidata entities using Google trends"
python3 wikidata_search.py \
  "${OUTPUT_DIR}/related_searches_rising.csv" \
  "${OUTPUT_DIR}/related_searches_top.csv" \
  --use-gtrends \
  --output "${OUTPUT_DIR}/wikidata_search_results_from_gtrends.csv"

echo "Finding transliterations from Wikidata using sparql"
# NOTE(review): --topN takes two values here; presumably one per input file,
# in the same order -- confirm against wikidata_transliterations.py.
python3 wikidata_transliterations.py \
  "${OUTPUT_DIR}/wikidata_search_results_from_gtrends.csv" \
  "${OUTPUT_DIR}/wikidata_search_results.csv" \
  --topN 10 20 \
  --output "${OUTPUT_DIR}/${run_date}_wikidata_entity_labels.csv"

Community Data Science Collective || Want to submit a patch?