X-Git-Url: https://code.communitydata.science/covid19.git/blobdiff_plain/18118328ccb35d65a30d826129ef6f58c954fc9c..9e0c92242eca7c433fc244a8e121bd8338c911f0:/transliterations/analysis/related_searches_example.R diff --git a/transliterations/analysis/related_searches_example.R b/transliterations/analysis/related_searches_example.R index 19ddfc7..e1197b6 100644 --- a/transliterations/analysis/related_searches_example.R +++ b/transliterations/analysis/related_searches_example.R @@ -3,23 +3,31 @@ ### ### Minimal example analysis file using trending search data -### Identify data source directory and file -DataDir <- ("../data/output/") -DataFile <- ("related_searches_top.csv") - ### Import and cleanup data -related.searches.top <- read.table(paste(DataDir,DataFile, - sep=""), + +DataURL <- + url("https://github.com/CommunityDataScienceCollective/COVID-19_Digital_Observatory/blob/master/transliterations/data/output/related_searches_top.csv") + +related.searches.top <- read.table(DataURL, sep=",", header=TRUE, stringsAsFactors=FALSE) +### Alternatively, uncomment and run if working locally with full git tree +### Identify data source directory and file +## DataDir <- ("../data/output/") +## DataFile <- ("related_searches_top.csv") + +## related.searches.top <- read.table(paste(DataDir,DataFile, sep=""), +## sep=",", header=TRUE, +## stringsAsFactors=FALSE) + ### Aggregate top 5 search queries by term/day top5.per.term.date <- aggregate(query ~ term + date, data=related.searches.top, head, 5) ## Might cleanup a bit for further analysis or visualization... -top5.per.term.date$date <- asDate(top5.per.term.date$date) +top5.per.term.date$date <- as.Date(top5.per.term.date$date) ### Export write.table(top5.per.term.date,