code.communitydata.science - cdsc_reddit.git/blob - ngrams/run_tf_jobs.sh
add code for pulling activity time series from parquet.
[cdsc_reddit.git] / ngrams / run_tf_jobs.sh
#!/usr/bin/env bash
# Regenerate the task list via tf_comments.py, reload it into the
# parallel_sql queue with psu, and submit the Slurm batch jobs.
#
# All paths are relative: run this from the directory that contains
# tf_comments.py, bin/activate and checkpoint_parallelsql.sbatch.
#
# Exit status: 0 when every step succeeded, 1 otherwise.
#
# NOTE: `set -u` is intentionally not enabled; sourced activate scripts and
# the `module` shell function may reference unset variables. Each step is
# guarded explicitly instead.

# Number of batch jobs to submit.
readonly NUM_JOBS=50
# Task list file that is fed to `psu --load`.
# Presumably written by `tf_comments.py gen_task_list` -- confirm.
readonly TASK_LIST=tf_task_list

# Print a message to stderr and abort with status 1.
die() {
  printf 'run_tf_jobs: %s\n' "$*" >&2
  exit 1
}

module load parallel_sql || die "could not load the parallel_sql module"
source ./bin/activate || die "could not activate ./bin/activate"

# Build the task list BEFORE touching the queue, so a failed generation never
# leaves the queue emptied or reloaded from a stale file.
python3 tf_comments.py gen_task_list || die "gen_task_list failed"
[[ -r "${TASK_LIST}" ]] || die "task list '${TASK_LIST}' is missing or unreadable"

# NOTE(review): --del --Y presumably clears the existing queue without
# prompting -- confirm against the parallel_sql documentation.
psu --del --Y || die "could not clear the existing task queue"
# psu --load reads the tasks from stdin.
psu --load < "${TASK_LIST}" || die "could not load '${TASK_LIST}' into the queue"

# Submit the jobs. A failed submission is reported but does not stop the
# remaining ones; the script's exit status reflects any failure.
failed=0
for _ in $(seq 1 "${NUM_JOBS}"); do
  sbatch checkpoint_parallelsql.sbatch || failed=$((failed + 1))
done

if ((failed > 0)); then
  die "${failed} of ${NUM_JOBS} sbatch submissions failed"
fi

Community Data Science Collective || Want to submit a patch?