code.communitydata.science - cdsc_reddit.git/blob - run_tf_jobs.sh
Add code for running tf-idf at the weekly level.
[cdsc_reddit.git] / run_tf_jobs.sh
#!/usr/bin/env bash
# Regenerate the tf task list, replace the contents of the psu task queue
# with it, and submit the worker batch jobs.
#
# Run from the directory that holds ./bin/activate, tf_comments.py and
# checkpoint_parallelsql.sbatch: every path used below is relative.
#
# Every step is checked explicitly so that a failure stops the run before
# the existing queue is deleted or before workers are submitted against a
# stale task list. `set -u` is deliberately not enabled: the sourced
# activate script and the `module` command live outside this file and may
# read unset variables.

readonly TASK_LIST=tf_task_list
readonly NUM_JOBS=50 # number of sbatch submissions

# Print an error message to stderr and abort the script.
die() {
  printf 'run_tf_jobs.sh: %s\n' "$*" >&2
  exit 1
}

module load parallel_sql || die "could not load the parallel_sql module"

# The activate script is not visible to the linter from here.
# shellcheck disable=SC1091
source ./bin/activate || die "could not source ./bin/activate"

python3 tf_comments.py gen_task_list || die "tf_comments.py gen_task_list failed"

# Presumably gen_task_list is what writes ${TASK_LIST} -- TODO confirm.
# Either way, refuse to wipe the queue when there is nothing to load.
[[ -s "${TASK_LIST}" ]] || die "${TASK_LIST} is missing or empty"

# Empty the queue first so it ends up holding only the freshly generated
# tasks. NOTE(review): --Y looks like a "skip confirmation" flag -- confirm.
psu --del --Y || die "psu --del failed"
psu --load <"${TASK_LIST}" || die "psu --load failed"

# Submit the workers. A single failed submission does not stop the rest
# (the original loop behaved the same way), but it is reported and turns
# the final exit status non-zero.
failed=0
for ((job = 1; job <= NUM_JOBS; job++)); do
  if ! sbatch checkpoint_parallelsql.sbatch; then
    printf 'run_tf_jobs.sh: sbatch submission %d of %d failed\n' \
      "${job}" "${NUM_JOBS}" >&2
    failed=$((failed + 1))
  fi
done

if ((failed > 0)); then
  die "${failed} of ${NUM_JOBS} sbatch submissions failed"
fi

Community Data Science Collective || Want to submit a patch?