Add code for running tf-idf at the weekly level.

[cdsc_reddit.git] / checkpoint_parallelsql.sbatch
diff --git a/checkpoint_parallelsql.sbatch b/checkpoint_parallelsql.sbatch

index 1975802daa4b26745d5e917fe6acde46a9303de6..dd61e65c3a0d90e9791e55bdbd5b6df9b623b3f8 100644 (file)
--- a/checkpoint_parallelsql.sbatch
+++ b/checkpoint_parallelsql.sbatch
@@ -13,8 +13,12 @@
  #SBATCH --mem=32G
  #SBATCH --cpus-per-task=4
  #SBATCH --ntasks=1
+#SBATCH -D /gscratch/comdata/users/nathante/cdsc-reddit
+source ./bin/activate
  module load parallel_sql
-
+echo $(which perl)
+conda list pyarrow
+which python3
  #Put here commands to load other modules (e.g. matlab etc.)
  #Below command means that parallel_sql will get tasks from the database
  #and run them on the node (in parallel). So a 16 core node will have