X-Git-Url: https://code.communitydata.science/cdsc_reddit.git/blobdiff_plain/2740f55915d6ecca7c5cd800747d9687c4cd9245..cd43a94865a0889dc0be91aef4d9179848e273e4:/checkpoint_parallelsql.sbatch

diff --git a/checkpoint_parallelsql.sbatch b/checkpoint_parallelsql.sbatch
index 1975802..dd61e65 100644
--- a/checkpoint_parallelsql.sbatch
+++ b/checkpoint_parallelsql.sbatch
@@ -13,8 +13,12 @@
 #SBATCH --mem=32G
 #SBATCH --cpus-per-task=4
 #SBATCH --ntasks=1
+#SBATCH -D /gscratch/comdata/users/nathante/cdsc-reddit
+source ./bin/activate
 module load parallel_sql
-
+echo $(which perl)
+conda list pyarrow
+which python3
 #Put here commands to load other modules (e.g. matlab etc.)
 #Below command means that parallel_sql will get tasks from the database
 #and run them on the node (in parallel). So a 16 core node will have