X-Git-Url: https://code.communitydata.science/cdsc_reddit.git/blobdiff_plain/2d1c8013f2a59cde10b5169ee61edea3a4f35aca..refs/heads/synced/master:/checkpoint_parallelsql.sbatch?ds=inline

diff --git a/checkpoint_parallelsql.sbatch b/checkpoint_parallelsql.sbatch
index a54aab1..dd61e65 100644
--- a/checkpoint_parallelsql.sbatch
+++ b/checkpoint_parallelsql.sbatch
@@ -10,13 +10,15 @@
 ## Walltime (12 hours)
 #SBATCH --time=12:00:00
 ## Memory per node
-#SBATCH --mem=100G
+#SBATCH --mem=32G
 #SBATCH --cpus-per-task=4
 #SBATCH --ntasks=1
-
-
+#SBATCH -D /gscratch/comdata/users/nathante/cdsc-reddit
+source ./bin/activate
 module load parallel_sql
-
+echo $(which perl)
+conda list pyarrow
+which python3
 #Put here commands to load other modules (e.g. matlab etc.)
 #Below command means that parallel_sql will get tasks from the database
 #and run them on the node (in parallel). So a 16 core node will have