X-Git-Url: https://code.communitydata.science/cdsc_reddit.git/blobdiff_plain/2d1c8013f2a59cde10b5169ee61edea3a4f35aca..220a540beb70bf56c2fa4bb558153b303b2207ae:/checkpoint_parallelsql.sbatch
diff --git a/checkpoint_parallelsql.sbatch b/checkpoint_parallelsql.sbatch
index a54aab1..dd61e65 100644
--- a/checkpoint_parallelsql.sbatch
+++ b/checkpoint_parallelsql.sbatch
@@ -10,13 +10,15 @@
 ## Walltime (12 hours)
 #SBATCH --time=12:00:00
 ## Memory per node
-#SBATCH --mem=100G
+#SBATCH --mem=32G
 #SBATCH --cpus-per-task=4
 #SBATCH --ntasks=1
-
-
+#SBATCH -D /gscratch/comdata/users/nathante/cdsc-reddit
+source ./bin/activate
 module load parallel_sql
-
+echo $(which perl)
+conda list pyarrow
+which python3
 #Put here commands to load other modules (e.g. matlab etc.)
 #Below command means that parallel_sql will get tasks from the database
 #and run them on the node (in parallel). So a 16 core node will have