#!/bin/bash
## Slurm array job: parse reddit submission dumps.
##
## Provenance: datasets/run_submissions_jobs.sbatch from
## https://code.communitydata.science/cdsc_reddit.git/blobdiff_plain/811a0d87c4d394c2c7849a613f6aec2d81e49138..07b0dff9bc0dae2ab6f7fb7334007a5269a512ad:/datasets/run_submissions_jobs.sbatch
##
## Usage:
##   sbatch --array=<range> run_submissions_jobs.sbatch [OFFSET]
##
## Each array task runs exactly one line of ./submissions_task_list.sh
## (resolved relative to the --chdir directory below). The line number is
##   SLURM_ARRAY_TASK_ID + OFFSET
## where OFFSET is the optional first script argument (default 0).
##
#SBATCH --job-name="cdsc_reddit; parse submission dumps"
## Allocation Definition
#SBATCH --account=comdata-ckpt
#SBATCH --partition=ckpt
## Resources
## Nodes. This should always be 1 for parallel-sql.
#SBATCH --nodes=1
## Walltime (24 hours)
#SBATCH --time=24:00:00
## Memory per node
#SBATCH --mem=8G
#SBATCH --cpus-per-task=1
#SBATCH --ntasks=1
#SBATCH --chdir=/gscratch/comdata/users/nathante/cdsc_reddit/datasets
## stdout and stderr are deliberately written to the same per-task file.
#SBATCH --output=submissions_jobs/%A_%a.out
#SBATCH --error=submissions_jobs/%A_%a.out

set -euo pipefail

readonly TASK_LIST=./submissions_task_list.sh

# Print a message to stderr and abort the job with a failure status.
die() {
  printf '%s: %s\n' "${0##*/}" "$*" >&2
  exit 1
}

# Fail early with a clear message when not run as part of a job array.
: "${SLURM_ARRAY_TASK_ID:?must be set; submit with sbatch --array=<range>}"

# Optional offset into the task list; defaults to 0 so the script also works
# when no argument is given (the bare $1 used to break the arithmetic).
OFFSET=${1:-0}
[[ "${OFFSET}" =~ ^-?(0|[1-9][0-9]*)$ ]] \
  || die "OFFSET must be an integer, got '${OFFSET}'"

TASK_NUM=$(( SLURM_ARRAY_TASK_ID + OFFSET ))
# sed line addresses start at 1.
(( TASK_NUM >= 1 )) || die "computed task number ${TASK_NUM} is < 1"

[[ -r "${TASK_LIST}" ]] || die "cannot read task list ${TASK_LIST}"

TASK_CALL=$(sed -n "${TASK_NUM}p" "${TASK_LIST}")

# An index past the end of the list (or a blank line) has nothing to run.
# Keep the historical "exit 0" outcome, but leave a trace in the log.
if [[ -z "${TASK_CALL}" ]]; then
  printf '%s: no task on line %s of %s; nothing to do\n' \
    "${0##*/}" "${TASK_NUM}" "${TASK_LIST}" >&2
  exit 0
fi

# Intentionally unquoted: the task line is split on whitespace into a command
# and its arguments. Shell quoting inside the task line is NOT interpreted.
# shellcheck disable=SC2086
${TASK_CALL}