forked from philippinespire/pire_fq_gz_processing
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrunCLUMPIFY_r1r2_array.sbatch
executable file
·60 lines (45 loc) · 1.54 KB
/
runCLUMPIFY_r1r2_array.sbatch
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
#!/bin/bash
# Called by runCLUMPIFY_r1r2_array.bash, which starts an array job.
#
# Runs BBTools clumpify.sh on ONE r1/r2 fq.gz pair. The pair is chosen from the
# files matching ${INDIR}/${FQPATTERN}, using SLURM_ARRAY_TASK_ID as a 0-based
# index into that list.
#
# Variables read from the environment (presumably exported by the calling
# .bash script -- confirm against the caller):
#   INDIR                directory containing <sample>r1.fq.gz / <sample>r2.fq.gz
#   OUTDIR               output directory (created if missing)
#   TEMPDIR              forwarded to clumpify as tmpdir=
#   FQPATTERN            glob, relative to INDIR, that selects the r1 files
#   SLURM_ARRAY_TASK_ID  0-based index of the sample this task processes
#   SLURM_NODELIST       only echoed to the log
#
# Exit status: 1 on invalid input, otherwise the exit status of clumpify.sh,
# so that a failed clumpify run is not reported to SLURM as a success.

# Print an error message to stderr and abort the task.
die() {
  printf 'ERROR: %s\n' "$*" >&2
  exit 1
}

# load modules
# A failed module load is reported but not fatal, matching the original flow.
module load java/8u151 \
  || printf 'WARNING: "module load java/8u151" failed; continuing anyway\n' >&2

# Historical positional-argument interface, kept for reference:
#FQPATTERN=${4}
#TEMPDIR=${3}
#INDIR=${1}
#OUTDIR=${2}

# NOTE: THREADS and RAMPERTHREAD are not passed to clumpify below; they only
# show up in the environment dump at the end of the log.
THREADS=1 #clumpify uses a ton of ram, be conservative
# This setting must NOT be called GROUPS: bash reserves GROUPS as a special
# array (the caller's group ids) and silently ignores assignments to it.
CLUMPIFY_GROUPS=auto #controls how much ram is used, refer to manual
RAMPERTHREAD=233g #have had to set as high as 233g with groups=1, was originally 180g
CLUMPIFY_SH=/hb/software/apps/bbtools/gnu-39.01/clumpify.sh

# Raise the open-file limit for this task, then log all limits for the record.
ulimit -n 40960
ulimit -a

# ---- validate inputs before doing any work ---------------------------------
[[ -n "${INDIR:-}" ]] || die "INDIR is not set"
[[ -n "${OUTDIR:-}" ]] || die "OUTDIR is not set"
[[ -n "${FQPATTERN:-}" ]] || die "FQPATTERN is not set"
[[ "${SLURM_ARRAY_TASK_ID:-}" =~ ^[0-9]+$ ]] \
  || die "SLURM_ARRAY_TASK_ID must be a non-negative integer, got '${SLURM_ARRAY_TASK_ID:-}'"
[[ -n "${TEMPDIR:-}" ]] \
  || printf 'WARNING: TEMPDIR is empty; clumpify will receive an empty tmpdir=\n' >&2

mkdir -p -- "${OUTDIR}" || die "cannot create OUTDIR '${OUTDIR}'"
printf '%s\n' "${SLURM_NODELIST:-}"

# ---- build the sample list --------------------------------------------------
# Let the shell expand the pattern instead of parsing ls output. FQPATTERN is
# deliberately unquoted so that it is treated as a glob; INDIR is quoted so it
# is taken literally. nullglob turns "no match" into an empty array.
shopt -s nullglob
# shellcheck disable=SC2206
fq_files=( "${INDIR}"/${FQPATTERN} )
shopt -u nullglob
(( ${#fq_files[@]} > 0 )) || die "no files match ${INDIR}/${FQPATTERN}"

# Sample name = file name without its directory and without "r1.fq.gz".
all_samples=()
for fq_path in "${fq_files[@]}"; do
  fq_base=${fq_path##*/}
  all_samples+=( "${fq_base/r1.fq.gz/}" )
done

# Force base 10 so an id with leading zeros is not parsed as octal.
task_index=$(( 10#${SLURM_ARRAY_TASK_ID} ))
(( task_index < ${#all_samples[@]} )) \
  || die "SLURM_ARRAY_TASK_ID=${task_index} is out of range: ${#all_samples[@]} file(s) match ${INDIR}/${FQPATTERN}"
sample_name=${all_samples[task_index]}
printf '%s\n' "${sample_name}"

in_r1=${INDIR}/${sample_name}r1.fq.gz
in_r2=${INDIR}/${sample_name}r2.fq.gz
for fq_path in "${in_r1}" "${in_r2}"; do
  [[ -r "${fq_path}" ]] || die "input file missing or unreadable: ${fq_path}"
done

#systemctl status $PPID
#systemctl status $PPID | head -1 | awk '{print $2}' | xargs systemctl show -p TasksMax
#cat /proc/sys/kernel/threads-max

# ---- run clumpify -----------------------------------------------------------
# Option meanings are documented in the BBTools Clumpify guide. Note that the
# JVM heap is fixed at 480g here, independent of RAMPERTHREAD above.
"${CLUMPIFY_SH}" \
  in="${in_r1}" \
  in2="${in_r2}" \
  out="${OUTDIR}/${sample_name}clmp.r1.fq.gz" \
  out2="${OUTDIR}/${sample_name}clmp.r2.fq.gz" \
  groups="${CLUMPIFY_GROUPS}" \
  lowcomplexity=t \
  overwrite=t \
  usetmpdir=t \
  tmpdir="${TEMPDIR:-}" \
  deletetemp=t \
  dedupe=t \
  addcount=t \
  subs=2 \
  containment=t \
  consensus=f \
  -Xmx=480g
# Remember the result now; the logging below would otherwise overwrite $?.
clumpify_status=$?

#print some environment variables to stdout for records
printf '%s\n' '----------------------------------------------------------------------------------------'
printf '%s\n' 'PRINTING SUBSET OF ENVIRONMENT VARIABLES:'
# posix mode keeps `set` from listing function bodies; the subshell keeps that
# mode change from leaking into the rest of the script.
(set -o posix ; set | grep -v '^_' | grep -v '^EB' | grep -v '^BASH' | grep -v PATH | grep -v LS_COLORS)
printf '%s\n' '----------------------------------------------------------------------------------------'

if (( clumpify_status != 0 )); then
  printf 'ERROR: clumpify.sh exited with status %d for sample "%s"\n' \
    "${clumpify_status}" "${sample_name}" >&2
fi
exit "${clumpify_status}"