-
Notifications
You must be signed in to change notification settings - Fork 7
/
Copy pathbwa_postalignment.sh
executable file
·53 lines (46 loc) · 2.82 KB
/
bwa_postalignment.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
#!/bin/bash
dataDIR=$1 #ARGV, contains folder with FASTQ files, right now needs full path
scriptDIR=$(pwd)
inputDIR=$dataDIR/trimmomatic/bwa
outputDIR=$dataDIR/trimmomatic/bwa
#find $dataDIR -name *R1_001.trim.fastq.gz > $dataDIR/filelist.txt
rm $dataDIR/samfilelist.txt
ls -1 $inputDIR/*.sam > $dataDIR/samfilelist.txt
FILENUMBER=$(wc -l $dataDIR/samfilelist.txt | cut -d' ' -f1)
#echo $FILENUMBER
rm $dataDIR/postBWA.qsub
echo \#!/bin/bash >> $dataDIR/postBWA.qsub
echo \#PBS -l nodes=1:ppn=16 >> $dataDIR/postBWA.qsub
echo \#PBS -l walltime=12:00:00 >> $dataDIR/postBWA.qsub
echo \#PBS -N bwa >> $dataDIR/postBWA.qsub
echo \#PBS -t 1-$FILENUMBER >> $dataDIR/postBWA.qsub
echo module load python >> $dataDIR/postBWA.qsub
echo module load R >> $dataDIR/postBWA.qsub
echo module load perl/5.16.3 >> $dataDIR/postBWA.qsub
echo module load samtools/1.2 >> $dataDIR/postBWA.qsub
echo module load bedtools >> $dataDIR/postBWA.qsub
echo FILESAM=\$\(head -n \$PBS_ARRAYID $dataDIR/samfilelist.txt \| tail -1\) >> $dataDIR/postBWA.qsub
echo FILESORTED=\$\(basename "\${FILESAM}" \| sed \'s/\.sam/_sorted\.sam/g\'\) >> $dataDIR/postBWA.qsub
echo java -Xms1g -Xmx4g -jar /opt/compsci/picard/1.95/SortSam.jar INPUT=\$FILESAM OUTPUT=$outputDIR/\$FILESORTED SO=coordinate >> $dataDIR/postBWA.qsub
echo FILERMDUP=\$\(basename \"\${FILESORTED}\" \| sed \'s/\.sam/_rmdup\.sam/g\'\) >> $dataDIR/postBWA.qsub
echo FILEMETRICS=\$\(basename \"\${FILESORTED}\" \| sed \'s/\.sam/_rmdup_metrics\.txt/g\'\) >>$dataDIR/postBWA.qsub
echo java -Xms1g -Xmx4g -jar /opt/compsci/picard/1.95/MarkDuplicates.jar INPUT=$outputDIR/\$FILESORTED OUTPUT=$outputDIR/\$FILERMDUP METRICS_FILE=$outputDIR/\$FILEMETRICS REMOVE_DUPLICATES=true >> $dataDIR/postBWA.qsub
echo FILEINSERT=\$\(basename \"\${FILERMDUP}\" \| sed \'s/\.sam/_insertSize\.txt/g\'\) >> $dataDIR/postBWA.qsub
echo FILEHISTO=\$\(basename \"\${FILERMDUP}\" \| sed \'s/\.sam/_insertSize\.pdf/g\'\) >> $dataDIR/postBWA.qsub
echo java -Xms1g -Xmx4g -jar /opt/compsci/picard/1.95/CollectInsertSizeMetrics.jar METRIC_ACCUMULATION_LEVEL=ALL_READS OUTPUT=$outputDIR/\$FILEINSERT HISTOGRAM_FILE=$outputDIR/\$FILEHISTO INPUT=$outputDIR/\$FILERMDUP >> $dataDIR/postBWA.qsub
echo FILENAME=\$\(basename \"\${FILERMDUP}\" \| sed \'s/\.sam/_shifted/g\'\) >> $dataDIR/postBWA.qsub
echo perl $scriptDIR/auyar/ATAC_BAM_shifter_gappedAlign.pl $outputDIR/\$FILERMDUP $outputDIR/\$FILENAME >> $dataDIR/postBWA.qsub
##
##
#
#for f in $(find "$outputDIR" -name '*shifted.bam')
#do#
# echo "process\n";
# fileName=$(basename "${f}" | sed 's/\.bam/_sorted.bam/g')
# fileName1=$(basename "${f}" | sed 's/\.bam/_sorted/g')
# fileName2=$(basename "${f}" | sed 's/\.bam/_sorted.bed/g')
# echo "\n Sorting and Indexing file: $f... \n"
# samtools sort $f $outputDIR$fileName1
# samtools index $outputDIR$fileName
# bedtools bamtobed -i $outputDIR$fileName > $outputDIR$fileName2
#done