-
Notifications
You must be signed in to change notification settings - Fork 7
/
Copy pathbqsr_recal.sh
executable file
·60 lines (50 loc) · 2.12 KB
/
bqsr_recal.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
#!/bin/bash
##########################################################################
#
# Platform: NCI Gadi HPC
# Usage: this script is run by bqsr_recal_run_parallel.pbs
# Version: 2.0
#
# For more details see: https://github.com/Sydney-Informatics-Hub/Fastq-to-BAM
#
# If you use this script towards a publication, please acknowledge the
# Sydney Informatics Hub (or co-authorship, where appropriate).
#
# Suggested acknowledgement:
# The authors acknowledge the support provided by the Sydney Informatics Hub,
# a Core Research Facility of the University of Sydney. This research/project
# was undertaken with the assistance of resources and services from the National
# Computational Infrastructure (NCI), which is supported by the Australian
# Government, and the Australian BioCommons which is enabled by NCRIS via
# Bioplatforms Australia funding.
#
##########################################################################
labSampleID=`echo $1 | cut -d ',' -f 1`
intNum=`echo $1 | cut -d ',' -f 2`
interval=`echo $1 | cut -d ',' -f 3`
echo $labSampleID $intNum $interval
bam=../Dedup_sort/${labSampleID}.coordSorted.dedup.bam
log=./Logs/BQSR_recal/${labSampleID}.${intNum}.log
err=./Logs/BQSR_recal_error_capture/${labSampleID}.${intNum}.err
out=../BQSR_tables/${labSampleID}.${intNum}.recal_data.table
ref=
thousandG_indels=../Reference/Known_vars/Homo_sapiens_assembly38.known_indels.vcf #hash out or replace depending on your data
gold_standard_indels=../Reference/Known_vars/Mills_and_1000G_gold_standard.indels.hg38.vcf #hash out or replace depending on your data
dbsnp=../Reference/Known_vars/Homo_sapiens_assembly38.dbsnp138.vcf #replace depending on your data
gatk BaseRecalibrator \
--java-options "-Xmx20g -DGATK_STACKTRACE_ON_USER_EXCEPTION=true" \
-R $ref \
-L $interval \
-I $bam \
--known-sites $dbsnp \
--known-sites $thousandG_indels \
--known-sites $gold_standard_indels \
-O $out >> $log 2>&1
if grep -q -i error $log
then
printf "Error in GATK log ${log}\n" >> $err
fi
if grep -q Exception $log
then
printf "Exception in GATK log ${log}\n" >> $err
fi