-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathGATKselectVariants.wdl
76 lines (60 loc) · 1.51 KB
/
GATKselectVariants.wdl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
## GATK selectVariants
## script to filter variants using gatk
## useful for removing <NON_REF> alleles
##
## Inputs:
## - vcfgz: gzip-compressed (g)VCF file (.gz)
## - vcftbi: optional index file for the .gz file
## - referenceFasta: optional, only needed for some options
## - searchString: optional extra SelectVariants arguments, e.g. "--exclude-non-variants --remove-unused-alternates"
##
## Outputs:
## - vcf filtered file
## - vcf index file
version 1.0
# Single-call workflow: forwards its inputs unchanged to the SelectVariants
# task and re-exports the task's two output files under an "SR" suffix.
workflow runSelectVariants {
  input {
    File vcfgz
    File? vcftbi
    File? referenceFasta
    String? searchString
  }

  # Each workflow input is bound to the task input of the same name.
  call SelectVariants {
    input:
      searchString = searchString,
      referenceFasta = referenceFasta,
      vcftbi = vcftbi,
      vcfgz = vcfgz
  }

  output {
    # Filtered variants file produced by the task.
    File OutvcfgzSR = SelectVariants.Outvcfgz
    # Index file the task reports alongside the filtered variants file.
    File OutvcfgztbiSR = SelectVariants.Outvcfgztbi
  }
}
# Decompresses a gzipped gVCF and runs `gatk SelectVariants` on the
# decompressed copy, writing a compressed, filtered gVCF.
#
# Inputs:
#   vcfgz          - gzip-compressed input; a trailing ".gvcf.gz" is stripped
#                    from its file name to form the output prefix.
#   vcftbi         - kept for interface compatibility; the command below never
#                    references it because GATK is given the decompressed copy.
#   referenceFasta - optional; when defined it is passed to GATK as "-R <path>".
#   searchString   - optional; extra SelectVariants arguments inserted verbatim.
#
# Outputs:
#   Outvcfgz    - <prefix>.SVfilt.gvcf.gz
#   Outvcfgztbi - <prefix>.SVfilt.gvcf.gz.tbi
task SelectVariants {
  input {
    File vcfgz
    File? vcftbi
    File? referenceFasta
    String? searchString
  }

  String vcf_basename = basename(vcfgz, ".gvcf.gz")

  # Three copies of the variant data are on disk at once: the localized .gz
  # input, its decompressed copy, and the compressed output. The first term is
  # the previous estimate (so the request never shrinks); the second adds room
  # for the decompressed copy.
  # NOTE(review): the factor of 10 is an assumed upper bound on the gVCF
  # compression ratio - tune if real inputs compress better or worse.
  Int disk_space_gb = 2 * ceil(size(vcfgz, "GB") + size(referenceFasta, "GB") + 1) + ceil(10 * size(vcfgz, "GB"))

  # NOTE(review): GATK normally expects a .fai index and a .dict sequence
  # dictionary next to the reference; neither is an input of this task -
  # confirm how they reach the container when referenceFasta is supplied.
  #
  # In the command below, ~{searchString} is intentionally left unquoted: it
  # carries several whitespace-separated arguments that the shell must split.
  # The .tbi output is not created explicitly; this relies on GATK writing an
  # index next to the compressed output it produces.
  command <<<
    set -euo pipefail

    gunzip -c "~{vcfgz}" > "~{vcf_basename}.gvcf"

    gatk SelectVariants \
      -V "~{vcf_basename}.gvcf" \
      ~{"-R " + referenceFasta} \
      ~{searchString} \
      -O "~{vcf_basename}.SVfilt.gvcf.gz"
  >>>

  runtime {
    docker: "broadinstitute/gatk:4.2.4.0"
    memory: "12 GB"
    cpu: 1
    disks: "local-disk " + disk_space_gb + " HDD"
    preemptible: 3
  }

  output {
    File Outvcfgz = "~{vcf_basename}.SVfilt.gvcf.gz"
    File Outvcfgztbi = "~{vcf_basename}.SVfilt.gvcf.gz.tbi"
  }
}