-
Notifications
You must be signed in to change notification settings - Fork 29
/
Copy pathgffread.wdl
93 lines (84 loc) · 4.21 KB
/
gffread.wdl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
version 1.0
# Copyright (c) 2017 Leiden University Medical Center
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in
# all copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
task GffRead {
input {
File inputGff
File genomicSequence
Boolean outputGtfFormat = false
File? genomicIndex # Optional. GFFRead can create this by itself.
String? exonsFastaPath
String? CDSFastaPath
String? proteinFastaPath
String? filteredGffPath
String memory = "4GiB"
Int timeMinutes = 1 + ceil(size(inputGff, "GiB") * 10)
String dockerImage = "quay.io/biocontainers/gffread:0.9.12--0"
}
# The mkdirs below are hackish. It should be
# ~{"mkir -p $(dirname " + somePath + ")"} but this goes wrong.
# Cromwell will always use ')' even if somepath is not defined.
# Which leads to crashing.
command {
set -e
~{"mkdir -p $(dirname " + CDSFastaPath}~{true=")" false="" defined(CDSFastaPath)}
~{"mkdir -p $(dirname " + exonsFastaPath}~{true=")" false="" defined(exonsFastaPath)}
~{"mkdir -p $(dirname " + proteinFastaPath}~{true=")" false="" defined(proteinFastaPath)}
~{"mkdir -p $(dirname " + filteredGffPath}~{true=")" false="" defined(filteredGffPath)}
gffread \
~{inputGff} \
-g ~{genomicSequence} \
~{"-w " + exonsFastaPath} \
~{"-x " + CDSFastaPath} \
~{"-y " + proteinFastaPath} \
~{"-o " + filteredGffPath} \
~{true="-T " false="" outputGtfFormat}
}
output {
File? exonsFasta = exonsFastaPath
File? CDSFasta = CDSFastaPath
File? proteinFasta = proteinFastaPath
File? filteredGff = filteredGffPath
}
runtime {
memory: memory
time_minutes: timeMinutes
docker: dockerImage
}
parameter_meta {
# inputs
inputGff: {description: "The input GFF file.", category: "required"}
genomicSequence: {description: "The genome.", category: "required"}
outputGtfFormat: {description: "Equivalent to gffread's `-T` flag.", category: "advanced"}
genomicIndex: {description: "The genome's index.", category: "advanced"}
exonsFastaPath: {description: "The location the exons fasta should be written to.", category: "advanced"}
CDSFastaPath: {description: "The location the CDS fasta should be written to.", category: "advanced"}
proteinFastaPath: {description: "The location the protein fasta should be written to.", category: "advanced"}
filteredGffPath: {description: "The location the filtered GFF should be written to.", category: "advanced"}
memory: {description: "The amount of memory available to the job.", category: "advanced"}
timeMinutes: {description: "The maximum amount of time the job will run in minutes.", category: "advanced"}
dockerImage: {description: "The docker image used for this task. Changing this may result in errors which the developers may choose not to address.", category: "advanced"}
# outputs
exonsFasta: {description: "Fasta file containing exons."}
CDSFasta: {description: "Fasta file containing CDS's."}
proteinFasta: {description: "Fasta file containing proteins."}
filteredGff: {description: "Filtered GFF file."}
}
}