-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathparams_default_kinetoplastid.config
82 lines (68 loc) · 2.45 KB
/
params_default_kinetoplastid.config
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
params {
    // Default parameter set for the kinetoplastid example run.
    // Paths written with ${baseDir} are interpolated by the config parser.

    // Input sequence file.
    inseq = "${baseDir}/example-data/L_donovani.1.fasta"

    // Reference data. Paths given here have to be absolute.
    ref_dir = "${baseDir}/example-data/references/kinetoplastida"
    ref_species = "LmjF_01"

    // Optional output directory.
    dist_dir = "${baseDir}/example-output"

    // Switches that turn individual parts of the pipeline on or off.
    // Note that transfer_tool is a string choice, not an on/off flag.
    run_exonerate = false
    do_contiguation = true
    run_braker = true
    do_circos = true
    do_pseudo = true
    make_embl = true
    use_reference = true
    fix_polycistrons = true
    truncate_input_headers = true
    transfer_tool = "liftoff"
    is_fungi = false
    use_existing = true
    is_softmasked = false
    mit_bypass = false

    // Produce EMBL files that are compatible with submission.
    embl_ena_submission = false

    // Naming patterns.
    // NOTE(review): `%w+` in CHR_PATTERN looks like Lua pattern syntax -- confirm
    // against the code that consumes it.
    GENOME_PREFIX = "LDON"
    CHR_PATTERN = "LDON_(%w+)"
    MAX_GENE_LENGTH = 20000
    MAX_OVERLAP = 5
    ABACAS_BIN_CHR = "LDON_0"
    alphanumeric_ids = false

    // ABACAS: minimum match length and similarity.
    ABACAS_MATCH_SIZE = 500
    ABACAS_MATCH_SIM = 85

    // RATT parameters.
    RATT_TRANSFER_TYPE = 'Species'

    // AUGUSTUS parameters.
    // NOTE(review): AUGUSTUS_HINTS_MAXINTRONLEN is a quoted string while the
    // score threshold is numeric -- confirm the consumer expects a string.
    AUGUSTUS_GENEMODEL = 'partial'
    AUGUSTUS_HINTS_MAXINTRONLEN = '1'
    AUGUSTUS_SCORE_THRESHOLD = 0.8

    // Weight description file.
    // A Lua script that must implement a function
    // `get_weight(gene, regionmapping)` returning the number used as the
    // weight when finding an optimal chain of genes in overlapping clusters.
    // This default is kinetoplastid-specific; switch to
    // 'weight_multiexon_generic.lua' for a less biased setting.
    WEIGHT_FILE = "${baseDir}/data/weight/weight_kinetoplastid.lua"

    // Covariance models for Infernal.
    NCRNA_MODELS = "${baseDir}/data/cm/kinetoplastid_rnas.cm"

    // Template for spec check output.
    SPECK_TEMPLATE = "html"

    // Optional transcript (e.g. RNA-seq) evidence file used for hints
    // generation: a GTF as produced by cufflinks/cuffmerge/...
    // Left commented out here; uncomment and set a path to use it.
    //TRANSCRIPT_FILE = ""

    // Metadata written to EMBL files.
    // NOTE(review): most values below look like placeholders -- replace them
    // before producing files for real use.
    EMBL_AUTHORS = "Foo Bar"
    EMBL_TITLE = "Baz"
    EMBL_PUBLICATION = "Quux"
    EMBL_GENOME_TYPE = "XXX"
    EMBL_CLASSIFICATION = "XXXX"
    EMBL_ORGANISM = "Leishmania donovani"
    EMBL_PROJ_ACCESSION = "123456"
    EMBL_DESCRIPTION = "Foo bar"

    // Metadata for GAF output.
    TAXON_ID = 5661
    DB_ID = "Companion"
}