This repository has been archived by the owner on May 28, 2024. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 0
/
bl2seq.yaml
330 lines (330 loc) · 14.7 KB
/
bl2seq.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
!mobyle/program
name: bl2seq
title: BL2SEQ
description: Comparison between two sequences with Blast (NCBI)
inputs: !mobyle/inputparagraph
children:
- !mobyle/inputprogramparameter
prompt: Blast initiation
format: '"bl2seq"'
argpos: 1
name: blast_init
command: true
hidden: true
type: !mobyle/stringtype {}
- !mobyle/inputprogramparameter
comment: '- Blastp compares amino acid query sequences- Blastn compares nucleotide
query sequences- tBlastx compares translated a nucleotide sequence and
an amino acid sequence- tBlastn compares an amino acid sequence translated
and a nucleotide sequence- tBlastx compares translated nucleotide sequences'
prompt: Blast program (-p)
format: '" -p " + str(value)'
simple: true
argpos: 2
mandatory: true
name: bl2seq
command: false
type: !mobyle/stringtype
default: 'null'
options:
- {label: Choose a program, value: 'null'}
- {label: Blastp (protein/protein), value: blastp}
- {label: Blastn (nucleotide/nucleotide), value: blastn}
- {label: Blastx (translated nucleotide/ protein), value: blastx}
- {label: tBlastn (protein/translated nucleotide), value: tblastn}
- {label: tBlastx (translated nucleotide/translated nucleotide), value: tblastx}
- !mobyle/inputprogramparameter
prompt: First sequence (-i)
format: '" -i " + str( value )'
simple: true
argpos: 3
mandatory: true
name: first_sequence
command: false
type: !mobyle/formattedtype
format_terms: ['EDAM_format:2200']
data_terms: ['EDAM_data:2044']
- !mobyle/inputprogramparameter
comment: Location on query sequence
prompt: Start of required region in first query sequence (-I)
name: first_start_region
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparameter
prompt: End of required region in first sequence (-I)
format: ( ' -I "%s "' % (str(first_start_region)), ' -I "%s %s"' % (str(first_start_region),
str(value)))[value is not None]
argpos: 3
name: first_end_region
precond:
first_start_region: {'#ne': None}
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparameter
prompt: Second sequence (-j)
format: '" -j " + str(value)'
simple: true
argpos: 4
mandatory: true
name: second_sequence
command: false
type: !mobyle/formattedtype
format_terms: ['EDAM_format:2200']
data_terms: ['EDAM_data:2044']
- !mobyle/inputprogramparameter
prompt: Start of required region in second sequence (-J)
argpos: 4
name: second_start_region
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparameter
prompt: End of required region in second sequence (-J)
format: ( ' -J "%s "' % (str(second_start_region)), ' -J "%s %s"' % (str(second_start_region),
str(value)))[value is not None]
argpos: 4
name: second_end_region
precond:
second_start_region: {'#ne': None}
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparagraph
prompt: Scoring options
name: scoring_opt
argpos: 5
children:
- !mobyle/inputprogramparameter
comment: 'Default: 5 for blastn; 10 for blastp, blastx and 11 for tblastn'
prompt: Cost to open a gap (-G)
format: ("" , " -G "+str(value) )[value is not None]
name: open_a_gap
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparameter
comment: 'Default: 2 for blastn; 1 for blastp, blastx and tblastnLimited
values for gap existence and extension are supported for these programs.Existence
-- Extension:BLOSUM909 -- 2, 8 -- 2, 7 -- 2, 6 -- 211 -- 1, 10 --
1, 9 -- 1BLOSUM8025 -- 2, 13 -- 2, 9 -- 2, 8 -- 2, 7 -- 2, 6 -- 211
-- 1, 10 -- 1, 9 -- 1BLOSUM6211 -- 2, 10 -- 2, 9 -- 2, 8 -- 2, 7 --
2, 6 -- 213 -- 1, 12 -- 1, 11 -- 1, 10 -- 1, 9 -- 1BLOSUM4513 -- 3,
12 -- 3, 11 -- 3, 10 -- 316 -- 2, 15 -- 2, 14 -- 2, 13 -- 2, 12 --
219 -- 1, 18 -- 1, 17 -- 1, 16 -- 1PAM307 -- 2, 6 -- 2, 5 -- 210 --
1, 9 -- 1, 8 -- 1PAM708 -- 2, 7 -- 2, 6 -- 211 -- 1, 10 -- 1, 9 --
1'
prompt: Cost to extend a gap (-E)
format: ("" , " -E "+str(value) )[value is not None]
name: extend_a_gap
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparagraph
prompt: Protein penalty (not for blastn)
name: scoring_blast
precond:
bl2seq: {'#ne': blastn}
children:
- !mobyle/inputprogramparameter
prompt: Similarity matrix (-M)
format: ("" , " -M "+str(value) )[value is not None and value != vdef]
name: matrix
command: false
type: !mobyle/stringtype
default: BLOSUM62
options:
- {label: BLOSUM90, value: BLOSUM90}
- {label: BLOSUM80, value: BLOSUM80}
- {label: BLOSUM62, value: BLOSUM62}
- {label: BLOSUM50, value: BLOSUM50}
- {label: BLOSUM45, value: BLOSUM45}
- {label: PAM30, value: PAM30}
- {label: PAM70, value: PAM70}
- {label: PAM250, value: PAM250}
- !mobyle/inputprogramparagraph
prompt: Blastn penalty
name: scoring_blastn
precond: {bl2seq: blastn}
children:
- !mobyle/inputprogramparameter
prompt: Penalty for a nucleotide mismatch (-q)
format: ("" , " -q "+str(value) )[value is not None and value != vdef]
name: mismatch
command: false
type: !mobyle/integertype {default: -3}
- !mobyle/inputprogramparameter
prompt: Reward for a nucleotide match (-r)
format: ("" , " -r "+str(value) )[value is not None and value != vdef]
name: match
command: false
type: !mobyle/integertype {default: 1}
- !mobyle/inputprogramparagraph
comment: "Mask off segments of the query sequence that have low compositional\
\ complexity, as determined by the SEG program of Wootton & Federhen (Computers\
\ and Chemistry, 1993) or, for BLASTN, by the DUST program of Tatusov\
\ and Lipman (in preparation). Filtering can eliminate statistically significant\
\ but biologically uninteresting reports from the blast output (e.g.,\
\ hits against common acidic-, basic- or proline-rich regions), leaving\
\ the more biologically interesting regions of the query\n sequence\
\ available for specific matching against database sequences.Filtering\
\ is only applied to the query sequence (or its translation products),\
\ not to database sequences. Default filtering is DUST for BLASTN, SEG\
\ for other programs. It is not unusual for nothing at all to be masked\
\ by SEG, when applied to sequences in SWISS-PROT, so filtering should\
\ not be expected to always yield an effect. Furthermore, in some cases,\
\ sequences are masked in their entirety, indicating that the statistical\
\ significance of any matches reported against the unfiltered\n \
\ query sequence should be suspect."
prompt: Filtering and masking options
name: filter_opt
argpos: 6
children:
- !mobyle/inputprogramparameter
prompt: Filter or Masking query sequence (DUST with blastn, SEG with others)
(-F)
format: (" -F F" , "")[ value ]
name: filter
command: false
type: !mobyle/booleantype {default: false}
- !mobyle/inputprogramparameter
comment: A coiled-coiled filter, based on the work of Lupas et al. (Science,
vol 252, pp. 1162-4 (1991)) written by John Kuzio (Wilson et al.,
J Gen Virol, vol. 76, pp. 2923-32 (1995))
prompt: Filtering options (Filter must be true)
name: other_filters
precond:
'#and':
- filter
- other_masking: {'#eq': None}
command: false
type: !mobyle/stringtype {default: 'null'}
- !mobyle/inputprogramparameter
comment: 'A coiled-coiled filter, based on the work of Lupas et al. (Science,
vol 252, pp. 1162-4 (1991)) written by John Kuzio (Wilson et al.,
J Gen Virol, vol. 76, pp. 2923-32 (1995)).It is possible to specify
that the masking should only be done during the process of building
the initial words .If the -U option (to mask any lower-case sequence
in the input FASTA file) is used and one does not wish any other filtering,
but does wish to mask when building the lookup tables then one should
specify: -F ''m'''
prompt: Masking options (Filter must be true)
name: other_masking
precond:
'#and':
- {filter: '1'}
- other_filters: {'#eq': None}
command: false
type: !mobyle/stringtype {default: 'null'}
- !mobyle/inputprogramparameter
comment: This option specifies that any lower-case letters in the input
FASTA file should be masked.
prompt: Use lower case filtering (-U)
format: ("", " -U T")[value]
name: lower_case
command: false
type: !mobyle/booleantype {default: false}
- !mobyle/inputprogramparagraph
prompt: Selectivity options
name: selectivity_opt
argpos: 7
children:
- !mobyle/inputprogramparameter
comment: "The statistical significance threshold for reporting matches\
\ against database sequences; the default value is 10, such that 10\
\ matches are expected to be found merely by chance, according to\
\ the stochastic model of Karlin and Altschul (1990). If the statistical\
\ significance ascribed to a match is greater than the EXPECT threshold,\
\ the match will not be reported. Lower EXPECT thresholds are more\
\ stringent, leading to fewer chance matches being reported. Fractional\
\ values are\n acceptable."
prompt: Expected value (-e)
format: ("" , " -e "+str(value) )[value is not None and value != vdef]
simple: true
name: Expect
command: false
type: !mobyle/floattype {default: 10.0}
- !mobyle/inputprogramparameter
comment: Use words of size N.Zero invokes default behaviorDefault values:-
11 for blastn- 3 for others
prompt: Word Size (-W)
format: ("" , " -W "+str(value) )[value is not None]
name: word_size
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparameter
comment: This is the value that control the path graph region explored
by Blast during a gapped extension (Xg in the NAR paper) (default
for blastp is 15).Default values:- 30 for blastn- 0 for tblastx- 15
for others
prompt: X dropoff value for gapped alignment (-X)
format: ("" , " -X "+str(value))[value is not None]
name: dropoff_extent
command: false
type: !mobyle/floattype {}
- !mobyle/inputprogramparameter
comment: Use zero for the real size
prompt: Effective length of the search space (-Y)
format: ("" , " -Y "+str(value) )[value is not None]
name: eff_len
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparameter
prompt: Perform or not gapped alignment (not available with tblastx) (-g)
format: (" -g F " , "")[value]
name: gapped_alig
precond:
bl2seq: {'#ne': tblastx}
command: false
type: !mobyle/booleantype {default: false}
- !mobyle/inputprogramparagraph
prompt: Translation options
name: translation_opt
precond:
bl2seq:
'#in': [blastx, tblastx, tblastn]
argpos: 8
children:
- !mobyle/inputprogramparameter
prompt: Query strand to search against second sequence (for blastx, tblastx
or tblastn) (-S)
format: ( "" , " -S " + str(value) )[ value is not None and value!= vdef]
simple: true
mandatory: true
name: strand
command: false
type: !mobyle/stringtype
default: '3'
options:
- {label: Top (1), value: '1'}
- {label: Bottom (2), value: '2'}
- {label: Both (3), value: '3'}
- !mobyle/inputprogramparagraph
prompt: Output options
name: output_opt
argpos: 10
children:
- !mobyle/inputprogramparameter
prompt: Output format (-D)
format: ( "" , " -D " + str( value ) )[ value is not None and value !=
vdef]
name: outformat
command: false
type: !mobyle/stringtype
default: '0'
options:
- {label: Traditional (0), value: '0'}
- {label: Tabulated (1), value: '1'}
outputs: !mobyle/outputparagraph
children:
- !mobyle/outputprogramparameter
prompt: Standard output
filenames: '"bl2seq.out"'
name: stdout
output_type: stdout
type: !mobyle/formattedtype
data_terms: ['EDAM_data:2048']
- !mobyle/outputprogramparameter
prompt: Standard error
filenames: '"bl2seq.err"'
name: stderr
type: !mobyle/formattedtype
data_terms: ['EDAM_data:2048']
operations: ['EDAM_operation:0493']
topics: ['EDAM_topic:0182']
env: {}