This repository has been archived by the owner on May 28, 2024. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathblast2mydb.yaml
551 lines (551 loc) · 24 KB
/
blast2mydb.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
!mobyle/program
name: blast2mydb
title: BLAST2MYDB
description: NCBI BLAST, with gaps against my sequences database
inputs: !mobyle/inputparagraph
children:
- !mobyle/inputprogramparagraph
prompt: Create my Database
name: db
children:
- !mobyle/inputprogramparameter
format: '"formatdb "'
argpos: 1
name: formatdb
command: false
hidden: true
type: !mobyle/stringtype {}
- !mobyle/inputprogramparameter
comment: Create a protein database for blastx
prompt: Protein db
format: '" -i "+ str(value)'
simple: true
argpos: 2
mandatory: true
name: protein_db
precond:
blast2:
'#in': [blastx, blastp]
command: false
type: !mobyle/formattedtype
format_terms: ['EDAM_format:2200']
data_terms: ['EDAM_data:2044']
- !mobyle/inputprogramparameter
comment: Create a nucleotid database for blastn, tblastn or tblastx
prompt: Nucleotid db
format: '"-p F -i "+ str(value)'
simple: true
argpos: 2
mandatory: true
name: nucleotid_db
precond:
blast2:
'#in': [blastn, tblastx, tblastn, psitblastn]
command: false
type: !mobyle/formattedtype
format_terms: ['EDAM_format:2200']
data_terms: ['EDAM_data:2044']
- !mobyle/inputprogramparameter
prompt: the name of my db
format: '" -n " + str( value )'
simple: true
argpos: 3
mandatory: true
name: db_name
command: false
type: !mobyle/stringtype {default: myDatabase}
- !mobyle/inputprogramparameter
prompt: Blast initiation
format: '" && blastall "'
argpos: 4
name: blast_init
command: true
hidden: true
type: !mobyle/stringtype {}
- !mobyle/inputprogramparameter
comment: '- Blastp compares an amino acid query sequence against a protein
sequence database;- Blastn compares a nucleotide query sequence against
a nucleotide sequence database;- Blastx compares the six-frame conceptual
translation products of a nucleotide query sequence (both strands) against
a protein sequence database;- tBlastn compares a protein query sequence
against a nucleotide sequence database dynamically translated in all six
reading frames (both strands).- tBlastx compares the six-frame translations
of a nucleotide query sequence against the six-frame translations of a
nucleotide sequence database.- psitBlastn compares a protein query sequence
against a nucleotide sequence database dynamically translated in all six
reading frames (both strands) using a position specific matrix created
by PSI-BLAST.'
prompt: Blast program (-p)
format: '" -p "+ str(value)'
simple: true
argpos: 5
mandatory: true
name: blast2
command: false
type: !mobyle/stringtype
default: 'null'
options:
- {label: Choose a program, value: 'null'}
- {label: Blastn (nucleotide query / nucleotide db), value: blastn}
- {label: Blastx (translated nucleotide query / protein db), value: blastx}
- {label: tBlastx (translated nucleotide query / translated nucleotide
db), value: tblastx}
- {label: Blastp (protein query / protein db), value: blastp}
- {label: tBlastn (protein query / translated nucleotide db), value: tblastn}
- {label: psitBlastn (protein query / translated nucleotide db), value: psitblastn}
- !mobyle/inputprogramparameter
format: '" -d "+ str( db_name )'
argpos: 6
name: blastdb
command: false
hidden: true
type: !mobyle/stringtype {}
- !mobyle/inputprogramparagraph
prompt: Query Sequence
name: query
argpos: 10
children:
- !mobyle/inputprogramparameter
comment: Read (first, query) sequence or set from file
prompt: Query (-i)
format: '" -i "+ str(query_seq)'
simple: true
mandatory: true
name: query_seq
command: false
type: !mobyle/formattedtype
format_terms: ['EDAM_format:2200']
data_terms: ['EDAM_data:2044']
- !mobyle/inputprogramparameter
comment: Location on query sequence
prompt: Start of required region in query sequence (-L)
name: start_region
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparameter
comment: Location on query sequence
prompt: End of required region in query sequence (-L)
format: (' -L "%s"' % (str(start_region)), ' -L "%s %s"' % (str(start_region),
str(value)))[value is not None]
name: end_region
precond:
start_region: {'#ne': None}
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparameter
prompt: Number of concatenated queries (blastn or tblastn) (-B)
format: ("" , " -B "+str(value))[value is not None]
name: concat
precond:
blast2:
'#in': [blastn, tblastn]
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparagraph
prompt: Scoring options
name: scoring_opt
argpos: 5
children:
- !mobyle/inputprogramparameter
comment: 'Default: 5 for blastn; 10 for blastp, blastx and tblastn'
prompt: Cost to open a gap (-G)
format: ("" , " -G "+str(value))[value is not None]
name: open_a_gap
command: false
type: !mobyle/floattype {}
- !mobyle/inputprogramparameter
comment: 'Default: 2 for blastn; 1 for blastp, blastx and tblastnLimited
values for gap existence and extension are supported for these programs.
Some supported and suggested values are:Existence Extension10 -- 110
-- 211 -- 18 -- 29 -- 2'
prompt: Cost to extend a gap (-E)
format: ("" , " -E "+str(value))[value is not None]
name: extend_a_gap
command: false
type: !mobyle/floattype {}
- !mobyle/inputprogramparagraph
prompt: Protein penalty (not for blastn)
name: scoring_blast
precond:
blast2: {'#ne': blastn}
children:
- !mobyle/inputprogramparameter
prompt: Similarity matrix (-M)
format: ("" , " -M "+str(value))[value is not None and value != vdef]
name: matrix
command: false
type: !mobyle/stringtype
default: BLOSUM62
options:
- {label: BLOSUM62, value: BLOSUM62}
- {label: BLOSUM45, value: BLOSUM45}
- {label: BLOSUM80, value: BLOSUM80}
- {label: PAM30, value: PAM30}
- {label: PAM70, value: PAM70}
- !mobyle/inputprogramparagraph
prompt: Blastn penalty
name: scoring_blastn
precond: {blast2: blastn}
children:
- !mobyle/inputprogramparameter
prompt: Penalty for a nucleotide mismatch (-q)
format: ("" , " -q "+str(value))[value is not None and value != vdef]
name: mismatch
command: false
type: !mobyle/floattype {default: -3.0}
- !mobyle/inputprogramparameter
prompt: Reward for a nucleotide match (-r)
format: ("" , " -r "+str(value))[value is not None and value != vdef]
name: match
command: false
type: !mobyle/floattype {default: 1.0}
- !mobyle/inputprogramparameter
prompt: Frame shift penalty (-w)
format: ("", " -w "+str(value))[value is not None]
name: frameshift
command: false
type: !mobyle/floattype {}
- !mobyle/inputprogramparagraph
comment: BLAST 2.0 uses the dust low-complexity filter for blastn and seg
for the other programs.If one uses '-F T' then normal filtering by seg
or dust (for blastn) occurs (likewise '-F F' means no filtering whatsoever).
prompt: Filtering and masking options
name: filter_opt
argpos: 20
children:
- !mobyle/inputprogramparameter
prompt: Filter or Masking query sequence (DUST with blastn, SEG with others)
(-F)
format: (" -F F" , "")[ value ]
name: filter
command: false
type: !mobyle/booleantype {default: false}
- !mobyle/inputprogramparameter
comment: A coiled-coiled filter, based on the work of Lupas et al. (Science,
vol 252, pp. 1162-4 (1991)) written by John Kuzio (Wilson et al.,
J Gen Virol, vol. 76, pp. 2923-32 (1995))
prompt: Filtering options (Filter must be true)
name: other_filters
precond:
'#and':
- filter
- {'#not': other_masking}
command: false
type: !mobyle/stringtype {default: 'null'}
- !mobyle/inputprogramparameter
comment: 'A coiled-coiled filter, based on the work of Lupas et al. (Science,
vol 252, pp. 1162-4 (1991)) written by John Kuzio (Wilson et al.,
J Gen Virol, vol. 76, pp. 2923-32 (1995)).It is possible to specify
that the masking should only be done during the process of building
the initial words .If the -U option (to mask any lower-case sequence
in the input FASTA file) is used and one does not wish any other filtering,
but does wish to mask when building the lookup tables then one should
specify: -F ''m'''
prompt: Masking options (Filter must be true)
name: other_masking
precond:
'#and':
- filter
- {'#not': other_filters}
command: false
type: !mobyle/stringtype {default: 'null'}
- !mobyle/inputprogramparameter
comment: This option specifies that any lower-case letters in the input
FASTA file should be masked.
prompt: Use lower case filtering (-U)
format: ("", " -U T")[ bool(value) ]
name: lower_case
command: false
type: !mobyle/booleantype {default: false}
- !mobyle/inputprogramparagraph
comment: The programs blastn and blastp offer fully gapped alignments. blastx
and tblastn have 'in-frame' gapped alignments and use sum statistics to
link alignments from different frames. tblastx provides only ungapped
alignments.
prompt: Selectivity options
name: selectivity_opt
argpos: 7
children:
- !mobyle/inputprogramparameter
comment: "The statistical significance threshold for reporting matches\
\ against database sequences; the default value is 10, such that 10\
\ matches are expected to be found merely by chance, according to\
\ the stochastic model of Karlin and Altschul (1990). If the statistical\
\ significance ascribed to a match is greater than the EXPECT threshold,\
\ the match will not be reported. Lower EXPECT thresholds are more\
\ stringent, leading to fewer chance matches being reported. Fractional\
\ values are\n acceptable."
prompt: Expected value (-e)
format: ("" , " -e "+str(value))[value is not None and value != vdef]
simple: true
name: Expect
command: false
type: !mobyle/floattype {default: 10.0}
- !mobyle/inputprogramparameter
comment: Use words of size N.Zero invokes default behaviorDefault values:-
11 for blastn- 3 for others
prompt: Word Size (-W)
format: ("" , " -W "+str(value))[value is not None]
name: word_size
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparameter
comment: 'Default: zero for all programs'
prompt: Multiple Hits window size (-A)
format: ("" , " -A "+str(value))[value is not None]
name: dist_hits
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparameter
comment: Blast seeks first short word pairs whose aligned score reaches
at least this value.Default values:- 0 for blastn- 11 for blastp-
12 for blastx- 13 for tblastn and tblastx
prompt: Threshold for extending hits (-f)
format: ("" , " -f "+str(value))[value is not None]
name: extend_hit
command: false
type: !mobyle/floattype {}
- !mobyle/inputprogramparameter
comment: This is the value that control the path graph region explored
by Blast during a gapped extension (Xg in the NAR paper) (default
for blastp is 15).Default values:- 30 for blastn- 0 for tblastx- 15
for others
prompt: X dropoff value for gapped alignment (-X)
format: ("" , " -X "+str(value))[value is not None]
name: dropoff_extent
command: false
type: !mobyle/floattype {}
- !mobyle/inputprogramparameter
comment: Default values:- 50 for blastn- 0 for tblastx- 25 for others
prompt: X dropoff value for final alignment gapped alignment (-Z)
format: ("" , " -Z "+str(value))[value is not None]
name: dropoff_final
command: false
type: !mobyle/floattype {}
- !mobyle/inputprogramparameter
comment: Use zero for the real size
prompt: Effective length of the search space (-Y)
format: ("" , " -Y "+str(value))[value is not None]
name: eff_len
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparameter
comment: If this option is used, a value of 100 is recommended.
prompt: Number of best hits from a region to keep (-K)
format: ("" , " -K "+str(value))[value is not None]
name: keep_hits
command: false
type: !mobyle/integertype {}
- !mobyle/inputprogramparameter
prompt: Perform or not gapped alignment (not available with tblastx) (-g)
format: (" -g F " , "")[value]
name: gapped_alig
precond:
blast2: {'#ne': tblastx}
command: false
type: !mobyle/booleantype {default: false}
- !mobyle/inputprogramparameter
prompt: Single-hit or multiple-hit mode (-P)
format: ("" , " -P "+str(value))[value != "0"]
name: mode
precond:
blast2: {'#ne': blastn}
command: false
type: !mobyle/stringtype
default: '0'
options:
- {label: Multiple-hit (0), value: '0'}
- {label: Single-hit (1), value: '1'}
- !mobyle/inputprogramparagraph
prompt: Translation options
name: translation_opt
argpos: 30
children:
- !mobyle/inputprogramparameter
prompt: Genetic code used for query translation (-Q)
format: ("" , " -Q "+str(value))[value is not None and value != vdef]
name: gc_query
precond:
blast2:
'#in': [blastx, tblastx]
command: false
type: !mobyle/stringtype
default: '1'
options:
- {label: Standard (1), value: '1'}
- {label: Vertebrate Mitochondrial (2), value: '2'}
- {label: Yeast Mitochondrial (3), value: '3'}
- {label: 'Mold, Protozoan, Coelenterate Mitochondrial and Mycoplasma/Spiroplasma
(4)', value: '4'}
- {label: Invertebrate Mitochondrial (5), value: '5'}
- {label: Ciliate Macronuclear and Dasycladacean (6), value: '6'}
- {label: Echinoderm Mitochondrial (9), value: '9'}
- {label: Euplotid Nuclear (10), value: '10'}
- {label: Bacterial (11), value: '11'}
- {label: Alternative Yeast Nuclear (12), value: '12'}
- {label: Ascidian Mitochondrial (13), value: '13'}
- {label: Flatworm Mitochondrial (14), value: '14'}
- {label: Blepharisma Macronuclear (15), value: '15'}
- !mobyle/inputprogramparameter
prompt: Genetic code used for database translation (-D)
format: ("" , " -D "+str(value))[value != vdef]
name: gc_db
precond:
blast2:
'#in': [tblastn, tblastx]
command: false
type: !mobyle/stringtype
default: '1'
options:
- {label: Standard (1), value: '1'}
- {label: Vertebrate Mitochondrial (2), value: '2'}
- {label: Yeast Mitochondrial (3), value: '3'}
- {label: 'Mold, Protozoan, Coelenterate Mitochondrial and Mycoplasma/Spiroplasma
(4)', value: '4'}
- {label: Invertebrate Mitochondrial (5), value: '5'}
- {label: Ciliate Macronuclear and Dasycladacean (6), value: '6'}
- {label: Echinoderm Mitochondrial (9), value: '9'}
- {label: Euplotid Nuclear (10), value: '10'}
- {label: Bacterial (11), value: '11'}
- {label: Alternative Yeast Nuclear (12), value: '12'}
- {label: Ascidian Mitochondrial (13), value: '13'}
- {label: Flatworm Mitochondrial (14), value: '14'}
- {label: Blepharisma Macronuclear (15), value: '15'}
- !mobyle/inputprogramparameter
prompt: Query strands to search against database (-S)
format: ("" , " -S "+str(value))[value is not None and value != vdef]
name: strand
precond:
blast2:
'#in': [blastn, blastx, tblastx]
command: false
type: !mobyle/stringtype
default: '3'
options:
- {label: Top (1), value: '1'}
- {label: Bottom (2), value: '2'}
- {label: Both (3), value: '3'}
- !mobyle/inputprogramparagraph
prompt: Report options
name: affichage
argpos: 40
children:
- !mobyle/inputprogramparameter
comment: Maximum number of database sequences for which one-line descriptions
will be reported.
prompt: Number of one-line descriptions to show (-v)
format: ("" , " -v "+str(value))[value is not None and value != vdef]
name: Descriptions
command: false
type: !mobyle/integertype {default: 500}
- !mobyle/inputprogramparameter
comment: Maximum number of database sequences for which high-scoring segment
pairs will be reported (-b).
prompt: Number of database sequences to show alignments (-b)
format: ("" , " -b "+str(value))[value is not None and value != vdef]
name: Alignments
command: false
type: !mobyle/integertype {default: 250}
- !mobyle/inputprogramparameter
prompt: Alignment view options (-m)
format: ("" , " -m "+str(value))[value is not None and value != vdef]
name: view_alignments
command: false
type: !mobyle/stringtype
default: '0'
options:
- {label: Pairwise (0), value: '0'}
- {label: Query-anchored showing identities (1), value: '1'}
- {label: Query-anchored no identities (2), value: '2'}
- {label: 'Flat query-anchored, show identities (3)', value: '3'}
- {label: 'Flat query-anchored, no identities (5)', value: '4'}
- {label: Query-anchored no identities and blunt ends (5), value: '5'}
- {label: 'Flat query-anchored, no identities and blunt ends (6)',
value: '6'}
- {label: XML Blast output (7), value: '7'}
- {label: Tabular output (8), value: '8'}
- !mobyle/inputprogramparameter
prompt: Text output file
format: '" -o blast2.txt"'
argpos: 50
name: txtoutput
precond:
view_alignments: {'#ne': '7'}
command: false
hidden: true
type: !mobyle/stringtype {}
- !mobyle/inputprogramparameter
prompt: Xml output file
format: '" -o blast2.xml"'
argpos: 60
name: xmloutput
precond: {view_alignments: '7'}
command: false
hidden: true
type: !mobyle/stringtype {}
- !mobyle/inputprogramparameter
prompt: Html output
format: ("" , " && html4blast -g -o blast2.html blast2.txt")[value]
argpos: 61
name: htmloutput
precond:
view_alignments:
'#nin': ['7', '8']
command: false
type: !mobyle/booleantype {default: false}
outputs: !mobyle/outputparagraph
children:
- !mobyle/outputprogramparameter
prompt: Blast text report
filenames: '"blast2.txt"'
name: txtfile
precond:
view_alignments: {'#ne': '7'}
type: !mobyle/formattedtype
data_terms: ['EDAM_data:0857']
- !mobyle/outputprogramparameter
prompt: Blast xml report
filenames: '"blast2.xml"'
name: xmlfile
precond: {view_alignments: '7'}
type: !mobyle/formattedtype
data_terms: ['EDAM_data:2048']
- !mobyle/outputprogramparameter
prompt: Blast html report
filenames: '"blast2.html"'
name: htmlfile
precond:
view_alignments:
'#nin': ['7', '8']
type: !mobyle/formattedtype
data_terms: ['EDAM_data:2048']
- !mobyle/outputprogramparameter
filenames: '"*.gif"'
name: imgfile
precond:
view_alignments:
'#nin': ['7', '8']
hidden: true
- !mobyle/outputprogramparameter
prompt: Standard output
filenames: '"blast2mydb.out"'
name: stdout
output_type: stdout
type: !mobyle/formattedtype
data_terms: ['EDAM_data:2048']
- !mobyle/outputprogramparameter
prompt: Standard error
filenames: '"blast2mydb.err"'
name: stderr
type: !mobyle/formattedtype
data_terms: ['EDAM_data:2048']
operations: ['EDAM_operation:0352', 'EDAM_operation:0227']
topics: ['EDAM_topic:0182', 'EDAM_topic:0220']
references:
- {doi: null, label: 'Altschul, Stephen F., Thomas L. Madden, Alejandro A. Schaeffer,Jinghui
Zhang, Zheng Zhang, Webb Miller, and David J. Lipman (1997), Gapped BLAST
and PSI-BLAST: a new generation of protein database search programs, Nucleic
Acids Res. 25:3389-3402.', url: null}
documentation_links: ['http://www.ncbi.nlm.nih.gov/books/bv.fcgi?rid=handbook.chapter.ch16',
'http://www.ncbi.nlm.nih.gov/Education/BLASTinfo/tut1.html']
env: {}