root/galaxy-central/tools/sr_mapping/lastz_wrapper.xml

リビジョン 2, 33.4 KB (コミッタ: hatakeyama, 14 年 前)

import galaxy-central

行番号 
1<tool id="lastz_wrapper_2" name="Lastz" version="1.1.1">
2    <description> map short reads against reference sequence</description>
3    <command interpreter="python">lastz_wrapper.py
4#if $seq_name.how_to_name=="yes":
5--ref_name=$seq_name.ref_name
6#else:
7--ref_name="None"
8#end if
9--ref_source=$source.ref_source --source_select=$params.source_select --out_format=$out_format --input2=$input2
10#if $source.ref_source=="history":
11--input1=$source.input1
12--ref_sequences=$input1.metadata.sequences
13#else:
14--input1=$source.input1_2bit
15--ref_sequences="None"
16#end if
17#if $params.source_select=="pre_set":
18--pre_set_options=${params.pre_set_options} --strand="None" --seed="None" --gfextend="None" --chain="None" --transition="None" --O="None" --E="None" --X="None" --Y="None" --K="None" --L="None" --entropy="None"
19#else:
20--pre_set_options="None" --strand=$params.strand --seed=$params.seed --gfextend=$params.gfextend --chain=$params.chain --transition="$params.transition" --O=$params.O --E=$params.E --X=$params.X --Y=$params.Y --K=$params.K --L=$params.L --entropy=$params.entropy
21#end if
22--identity_min=$min_ident --identity_max=$max_ident --coverage=$min_cvrg --output=$output1 --unmask=$unmask --lastzSeqsFileDir=${GALAXY_DATA_INDEX_DIR}
23    </command>
24    <inputs>
25        <param name="input2" format="fasta" type="data" label="Align sequencing reads in" />
26        <conditional name="source">
27            <param name="ref_source" type="select" label="Against reference sequences that are">
28                <option value="cached">locally cached</option>
29                <option value="history">in your history</option>
30            </param>
31            <when value="cached">
32                <param name="input1_2bit" type="select" label="Using reference genome" help="If your genome of interest is not listed, contact the Galaxy team">
33                    <options from_file="lastz_seqs.loc">
34                        <column name="value" index="1" />
35                        <column name="name" index="0" />
36                    </options>
37                </param>
38            </when>
39            <when value="history">
40                <param name="input1" type="data" format="fasta" label="Select a reference dataset" />
41            </when>
42        </conditional>
43        <param name="out_format" type="select" label="Output format">
44            <option value="sam">SAM</option>
45            <option value="diffs">Polymorphisms</option>
46            <option value="tabular">Tabular</option>
47        </param>
48        <conditional name="params">
49            <param name="source_select" type="select" label="Lastz settings to use" help="For most mapping needs use Commonly used settings. If you want full control use Full List">
50                <option value="pre_set">Commonly used</option>
51                <option value="full">Full Parameter List</option>
52            </param>
53            <when value="pre_set">
54                <param name="pre_set_options" type="select" label="Select mapping mode">
55                    <option value="yasra98">Roche-454 98% identity</option>
56                    <option value="yasra95">Roche-454 95% identity</option>
57                    <option value="yasra90">Roche-454 90% identity</option>
58                    <option value="yasra85">Roche-454 85% identity</option>
59                    <option value="yasra75">Roche-454 75% identity</option>
60                    <option value="yasra95short">Illumina 95% identity</option>
61                    <option value="yasra85short">Illumina 85% identity</option>
62                </param>
63            </when>
64            <when value="full">
65                <param name="strand" type="select" label="Which strand to search?">
66                    <option value="both">Both</option>
67                    <option value="plus">Search forward strand only (the one in the reference)</option>
68                    <option value="minus">Search the reverse complement strand only (opposite of the reference)</option>
69                </param>
70                <param name="seed" type="select" label="Select seeding settings" help="allows you set word size and number of mismatches">
71                    <option value="12of19">Seed hits require a 19 bp word with matches in 12 specific positions</option>
72                    <option value="14of22">Seed hits require a 22 bp word with matches in 14 specific positions</option>
73                </param>
74                <param name="transition" type="select" label="Select transition settings" help="affects the number of allowed transition substitutions">
75                    <option value="transition">Allow one transition in each seed hit</option>
76                    <option value="transition=2">Allow two transitions in a seed hit </option>
77                    <option value="notransition">Don't allow any transitions in seed hits</option>
78                </param>
79                <param name="gfextend" type="select" label="Perform gap-free extension of seed hits to HSPs (high scoring segment pairs)?">
80                    <option value="nogfextend">No</option>
81                    <option value="gfextend">Yes</option>
82                </param>
83                <param name="chain" type="select" label="Perform chaining of HSPs?">
84                    <option value="nochain">No</option>
85                    <option value="chain">Yes</option>
86                </param>
87                <param name="O" type="integer" size="5" value="400" label="Gap opening penalty"/>
88                <param name="E" type="integer" size="5" value="30" label="Gap extension penalty"/>
89                <param name="X" type="integer" size="5" value="910" label="X-drop threshold"/>
90                <param name="Y" type="integer" size="5" value="9370" label="Y-drop threshold"/>
91                <param name="K" type="integer" size="5" value="3000" label="Set the threshold for HSPs (ungapped extensions scoring lower are discarded)"/>
92                <param name="L" type="integer" size="5" value="3000" label="Set the threshold for gapped alignments (gapped extensions scoring lower are discarded)"/>
93                <param name="entropy" type="select" label="Involve entropy when filtering HSPs?">
94                    <option value="noentropy">No</option>
95                    <option value="entropy">Yes</option>
96                </param>
97            </when>   
98        </conditional>
99        <conditional name="seq_name">
100            <param name="how_to_name" type="select" label="Do you want to modify the reference name?">
101                <option value="no">No</option>
102                <option value="yes">Yes</option>
103            </param>
104            <when value="yes">
105                <param name="ref_name" type="text" size="25" value="Type sequence name here" label="Enter name for the Reference sequence"/>
106            </when>
107            <when value="no" />
108        </conditional>
109        <param name="min_ident" type="integer" size="3" value="0" label="Do not report matches below this identity (%)"/>
110        <param name="max_ident" type="integer" size="3" value="100" label="Do not report matches above this identity (%)"/>
111        <param name="min_cvrg" type="integer" size="3" value="0" label="Do not report matches that cover less than this percentage of each read"/>
112        <param name="unmask" type="select" label="Convert lowercase bases to uppercase">
113            <option value="yes">Yes</option>
114            <option value="no">No</option>
115        </param>
116    </inputs>
117    <outputs>
118        <data format="tabular" name="output1">
119            <change_format>
120                <when input="out_format" value="sam" format="sam" />
121            </change_format>
122        </data>
123    </outputs>
124    <requirements>
125        <requirement type="package">lastz</requirement>
126    </requirements>
127    <tests>
128        <test>
129            <!--
130                Lastz command:
131                lastz phiX.2bit/PHIX174[nickname=Ref] test-data/b1.fasta +nogfextend +nochain +gapped +strand=both +seed=12of19 +transition O=400 E=30 X=910 Y=9370 K=3000 L=3000 +noentropy +ambiguousn +nolaj +identity=0..100 +coverage=0 +format=sam- > lastz_wrapper_out2.sam
132                You need to point to phiX.2bit somewhere on your system. b1.fasta is located in galaxy's test-data.  You will have to replace all the pluses before the
133                commands with 2 dashes, as double-dash can't appear in an XML comment.
134            -->
135            <param name="input2" value="b1.fasta" ftype="fasta" />
136            <param name="ref_source" value="cached" />
137            <param name="input1_2bit" value="phiX" />
138            <param name="out_format" value="sam" />
139            <param name="source_select" value="full" />
140            <param name="strand" value="both" />
141            <param name="seed" value="12of19" />
142            <param name="transition" value="transition" />
143            <param name="gfextend" value="nogfextend" />
144            <param name="chain" value="nochain" />
145            <param name="O" value="400" />
146            <param name="E" value="30" />
147            <param name="X" value="910" />
148            <param name="Y" value="9370" />
149            <param name="K" value="3000" />
150            <param name="L" value="3000" />
151            <param name="entropy" value="noentropy" />
152            <!--
153                 how_to_name is not the default. It is changed to modify
154                input1_2bit by adding the ref_name as a nickname
155            -->
156            <param name="how_to_name" value="yes" />
157            <param name="ref_name" value="Ref" />
158            <param name="min_ident" value="0" />
159            <param name="max_ident" value="100" />
160            <param name="min_cvrg" value="0" />
161            <param name="unmask" value="yes" />
162            <output name="output1" file="lastz_wrapper_out2.sam" />
163        </test>
164        <test>
165            <!--
166                Lastz command:
167                lastz test-data/phiX.fasta test-data/b1.fasta[fullnames] +yasra95short +ambiguousn +nolaj +identity=0..100 +coverage=0 +format=diffs > lastz_wrapper_out3.tabular
168                phiX.fasta and b1.fasta are located in galaxy's test-data.  You will have to replace all the pluses before the commands with 2 dashes,
169                as double-dash can't appear in an XML comment.
170            -->
171            <param name="input2" value="b1.fasta" ftype="fasta" />
172            <param name="ref_source" value="history" />
173            <param name="input1" value="phiX.fasta" ftype="fasta" />
174            <param name="out_format" value="diffs" />
175            <param name="source_select" value="pre_set" />
176            <param name="pre_set_options" value="yasra95short" />
177            <param name="how_to_name" value="no" />
178            <param name="min_ident" value="0" />
179            <param name="max_ident" value="100" />
180            <param name="min_cvrg" value="0" />
181            <param name="unmask" value="yes" />
182            <output name="output1" file="lastz_wrapper_out3.tabular" />
183        </test>
184        <test>
185            <!--
186                Lastz command: first you will need to split the file phiX_split.fasta into two files,
187                phiX1.fasta and phiX2.fasta, each with 1 sequence (phiX1 and phiX2, respectively). Then:
188                lastz phiX1.fasta test-data/b1.fasta *yasra95short *ambiguousn *nolaj *identity=0..100 *coverage=0 *format=general-:score,name1,strand1,size1,start1,zstart1,end1,length1,text1,name2,strand2,size2,start2,zstart2,end2,start2+,zstart2+,end2+,length2,text2,diff,cigar,identity,coverage,gaprate,diagonal,shingle > lastz_wrapper_out4.tabular
189                lastz phiX2.fasta test-data/b1.fasta *yasra95short *ambiguousn *nolaj *identity=0..100 *coverage=0 *format=general-:score,name1,strand1,size1,start1,zstart1,end1,length1,text1,name2,strand2,size2,start2,zstart2,end2,start2+,zstart2+,end2+,length2,text2,diff,cigar,identity,coverage,gaprate,diagonal,shingle >> lastz_wrapper_out4.tabular
190                You need to point to phiX1.fasta and phiX2.fasta somewhere on your system.
191                phiX_split.fasta and b1.fasta are located in galaxy's test-data
192                You will have to replace all the asterisks before the commands with 2 dashes,
193                as double-dash can't appear in an XML comment
194               
195                NOTE: since the input file include more than 1 sequence, the output must be sorted in
196                order for functional test to pass.  This is done using the sort="True" attribute on the output.
197            -->
198            <param name="input2" value="b1.fasta" ftype="fasta" />
199            <param name="ref_source" value="history" />
200            <param name="input1" value="phiX_split.fasta" ftype="fasta"  />
201            <param name="out_format" value="tabular" />
202            <param name="source_select" value="pre_set" />
203            <param name="pre_set_options" value="yasra95short" />
204            <param name="how_to_name" value="no" />
205            <param name="min_ident" value="0" />
206            <param name="max_ident" value="100" />
207            <param name="min_cvrg" value="0" />
208            <param name="unmask" value="yes" />
209            <output name="output1" file="lastz_wrapper_out4.tabular" sort="True" />
210        </test>
211    </tests>
212    <help>
213       
214**What it does**   
215       
216**LASTZ** is a high performance pairwise sequence aligner derived from BLASTZ. It is written by Bob Harris in Webb Miller's laboratory at Penn State University. Special scoring sets were derived to improve runtime performance and quality. This Galaxy version of LASTZ is geared towards aligning short (Illumina/Solexa, AB/SOLiD) and medium (Roche/454) reads against a reference sequence. There is excellent, extensive documentation on LASTZ available here_.
217
218 .. _here: http://www.bx.psu.edu/miller_lab/dist/README.lastz-1.02.00/README.lastz-1.02.00.html
219 
220------
221
222**Input formats**
223
224LASTZ accepts reference and reads in FASTA format. However, because Galaxy supports implicit format conversion the tool will recognize fastq and other method specific formats.
225
226------
227
228**Outputs**
229
230LASTZ generates one output. Depending on the choice you make in the *Select output format* drop-down, LASTZ will produce a SAM file showing sequence alignments, a list of differences between the reads and reference (Polymorphisms), or a general table with one line per alignment block (Tabular). Examples of these outputs are shown below.
231
232**SAM output**
233
234SAM has 12 columns::
235
236                                   1     2     3         4   5    6  7         8     9                                    10                                     11  12
237  ----------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
238  HWI-EAS91_1_30788AAXX:1:2:1670:915    99  chr9  58119878  60  36M  =  58120234   392  GACCCCTACCCCACCGTGCTCTGGATCTCAGTGTTT   IIIIIIIIIIIIIIIIEIIIIIII7IIIIIIIIIII  XT:A:U  NM:i:0  SM:i:37  AM:i:37  X0:i:1  X1:i:0  XM:i:0  XO:i:0  XG:i:0  MD:Z:36
239  HWI-EAS91_1_30788AAXX:1:2:1670:915   147  chr9  58120234  60  36M  =  58119878  -392  ATGAGTCGAATTCTATTTTCCAAACTGTTAACAAAA   IFIIDI;IIICIIIIIIIIIIIIIIIIIIIIIIIII  XT:A:U  NM:i:0  SM:i:37  AM:i:37  X0:i:1  X1:i:0  XM:i:0  XO:i:0  XG:i:0  MD:Z:36
240
241
242where::
243
244     Column  Description
245  ---------  ---------------------------------------------------------------------   
246   1. QNAME  Query (pair) NAME
247   2. FLAG   bitwise FLAG
248   3. RNAME  Reference sequence NAME
249   4. POS    1-based leftmost POSition/coordinate of clipped sequence
250   5. MAPQ   MAPping Quality (Phred-scaled)
251   6. CIGAR  extended CIGAR string
252   7. MRNM   Mate Reference sequence NaMe ('=' if same as RNAME)
253   8. MPOS   1-based Mate POSition
254   9. ISIZE  Inferred insert SIZE
255  10. SEQ    query SEQuence on the same strand as the reference
256  11. QUAL   query QUALity (ASCII-33 gives the Phred base quality)
257  12. OPT    variable OPTional fields in the format TAG:VTYPE:VALUE, tab-separated
258 
259The flags are as follows::
260
261    Flag  Description
262  ------  -------------------------------------
263  0x0001  the read is paired in sequencing
264  0x0002  the read is mapped in a proper pair
265  0x0004  the query sequence itself is unmapped
266  0x0008  the mate is unmapped
267  0x0010  strand of the query (1 for reverse)
268  0x0020  strand of the mate
269  0x0040  the read is the first read in a pair
270  0x0080  the read is the second read in a pair
271  0x0100  the alignment is not primary
272
273**Polymorphism (SNP or differences) output**
274
275Polymorphism output contains 14 columns::
276
277     1     2     3  4     5                                   6   7   8  9  10  11 12                                   13                                    14
278  --------------------------------------------------------------------------------------------------------------------------------------------------------------
279  chrM  2490  2491  +  5386  HWI-EAS91_1_306UPAAXX:6:1:486:822   10  11  -  36  C  A  ACCTGTTTTACAGACACCTAAAGCTACATCGTCAAC  ACCTGTTTTAAAGACACCTAAAGCTACATCGTCAAC
280  chrM  2173  2174  +  5386  HWI-EAS91_1_306UPAAXX:6:1:259:1389  26  27  +  36  G  T  GCGTACTTATTCGCCACCATGATTATGACCAGTGTT  GCGTACTTATTCGCCACCATGATTATTACCAGTGTT
281
282where::
283
284  1. (chrM)   - Reference sequence id
285  2. (2490)   - Start position of the difference in the reference
286  3. (2491)   - End position of the difference in the reference
287  4. (+)      - Strand of the reference (always plus)
288  5. (5386)   - Length of the reference sequence
289  6. (HWI...) - read id
290  7. (10)     - Start position of the difference in the read
291  8. (11)     - End position of the difference in the read
292  9. (+)      - Strand of the read
293 10. (36)     - Length of the read
294 11. (C)      - Nucleotide in the reference
295 12. (A)      - Nucleotide in the read
296 13. (ACC...) - Reference side os the alignment
297 14. (ACC...) - Read side of the alignment
298 
299**Tabular output**
300
301Tabular output is a tab-separated format with 30 columns::
302
303   1        2  3     4     5     6     7   8                 9              10  11   12   13   14   15   16   17   18  19                20                21   22     23      24      25    26    27    28    29  30
304  -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
305  14  PHIX174  +  5386  4648  4647  4661  14  ATTTTCGTGATATT    EYKX4VC01BV8HS  +   204  154  153  167  154  153  167  14  ATTTTCGTGATATT    ..............    14M  14/14  100.0%  14/204  6.9%  0/14  0.0%  4494  NA
306  16  PHIX174  +  5386  3363  3362  3378  16  GACGCCGGATTTGAGA  EYKX4VC01AWJ88  -   259   36   35   51  209  208  224  16  GACGCCGGATTTGAGA  ................  16M  16/16  100.0%  16/259  6.2%  0/16  0.0%  3327  NA
307
308The following columns are present::
309
310             Field  Meaning
311  ----------------  -------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------------
312   1.        score  Score of the alignment block. The scale and meaning of this number will vary, depending on the final stage performed and other command-line options.
313   2.        name1  Name of the target sequence.
314   3.      strand1  Target sequence strand, either "+" or "竏�.
315   4.        size1  Size of the entire target sequence.
316   5.       start1  Starting position of the alignment block in the target, origin-one.
317   6.      zstart1  Starting position of the alignment block in the target, origin-zero.
318   7.         end1  Ending position of the alignment block in the target, expressed either as origin-one closed or origin-zero half-open (the ending value is the same in both systems).
319   8.      length1  Length of the alignment block in the target (excluding gaps).
320   9.        text1  Aligned characters in the target, including gap characters.
321  10.        name2  Name of the query sequence.
322  11.      strand2  Query sequence strand, either "+" or "竏�.
323  12.        size2  Size of the entire query sequence.
324  13.       start2  Starting position of the alignment block in the query, origin-one.
325  14.      zstart2  Starting position of the alignment block in the query, origin-zero.
326  15.         end2  Ending position of the alignment block in the query, expressed either as origin-one closed or origin-zero half-open (the ending value is the same in both systems).
327  16.      start2+  Starting position of the alignment block in the query, counting along the query sequence's positive strand (regardless of which query strand was aligned), origin-one. Note that if strand2 is "竏�, then this is the other end of the block from start2.
328  17.     zstart2+  Starting position of the alignment block in the query, counting along the query sequence's positive strand (regardless of which query strand was aligned), origin-zero. Note that if strand2 is "竏�, then this is the other end of the block from zstart2.
329  18.        end2+  Ending position of the alignment block in the query, counting along the query sequence's positive strand (regardless of which query strand was aligned), expressed either as origin-one closed or origin-zero half-open (the ending value is the same in both systems). Note that if strand2 is "竏�, then this is the other end of the block from end2.
330  19.      length2  Length of the alignment block in the query (excluding gaps).
331  20.        text2  Aligned characters in the query, including gap characters.
332  21.         diff  Differences between what would be written for text1 and text2. Matches are written as . (period), transitions as : (colon), transversions as X, and gaps as - (hyphen).
333  22.        cigar  A CIGAR-like representation of the alignment's path through the Dynamic Programming matrix. This is the short representation, without spaces, described in the Ensembl CIGAR specification.
334  23./24. identity  Fraction of aligned bases in the block that are matches (see Identity). This is written as two fields. The first field is a fraction, written as &lt;n&gt;/&lt;d&gt;. The second field contains the same value, computed as a percentage.
335  25./26. coverage  Fraction of the entire input sequence (target or query, whichever is shorter) that is covered by the alignment block (see Coverage). This is written as two fields. The first field is a fraction, written as &lt;n&gt;/&lt;d&gt;. The second field contains the same value, computed as a percentage.
336  27./28.  gaprate  Rate of gaps (also called indels) in the alignment block. This is written as two fields. The first field is a fraction, written as &lt;n&gt;/&lt;d&gt;, with the numerator being the number of alignment columns containing gaps and the denominator being the number without gaps. The second field contains the same value, computed as a percentage.
337  29.     diagonal  The diagonal of the start of the alignment block in the dynamic programming matrix, expressed as an identifying number start1-start2.
338  30.      shingle  A measurement of the shingle overlap between the target and the query. This is intended for the case where both the target and query are relatively short, and their ends are expected to overlap. 
339
340-------
341
342**LASTZ Settings**
343
344There are two setting modes: (1) **Commonly used settings** and (2) **Full Parameter List**.
345
346**Commonly used settings**
347
348There are seven modes::
349
350  Illumina-Solexa/AB-SOLiD 95% identity
351  Illumina-Solexa/AB-SOLiD 85% identity
352  Roche-454 98% identity
353  Roche-454 95% identity
354  Roche-454 90% identity
355  Roche-454 85% identity
356  Roche-454 75% identity
357
358When deciding which one to use, consider the following: a 36 bp read with two differences will be 34/36 = 94% identical to the reference. 
359
360**Full Parameter List**
361
362This mode gives you fuller control over lastz. The description of these and other parameters is found at the end of this page. Note that not all parameters are included in this interface. If you would like to make additional options available through Galaxy, e-mail us at galaxy-bugs@bx.psu.edu.
363
364------
365
366**Do you want to modify the reference name?**
367
368This option allows you to set the name of the reference sequence manually. This is helpful when, for example, you would like to make the reference name compatible with the UCSC naming conventions to be able to display your lastz results as a custom track at the UCSC Genome Browser.
369
370------
371
372**LASTZ parameter list**
373
374This is an exhaustive list of LASTZ options. Once again, please note that not all options are included in this interface. If you would like to make additional options available through Galaxy, e-mail us at galaxy-bugs@bx.psu.edu::
375
376  target[[s..e]][-]       spec/file containing target sequence (fasta or nib)
377                          [s..e] defines a subrange of the file
378                          - indicates reverse-complement
379                          (use --help=files for more details)
380  query[[s..e]][-]        spec/file containing query sequences (fasta or nib)
381                          if absent, queries come from stdin (unless they
382                          aren't needed, as for --self or --tableonly)
383                          (use --help=files for more details)
384  --self                  the target sequence is also the query
385  --quantum               the query sequence contains quantum DNA
386  --seed=match&lt;length&gt;    use a word with no gaps instead of a seed pattern
387  --seed=half&lt;length&gt;     use space-free half-weight word instead of seed pattern
388  --match=&lt;reward&gt;[,&lt;penalty&gt;]   set the score values for a match (+&lt;reward&gt;)
389                          and mismatch (-&lt;penalty&gt;)
390  --[no]trans[ition][=2]         allow one or two transitions in a seed hit
391                          (by default a transition is allowed)
392  --word=&lt;bits&gt;           set max bits for word hash;  use this to trade time for
393                          memory, eliminating thrashing for heavy seeds
394                          (default is 28 bits)
395  --[no]filter=[&lt;T&gt;:]&lt;M&gt;     filter half-weight seed hits, requiring at least M
396                          matches and allowing no more than T transversions
397                          (default is no filtering)
398  --notwins               require just one seed hit
399  --twins=[&lt;min&gt;:]&lt;maxgap&gt;   require two nearby seed hits on the same diagonal
400                          (default is twins aren't required)
401  --notwins               allow single, isolated seeds
402  --[no]recoverseeds      avoid losing seeds in hash collisions. Cannot be used with --twins
403  --seedqueue=&lt;entries&gt;   set number of entries in seed hit queue
404                          (default is 262144)
405  --anchors=&lt;file&gt;        read anchors from a file, instead of discovering anchors
406                          via seeding
407  --recoverhits           recover hash-collision seed hits
408                          (default is not to recover seed hits)
409  --step=&lt;length&gt;         set step length (default is 1)
410  --maxwordcount=&lt;limit&gt;  words occurring more often than &lt;limit&gt; in the target
411                          are not eligible for seeds
412  --strand=both           search both strands
413  --strand=plus           search + strand only (matching strand of query spec)
414  --strand=minus          search - strand only (opposite strand of query spec)
415                          (by default both strands are searched)
416  --ambiguousn            treat N as an ambiguous nucleotide
417                          (by default N is treated as a sequence splicing character)
418  --[no]gfextend          perform gap-free extension of seed hits to HSPs
419                          (by default no extension is performed)
420  --[no]chain             perform chaining
421  --chain=&lt;diag,anti&gt;     perform chaining with given penalties for diagonal and
422                          anti-diagonal
423                          (by default no chaining is performed)
424  --[no]gapped            perform gapped alignment (instead of gap-free)
425                          (by default gapped alignment is performed)
426  --score[s]=&lt;file&gt;         read substitution scores from a file
427                          (default is HOXD70)
428  --unitscore[s]          scores are +1/-1 for match/mismatch
429  --gap=&lt;[open,]extend&gt;   set gap open and extend penalties (default is 400,30)
430  --xdrop=&lt;score&gt;         set x-drop threshold (default is 10*sub[A][A])
431  --ydrop=&lt;score&gt;         set y-drop threshold (default is open+300extend)
432  --infer[=&lt;control&gt;]     infer scores from the sequences, then use them
433  --inferonly[=&lt;control&gt;]   infer scores, but don't use them (requires --infscores)
434                          all inference options are read from the control file
435  --infscores[=&lt;file&gt;]    write inferred scores to a file
436  --hspthresh=&lt;score&gt;     set threshold for high scoring pairs (default is 3000)
437                          ungapped extensions scoring lower are discarded
438                          &lt;score&gt; can also be a percentage or base count
439  --entropy               adjust for entropy when qualifying HSPs in the x-drop extension
440                          method
441  --noentropy             don't adjust for entropy when qualifying HSPs
442  --exact=&lt;length&gt;        set threshold for exact matches
443                          if specified, exact matches are found rather than high
444                          scoring pairs (replaces --hspthresh)
445  --inner=&lt;score&gt;         set threshold for HSPs during interpolation
446                          (default is no interpolation)
447  --gappedthresh=&lt;score&gt;  set threshold for gapped alignments
448                          gapped extensions scoring lower are discarded
449                          &lt;score&gt; can also be a percentage or base count
450                          (default is to use same value as --hspthresh)
451  --ball=&lt;score&gt;          set minimum score required of words 'in' a quantum ball
452  --[no]entropy           involve entropy in filtering high scoring pairs
453                          (default is "entropy")
454  --[no]mirror            report/use mirror image of all gap-free alignments
455                          (default is "mirror" for self-alignments only)
456  --traceback=&lt;bytes&gt;     space for trace-back information
457                          (default is 80.0M)
458  --masking=&lt;count&gt;       mask any position in target hit this many times
459                          zero indicates no masking
460                          (default is no masking)
461  --targetcapsule=&lt;capsule_file&gt;   the target seed word position table and seed
462                          (as well as the target sequence)are read from specified file
463  --segments=&lt;segment_file&gt;   read segments from a file, instead of discovering
464                          them via seeding. Replaces other seeding or gap-free extension
465                          options
466  --[no]census[=&lt;file&gt;]     count/report how many times each target base aligns
467                          (default is to not report census)
468  --identity=&lt;min&gt;[..&lt;max&gt;]   filter alignments by percent identity
469                          0&lt;=min&lt;=max&lt;=100;  blocks (or HSPs) outside min..max
470                          are discarded
471                          (default is no identity filtering)
472  --coverage=&lt;min&gt;[..&lt;max&gt;]   filter alignments by percentage pf query covered
473                          0&lt;=min&lt;=max&lt;=100;  blocks (or HSPs) outside min..max
474                          are discarded
475                          (default is no query coverage filtering)
476  --notrivial             do not output trivial self-alignment block if the target and query
477                          sequences are identical. Using --self enables this option automatically
478  --output=&lt;output_file&gt;  write the alignments to the specified file name instead of stdout
479  --code=&lt;file&gt;           give quantum code for query sequence (only for display)
480  --format=&lt;type&gt;         specify output format; one of lav, axt, maf, maf+, maf-, text,
481                          lav+text, cigar, text, rdplot, general, or general:&lt;fields&gt;
482                          (by default output is LAV)
483  --rdotplot=&lt;file&gt;       create an additional output file suitable for plotting the alignments
484                          with the R statistical package.
485  --markend               Just before normal completion, write "# lastz end-of-file" to output file
486  --census[=&lt;output_file&gt;]    count and report how many times each target base aligns, up
487                          to 255. Ns are included in the count
488  --census16[=&lt;output_file&gt;]  count and report how many times each target base aligns, up
489                          up 65 thousand
490  --census32[=&lt;output_file&gt;]  count and report how many times each target bas aligns, up
491                          to 4 billion
492  --writecapsule=&lt;capsule_file&gt;    just write out a targegt capsule file and quit; don't
493                          search for seeds or perform subsequent stages
494  --verbosity=&lt;level&gt;     set info level (0 is minimum, 10 is everything)
495                          (default is 0)
496  --[no]runtime           report runtime in the output file
497                          (default is to not report runtime)
498  --tableonly[=count]     just produce the target position table, don't
499                          search for seeds
500  --[no]stats[=&lt;file&gt;]    show search statistics (or don't)
501                          (not available in this build)
502  --version               report the program version and quit
503  --help                  list all options
504  --help=files            list information about file specifiers
505  --help=short[cuts]      list blastz-compatible shortcuts
506  --help=yasra            list yasra-specific shortcuts
507
508    </help>
509</tool>
Note: リポジトリブラウザについてのヘルプは TracBrowser を参照してください。