# HG changeset patch # User iuc # Date 1572707537 14400 # Node ID 5804f786060d9fd1ef1b8574847c75d78f0e0061 # Parent efe8f0e53d3efac60675966000329f088207010a "planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/snp-sites commit e4222f6179041846870721bfcb4d8e587ead8d8f" diff -r efe8f0e53d3e -r 5804f786060d snp-sites.xml --- a/snp-sites.xml Fri Jun 30 16:43:26 2017 -0400 +++ b/snp-sites.xml Sat Nov 02 11:12:17 2019 -0400 @@ -1,30 +1,140 @@ - + from a multi-FASTA alignment file + + 2.5.1 + - snp-sites + snp-sites snp-sites -V &2 && exit 1 ; + #set outputs="" + #else + #set outputs=" ".join(str($out_type.formats).split(",")) + #end if +#end if + snp-sites --mvp --o output -'$input_fasta' +#if str($out_type.ot_select) == "alignment" + $outputs + $out_type.b + $out_type.c +#else if str($out_type.ot_select) == "counts" + -C +#end if + -o output + '$input_fasta' + +#if str($out_type.ot_select) == "counts" + && mv output $output_counts +#else if ',' in str($out_type.formats) + #if '-m' in str($out_type.formats) + && mv 'output.snp_sites.aln' '$output_fasta' + #end if + #if '-v' in str($out_type.formats) + && mv 'output.vcf' '$output_vcf' + #end if + #if '-p' in str($out_type.formats) + && mv 'output.phylip' '$output_phylip' + #end if +#else + #if str($out_type.formats) == '-m' + && mv 'output' '$output_fasta' + #else if str($out_type.formats) == '-v' + && mv 'output' '$output_vcf' + #else if str($out_type.formats) == '-p' + && mv 'output' '$output_phylip' + #end if +#end if ]]> + + + + + + + + + + + + + + + + + + - - - + + + (out_type["ot_select"] == "alignment" and out_type["formats"] is not None and '-m' in out_type["formats"]) or (out_type["ot_select"] == "alignment" and out_type.formats is None) + + + out_type["ot_select"] == "alignment" and out_type["formats"] is not None and '-v' in out_type["formats"] + + + out_type["ot_select"] == "alignment" and out_type["formats"] is not None and '-p' in out_type["formats"] + + + out_type["ot_select"] == "counts" + - + + + + + + + + + + + + + + + + + + + + - - - + + + + + + + + + + + + + + + + + + + + + + + + @@ -32,7 +142,11 @@ **SNP-sites** -This tool can rapidly extract SNPs from a multi-FASTA alignment using modest resources and can output results in multiple formats for downstream analysis. SNPs can be extracted from a 8.3 GB alignment file (1,842 taxa, 22,618 sites) in 267 seconds using 59 MB of RAM and 1 CPU core, making it feasible to run on modest computers. SNP-sites is implemented in C and is available under the open source license GNU GPL version 3. +This tool can rapidly extract SNPs from a multi-FASTA alignment using modest resources and can output results in multiple formats for downstream analysis. SNPs can be extracted from a 8.3 GB alignment file (1,842 taxa, 22,618 sites) in 267 seconds using 59 MB of RAM and 1 CPU core, making it feasible to run on modest computers. +SNP-sites is implemented in C and is available under the open source license GNU GPL version 3. + +Alternatively it can report on the number of constant sites in an alignment in a format (A count, C count, G count, T count) suitable for passing +to IQ-TREE's `-fconst` option. **Input FASTA format:** @@ -49,6 +163,16 @@ >sample1 AAACGCATTCAN +**Options** + +In addition to the default output mode, this tool supports three other options: + +1. Output only constant (monomorphic) (i.e. not polymorphic) sites (useful for input to BEAST) + +2. Output only columns that have purely ACTGs in them (i.e. no gaps or ambiguous nucleotides). This can be used together with the previous option. + +3. Output only a count of constant sites, in a format suitable for use with IQ-TREE `-fconst`. This option cannot be used together with the previously mentioned options. + **Output files:** The output of the tool are three different files in following format: @@ -56,6 +180,7 @@ - a multi fasta alignment, - relaxed phylip format and, - VCF. +- alternatively constant site counts (As, Cs, Gs and Ts). The VCF file for the above specified input is diff -r efe8f0e53d3e -r 5804f786060d test-data/output_actg.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/output_actg.fasta Sat Nov 02 11:12:17 2019 -0400 @@ -0,0 +1,6 @@ +>sample1 +GA +>sample1 +GA +>sample1 +AG diff -r efe8f0e53d3e -r 5804f786060d test-data/output_counts.tabular --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/output_counts.tabular Sat Nov 02 11:12:17 2019 -0400 @@ -0,0 +1,1 @@ +4,4,0,1 diff -r efe8f0e53d3e -r 5804f786060d test-data/output_monomorphic.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/output_monomorphic.fasta Sat Nov 02 11:12:17 2019 -0400 @@ -0,0 +1,6 @@ +>sample1 +AGACACAGTCAC +>sample1 +AGACAC----AC +>sample1 +AAACGCATTCAN diff -r efe8f0e53d3e -r 5804f786060d test-data/output_monomorphic_actg.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/output_monomorphic_actg.fasta Sat Nov 02 11:12:17 2019 -0400 @@ -0,0 +1,6 @@ +>sample1 +AGACACA +>sample1 +AGACACA +>sample1 +AAACGCA