Mercurial > repos > earlhaminst > ete
changeset 6:f1eca1158f21 draft
planemo upload for repository https://github.com/TGAC/earlham-galaxytools/tree/master/tools/ete commit 133bb57feca9672734d664e6b34e428488cf2e73
| author | earlhaminst |
|---|---|
| date | Wed, 10 Oct 2018 05:24:04 -0400 |
| parents | 817031b8486d |
| children | 6a5282f71f82 |
| files | ete_genetree_splitter.xml ete_homology_classifier.py ete_lineage_generator.py ete_lineage_generator.xml ete_macros.xml ete_species_tree_generator.xml test-data/lineage-compress-lower.txt test-data/lineage-compress.txt test-data/lineage-full.txt test-data/lineage-wid.txt test-data/lineage.txt |
| diffstat | 11 files changed, 99 insertions(+), 15 deletions(-) [+] |
line wrap: on
line diff
--- a/ete_genetree_splitter.xml Thu May 10 06:15:17 2018 -0400 +++ b/ete_genetree_splitter.xml Wed Oct 10 05:24:04 2018 -0400 @@ -1,4 +1,4 @@ -<tool id="ete_genetree_splitter" name="ETE GeneTree splitter" version="@VERSION@.1"> +<tool id="ete_genetree_splitter" name="ETE GeneTree splitter" version="@VERSION@"> <description>from a genetree using the ETE Toolkit</description> <macros> <import>ete_macros.xml</import>
--- a/ete_homology_classifier.py Thu May 10 06:15:17 2018 -0400 +++ b/ete_homology_classifier.py Wed Oct 10 05:24:04 2018 -0400 @@ -17,8 +17,13 @@ if options.genetree is None: parser.error("--genetree option must be specified, GeneTree in nhx format") + with open(options.genetree, 'r') as f: + contents = f.read() + + # Remove empty NHX features that can be produced by TreeBest but break ete3 + contents = contents.replace('[&&NHX]', '') # reads single gene tree - genetree = PhyloTree(options.genetree) + genetree = PhyloTree(contents) leaves_list = genetree.get_leaf_names() # Genetree nodes are required to be in gene_species format
--- a/ete_lineage_generator.py Thu May 10 06:15:17 2018 -0400 +++ b/ete_lineage_generator.py Wed Oct 10 05:24:04 2018 -0400 @@ -69,6 +69,8 @@ help='Prefer lower levels when compressed') parser.add_option('-r', '--rank', dest='ranks', action="append", help='include rank - multiple ones can be specified') +parser.add_option('-i', '--includeid', dest="addid", action="store_true", default=False, + help='add taxid column') options, args = parser.parse_args() # check command line options @@ -106,8 +108,13 @@ for ilr in range(len(LONG_RANKS)): if RANKS[ir] in LONG_RANKS[ilr]: COMP_RANK_IDX[LONG_RANKS[ilr]] = ir + # write header -of.write("#species/taxid\t%s\n" % ("\t".join(RANKS))) +of.write("# query") +if options.addid: + of.write("\ttaxid") +of.write("\t%s\n" % ("\t".join(RANKS))) + # get and write data with open(options.input_species_filename) as f: for line in f.readlines(): @@ -128,5 +135,8 @@ process_taxid(ncbi, taxid, ranks, RANK_IDX) if options.compress: process_taxid(ncbi, taxid, ranks, COMP_RANK_IDX, options.lower) - of.write("%s\t%s\n" % (line, "\t".join(ranks))) + of.write("%s" % line) + if options.addid: + of.write("\t%d" % taxid) + of.write("\t%s\n" % "\t".join(ranks)) of.close()
--- a/ete_lineage_generator.xml Thu May 10 06:15:17 2018 -0400 +++ b/ete_lineage_generator.xml Wed Oct 10 05:24:04 2018 -0400 @@ -20,6 +20,7 @@ $compresscond.compress $compresscond.lower #end if +$includeid ]]></command> <inputs> <param name="speciesFile" type="data" format="txt" label="Species file" help="List with one species/taxid per line" /> @@ -68,17 +69,16 @@ </conditional> <conditional name="compresscond"> <param name="compress" type="select" label="Fill unnamed ranks" help="Fill unnamed ranks with super/sub ranks (see -l)"> - <option value="-c">Yes</option> + <option value="-c" selected="True">Yes</option> <option value="">No</option> </param> <when value="-c"> - <param name="lower" type="select" label="Prefer lower ranks for filling" help="Prefer lower levels for filling"> - <option value="-l">Yes</option> - <option value="">No</option> - </param> + <param name="lower" type="boolean" truevalue="-l" falsevalue="" checked="False" label="Prefer lower ranks" help="Take the next available lower rank (default: higher)"/> </when> <when value="" /> </conditional> + <param name="includeid" type="boolean" truevalue="--includeid" falsevalue="" label="Include taxid in the table" + help="For the case when the input consists of taxon names" /> </inputs> <outputs> <data name="outputFile" format="tsv" label="${tool.name} on ${on_string}"/> @@ -114,6 +114,12 @@ <param name="manualranks" value="kingdom,family" /> <output name="outputFile" file="lineage-full.txt" /> </test> + <test> + <param name="speciesFile" ftype="txt" value="species.txt" /> + <param name="database" ftype="sqlite" value="taxdump.sqlite" /> + <param name="includeid" value="--includeid" /> + <output name="outputFile" file="lineage-wid.txt" /> + </test> </tests> <help><