# HG changeset patch # User dcorreia # Date 1461326693 14400 # Node ID aea74cec21e07aafb70f34c17431391e8b7953e2 # Parent df98a0425c8d74cafd33e996fc6d27b8514f3dfa Uploaded diff -r df98a0425c8d -r aea74cec21e0 fastme.xml --- a/fastme.xml Fri Dec 11 09:51:04 2015 -0500 +++ b/fastme.xml Fri Apr 22 08:04:53 2016 -0400 @@ -1,193 +1,201 @@ - - - - Calculate distance tree for an alignment file - - + + Distance-based inference of phylogenetic trees - perl - fastme + fastme - - + + + - + fastme --input_data=$input + --output_tree=$outputTree + --output_matrix=$outputMatrix + --output_info=$outputLog + --nb_threads=\${GALAXY_SLOTS:-1} - - - - fastme --input_data=$input_data --dna=$model --output_tree=$fileout - #if str( $distance ) == "SPR": - --spr - #elif str( $distance )[:3] == "NNI" : - #if str( $distance ) == "NNI_B" : - --nni=B - #else : - --nni=O - #end if + #if $typeChoice.datatype =="d" + --dna=$typeChoice.modeldna + + #else if $typeChoice.datatype =="p" + --protein=$typeChoice.modelprot + + #else if $typeChoice.datatype =="cfg": + ## Read information of sequence type + ## read an info file to choose which option set and set a model by default + #set $info = open( str($input_info) ).read() + #if 'dna' in $info: + --dna=T + #else if 'protein' in $info: + --protein=L + #end if + #end if + + #if $gammaChoice.gamma == "true" + --gamma=$gammaChoice.rate + #end if + + $distance + $equilibrium + $removeGap + $treeRefinement + + #if $bootChoice.boot == "true" + --output_boot=$outputBoostrap + --bootstrap=$bootChoice.replicates + #end if + + >> tmp_stdout; + cat tmp_stdout > $outputLog; - #else : - --method=$distance - #end if - > $fileout_log - - - - - - - - - - - - - - - - + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + - - - - - - - - - + + + + + + + + + + + + + - - - + + + + + + + + + + + - - + + + + bootChoice['boot'] == "true" + + - - - - - - - - + + + + + + - - - - - .. 
class:: infomark -**Authors** - | Richard Desper and Olivier Gascuel, - | Journal of Computational Biology 19(5), 687-705, 2002. - | Molecular Biology and Evolution 21(3), 587-598, 2004. - | Please cite these papers if you use this software in your publications. +**FastME version 2.1.4** .. class:: infomark -**Galaxy integration** Andres Gwendoline, Institut Français de Bioinformatique. -.. class:: infomark - -**Support** For any questions about Galaxy integration, please send an e-mail to support.abims@sb-roscoff.fr - ---------------------------------------------------- +**Galaxy integration** Andres Gwendoline, Institut Français de Bioinformatique. Correia Damien, CNRS. +**Support** For any questions about Galaxy integration, please send an e-mail to vincent.lefort@lirmm.fr -====== -FastMe -====== +----- + + +############ +FastME 2.0 +############ + +Comprehensive, accurate and fast distance-based phylogeny inference program + ----------- Description ----------- - - FastME - A distance based phylogeny reconstruction algorithm. - - FastME showed better topological accuracy than NJ, - BIONJ, WEIGHBOR and FITCH, in all evolutionary - conditions we tested, which include large range - deviations from molecular clock and substitution rates. - - - ------------------ -Workflow position ------------------ - -**Upstream tools** - -=========== ========================== ======= -Name output file(s) format -=========== ========================== ======= -Readseq phylip conversion phylip -=========== ========================== ======= - - -**Downstream tools** - -=========== ========================== ======= -Name output file(s) format -=========== ========================== ======= -Rooting out tree Newick -=========== ========================== ======= +FastME provides distance algorithms to infer phylogenies. It's based on balanced minimum evolution, which is the very principle of NJ. 
- ----------- -Input file ----------- - -Phylip file - Phylip file with sequence alignments - - ----------- -Parameters ----------- - -Output name - Output base name for the ouput files - -Evolutionary model - Indicate the evolutionary [model] which can be choosen from:p-distance, RY symmetric, RY, JC69, K2P, F81, F84 (default), TN93, LogDet. - -Distance methode - FastME computes a tree using a distance algorithm. You may choose this method/topologie from: TaxAdd_BalME, TaxAdd_OLSME, BIONJ (default), NJ, UNJ, NNI_BalME, NNI_OLS or SPR - ------------- -Output files ------------- - -Output_name - Resulting tree at Newick format - -Output_name.log - Log file +FastME included Nearest Neighbor Interchange (NNI) and also Subtree Pruning and Regrafting (SPR), while remaining as fast as NJ and providing a number of facilities: distance estimation for DNA and proteins with various models and options, bootstrapping, and parallel computations. ------------ Dependencies ------------ FastME - http://www.atgc-montpellier.fr/fastme - + http://www.atgc-montpellier.fr/fastme + --------------------------------------------------- @@ -199,54 +207,154 @@ Input files =========== -Philip file ------------ +**Phylip file**:: + -:: + 4 120 + Orangutan CCAAACGACA TTTCATATGC TGTCATTTCT GAAGATATGA GACAAGTGAG CTGTCCGGAA + Gorilla CCAAACAACA TTTCATGTGC TGTCATTTCT GAAGATATGA GACAAGTGAG CTCTCCGAAA + Human CCAAACAACA TTTCATGTGC TGTCATTTCT GAAGATAAGA GACAAGTGAG CTCTCCGAAA + Chimp CCAAACAACA TTTCATGTGC TGTCATTTCT GAAGATATGA GACAAGTGAG CTCTCCGAAA - 168 5125 - IRAT112 GAGAACCGTC CTGTAAGTAC TCTTGCTTTA AGTAATAAAG TAATACTAAT - KARASUKARA GAGAACCGTC CTGTAAGTAC TCTTGCTTTA AATACGAAAG TAATACTAAT + CCAACATATC AGACATATGT GAATTTCAAT TATTGTACGG GCATCCTGGG CTCTCAAAGT + CCAAGATATC AGACATTTAT GAATTTCAAT TATTGTACGG GCATCCTGGG CTCTCAAAGT + CCAAGATACC AGACATTTGT GAATTTCAAT TATTGTACTG GCATCCTGGG CTCTCAAAGT + CCAAGATATC AGACATTTAT GAATTTCAAT TATTGTACTG GCATCCTGGG CTCTCAAAGT + + Parameters ========== -Output name -> 
Newick tree +:: -Evolutionary model -> F84 + Output name: Newick tree + Evolutionary model : TN93 + Distance method : BIONJ -Distance methode -> BIONJ Output files ============ -Newick tree ------------ +**Newick tree**:: + + ((Gorilla:0.005755,Orangutan:0.020680):0.001063,Human:0.006655,Chimp:0.002132); + +----- + +OPTIONS +======= + + + -i file, --input_data=file + The input data file contains sequence alignment(s) or a distance matrix(ces). + + -u input_tree_file, --user_tree=input_tree_file + FastME may use an existing topology available in the input user tree file which corresponds to the input dataset. + + -o output_tree_file, --output_tree=output_tree_file + FastME will write the inferred tree into the output tree file. + + -O output_matrix_file, --output_matrix=output_matrix_file + Use output matrix file option if you want FastME to write the distances + matrix computed from the input alignment in the output matrix file. + + -I output_information_file, --output_info=output_information_file + Use this option if you want FastME to write information + about its execution in the output information file. + + -B output_bootstrap_trees_file, --output_boot=output_bootstrap_trees_file + Use this option if you want FastME to write bootstrap trees + in the bootstrap trees file. + + -a, --append + Use this option to append results to existing output files (if any). + By default output files will be overwritten. + + -m method, --method=method + FastME computes a tree using a distance algorithm. + You may choose this method from: + TaxAdd_(B)alME, TaxAdd_(O)LSME, B(I)ONJ (default), + (N)J or (U)NJ. + + -d model, --dna=model + Use this option if your input data file contains DNA sequences alignment(s). + You may also indicate the evolutionary [model] which can be chosen from: + (p)-distance, R(Y) symmetric, (R)Y, (J)C69, (K)2P, F8(1), F8(4) (default), (T)N93, (L)ogDet. 
+ + -p model, --protein=model + Use this option if your input data file contains protein sequences alignment(s). + You may also indicate the evolutionary [model] which can be chosen from: + (p)-distance, (F)81 like, (L)G (default), (W)AG, (J)TT, Day(h)off, (D)CMut, (C)pRev, + (M)tREV, (R)tREV, HIV(b), H(I)Vw or FL(U). + + -r, --remove_gap + Use this option to completely remove any site which has a gap in + any sequence. By default, FastME is doing pairwise deletion of gaps. -:: + -e, --equilibrium + The equilibrium frequencies for DNA are always estimated by counting + the occurrence of the nucleotides in the input alignment. + For amino-acid sequences, the equilibrium frequencies are estimated + using the frequencies defined by the substitution model. + Use this option if you wish to estimate the amino-acid frequencies + by counting their occurrence in the input alignment. + + -g alpha, --gamma=alpha + Use this option if you wish to have gamma distributed rates across sites. + By default, FastME runs with no gamma variation. + If running FastME with gamma distributed rates across sites, the [alpha] default value is 1.0. + Only helpful when the input data file contains sequences alignment(s). + + -n NNI, --nni=NNI + Use this option to do [NNI] tree topology improvement. + You may choose the [NNI] type from: + NNI_(B)alME (default) or NNI_(O)LS. + + -s, --spr + Use this option to do SPR tree topology improvement. + + -w branch, --branch_length=branch + Use this option to indicate the branch length to assign to the tree. + Only helpful when not improving the tree topology (no NNI nor SPR). + You may choose the branch length from: + (B)alLS (default), (O)LS or (n)one. (n)one is only available with BIONJ, NJ or UNJ. - (((((((((((((((((((((((((GOGOLEMPUK:0.001198,GOGOLEMPAK:0.002128):0.030378,TREMBESE:0.013258):0.055246,(((JIMBRUKJOL:0.045219,KETANKONIR:0.035298):0.006267, ... 
- + -D datasets, --datasets=datasets + Use this option to indicate the number of datasets in your input + data file. Default value is 1. + + -b replicates, --bootstrap=replicates + Use this option to indicate the number of replicates FastME will + do for bootstrapping. Default value is 0. + Only helpful when the input data file contains sequences alignment(s). + + -z seed, --seed=seed + Use this option to initialize randomization with seed value. Only helpful when bootstrapping. + + -c Use this option if you want FastME only to compute distance matrix. + Only helpful when the input data file contains sequences alignment(s). + + -T number_of_threads, --nb_threads=number_of_threads + Use this option to set the number of threads to use. + Default number of threads is 4. + + -v value, --verbose=value + Sets the verbose level to value [0-3]. Default value is 0 + + -V, --version + Prints the FastME version. + + -h, --help Display this usage. + + +For further information, please visit FastME_ + +.. _FastME: http://www.atgc-montpellier.fr/fastme/usersguide.php - - - -@article{Lefort30062015, -author = {Lefort, Vincent and Desper, Richard and Gascuel, Olivier}, -title = {FastME 2.0: A Comprehensive, Accurate, and Fast Distance-Based Phylogeny Inference Program}, -year = {2015}, -doi = {10.1093/molbev/msv150}, -abstract ={FastME provides distance algorithms to infer phylogenies. FastME is based on balanced minimum evolution, which is the very principle of Neighbor Joining (NJ). FastME improves over NJ by performing topological moves using fast, sophisticated algorithms. The first version of FastME only included Nearest Neighbor Interchange. The new 2.0 version also includes Subtree Pruning and Regrafting, while remaining as fast as NJ and providing a number of facilities: Distance estimation for DNA and proteins with various models and options, bootstrapping, and parallel computations. 
FastME is available using several interfaces: Command-line (to be integrated in pipelines), PHYLIP-like, and a Web server (http://www.atgc-montpellier.fr/fastme/).}, -URL = {http://mbe.oxfordjournals.org/content/early/2015/07/25/molbev.msv150.abstract}, -eprint = {http://mbe.oxfordjournals.org/content/early/2015/07/25/molbev.msv150.full.pdf+html}, -journal = {Molecular Biology and Evolution} -} - - - + 10.1093/molbev/msv150 + 10.1089/106652702761034136 - - - + \ No newline at end of file