# HG changeset patch # User pjbriggs # Date 1448640388 18000 # Node ID 3c5f10f7dd407c34b7e60e755100e6715867a8f3 # Parent 571cb77ab9e797867495a5a2089b9e020e541c4f Updated to tool version 2.0.1 (use data table to locate freqfiles). diff -r 571cb77ab9e7 -r 3c5f10f7dd40 README.rst --- a/README.rst Tue Dec 09 11:27:19 2014 -0500 +++ b/README.rst Fri Nov 27 11:06:28 2015 -0500 @@ -30,7 +30,12 @@ -You will also need to install ``weeder2`` from: +You also need to make a copy of the ``weeder2.loc`` file (a sample version is +provided here) which lists the species for which frequency files are available. +This file should be placed in the ``tool-data`` directory of your Galaxy +installation. + +Additionally you will need to install ``weeder2`` from: - http://159.149.160.51/modtools/downloads/weeder2.html @@ -41,20 +46,41 @@ Also the directory holding the Weeder2 executables should be on your ``PATH``. +Functional tests +================ + If you want to run the functional tests, copy the sample test files under sample test files under Galaxy's ``test-data/`` directory. Then: - ./run_tests.sh -id trimmomatic + ./run_tests.sh -id weeder2 You will need to have set the environment variables above. +Reference Data +============== + +Weeder2 requires reference data in the form of frequency files for each +species of interest. A set of reference files is provided as part of the +Weeder2 installation. + +Additional frequency files can be generated for novel species using the +``w2frequency_maker`` utility available via: + +- http://159.149.160.51/weederaddons/weeder2freq.html + +This page also explains what input data should be used. + +The location of the additional frequency files can then be specified by +adding them to the ``weeder2.loc`` file (see above). + History ======= ========== ====================================================================== Version Changes ---------- ---------------------------------------------------------------------- -2.0.0.0 - Initial version +2.0.1 - Explicitly specify frequency files in ``weeder2.loc``. +2.0.0 - Initial version ========== ====================================================================== diff -r 571cb77ab9e7 -r 3c5f10f7dd40 test-data/weeder2.loc --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/weeder2.loc Fri Nov 27 11:06:28 2015 -0500 @@ -0,0 +1,5 @@ +HS Homo sapiens (HS) . +MM Mus musculus (MM) . +DM Drosophila melanogaster (DM) . +SC Saccharomyces cerevisiae (SC) . +AT Arabidopsis thaliana (AT) . diff -r 571cb77ab9e7 -r 3c5f10f7dd40 tool-data/weeder2.loc.sample --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool-data/weeder2.loc.sample Fri Nov 27 11:06:28 2015 -0500 @@ -0,0 +1,35 @@ +# This is a sample file distributed with Galaxy that is used by the +# weeder2 tool to find the frequency files. +# +# The weeder.loc file has this format (white space characters are TAB +# characters): +# +# +# +# should be a period ('.') to indicate the +# frequency files that come as standard with weeder2; otherwise +# it should be the full path to the directory holding a custom +# set of .freq files. +# +# For example: +# +#AF Aspergillus fumigatus (AF) /home/galaxy/weeder/FreqFiles +# +# where '/home/galaxy/weeder/FreqFiles' would contain: +# +#-rw-rw-r-- 1 pjb pjb 20109718 Oct 23 13:16 AF_ds.10.freq +#-rw-rw-r-- 1 pjb pjb 47080 Oct 23 13:15 AF_ds.6.freq +#-rw-rw-r-- 1 pjb pjb 1006374 Oct 23 13:15 AF_ds.8.freq +#-rw-rw-r-- 1 pjb pjb 19930169 Oct 23 13:16 AF_ss.10.freq +#-rw-rw-r-- 1 pjb pjb 45262 Oct 23 13:16 AF_ss.6.freq +#-rw-rw-r-- 1 pjb pjb 984583 Oct 23 13:16 AF_ss.8.freq +# +# Entries are already provided for the standard frequency files that +# are distributed with Weeder2. +# This file should be placed in galaxy's tool-data directory when the +# weeder2 tool is installed. +HS Homo sapiens (HS) . +MM Mus musculus (MM) . +DM Drosophila melanogaster (DM) . +SC Saccharomyces cerevisiae (SC) . +AT Arabidopsis thaliana (AT) . diff -r 571cb77ab9e7 -r 3c5f10f7dd40 tool_data_table_conf.xml.sample --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool_data_table_conf.xml.sample Fri Nov 27 11:06:28 2015 -0500 @@ -0,0 +1,6 @@ + + + value, name, path + +
+
\ No newline at end of file diff -r 571cb77ab9e7 -r 3c5f10f7dd40 tool_data_table_conf.xml.test --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool_data_table_conf.xml.test Fri Nov 27 11:06:28 2015 -0500 @@ -0,0 +1,6 @@ + + + value, name, path + +
+
\ No newline at end of file diff -r 571cb77ab9e7 -r 3c5f10f7dd40 weeder2_wrapper.sh --- a/weeder2_wrapper.sh Tue Dec 09 11:27:19 2014 -0500 +++ b/weeder2_wrapper.sh Fri Nov 27 11:06:28 2015 -0500 @@ -2,31 +2,40 @@ # # Wrapper script to run weeder2 as a Galaxy tool # -# Usage: weeder_wrapper.sh FASTA_IN SPECIES_CODE MOTIFS_OUT MATRIX_OUT [ ARGS... ] +# Usage: weeder_wrapper.sh FASTA_IN SPECIES_CODE FREQFILES_DIR MOTIFS_OUT MATRIX_OUT [ ARGS... ] # # ARGS: one or more arguments to supply directly to weeder2 # # Process command line FASTA_IN=$1 SPECIES_CODE=$2 -MOTIFS_OUT=$3 -MATRIX_OUT=$4 +FREQFILES_DIR=$3 +MOTIFS_OUT=$4 +MATRIX_OUT=$5 # # Other arguments ARGS="" -while [ ! -z "$5" ] ; do - ARGS="$ARGS $5" +while [ ! -z "$6" ] ; do + ARGS="$ARGS $6" shift done # # Link to input file ln -s $FASTA_IN # +# Locate the FreqFiles directory +if [ $FREQFILES_DIR == "." ] ; then + # Use the files in the Weeder2 distribution + freqfiles_dir=$WEEDER_FREQFILES_DIR +else + # Alternative location + freqfiles_dir=$FREQFILES_DIR +fi +# # Link to the FreqFiles directory as weeder2 executable # expects it to be the same directory -freqfiles_dir=$WEEDER_FREQFILES_DIR if [ -d $freqfiles_dir ] ; then - echo "Linking to FreqFiles directory" + echo "Linking to FreqFiles directory: $freqfiles_dir" ln -s $freqfiles_dir FreqFiles else echo "ERROR FreqFiles directory not found" >&2 diff -r 571cb77ab9e7 -r 3c5f10f7dd40 weeder2_wrapper.xml --- a/weeder2_wrapper.xml Tue Dec 09 11:27:19 2014 -0500 +++ b/weeder2_wrapper.xml Fri Nov 27 11:06:28 2015 -0500 @@ -1,7 +1,10 @@ - + Motif discovery in sequences from coregulated genes of a single species + + weeder + weeder2_wrapper.sh - $sequence_file $species_code + $sequence_file $species_code ${species_code.fields.path} $output_motifs_file $output_matrix_file $strands #if $chipseq.use_chipseq @@ -13,21 +16,12 @@ -sim $advanced_options.sim_threshold -em $advanced_options.em_cycles #end if - - - weeder - + - - - - - - + +