changeset 13:eb53be9a09f4 draft

Uploaded
author timpalpant
date Sat, 19 May 2012 10:36:45 -0400
parents 81d5b81fb3c2
children f58706d4d421
files dist/java-genomics-toolkit.jar galaxy-conf/._BaseAlignCounts.xml galaxy-conf/._DNAPropertyCalculator.xml galaxy-conf/._GeneTrackToBedGraph.xml galaxy-conf/._GeneTrackToWig.xml galaxy-conf/._IntervalAverager.xml galaxy-conf/._LogTransform.xml galaxy-conf/._Phasogram.xml galaxy-conf/._ReadLengthDistributionMatrix.xml galaxy-conf/._StripMatrix.xml galaxy-conf/._WigCorrelate.xml galaxy-conf/._ZScore.xml galaxy-conf/._Zinba.xml galaxy-conf/._galaxyToolRunner.sh galaxy-conf/BaseAlignCounts.xml galaxy-conf/DNAPropertyCalculator.xml galaxy-conf/Downsample.xml galaxy-conf/FastqIlluminaToSanger.xml galaxy-conf/FindNMers.xml galaxy-conf/FindOutlierRegions.xml galaxy-conf/GeneTrackToBedGraph.xml galaxy-conf/GeneTrackToWig.xml galaxy-conf/InterpolateDiscontinuousData.xml galaxy-conf/IntervalAverager.xml galaxy-conf/IntervalLengthDistribution.xml galaxy-conf/IntervalToWig.xml galaxy-conf/LogTransform.xml galaxy-conf/Phasogram.xml galaxy-conf/ReadLengthDistributionMatrix.xml galaxy-conf/StripMatrix.xml galaxy-conf/WaveletTransform.xml galaxy-conf/WigCorrelate.xml galaxy-conf/WigSummary.xml galaxy-conf/ZScore.xml galaxy-conf/Zinba.xml galaxy-conf/galaxyToolRunner.sh lib/java-genomics-io.jar lib/picard-1.67.jar lib/sam-1.56.jar lib/sam-1.67.jar
diffstat 40 files changed, 353 insertions(+), 68 deletions(-) [+]
line wrap: on
line diff
Binary file dist/java-genomics-toolkit.jar has changed
Binary file galaxy-conf/._BaseAlignCounts.xml has changed
Binary file galaxy-conf/._DNAPropertyCalculator.xml has changed
Binary file galaxy-conf/._GeneTrackToBedGraph.xml has changed
Binary file galaxy-conf/._GeneTrackToWig.xml has changed
Binary file galaxy-conf/._IntervalAverager.xml has changed
Binary file galaxy-conf/._LogTransform.xml has changed
Binary file galaxy-conf/._Phasogram.xml has changed
Binary file galaxy-conf/._ReadLengthDistributionMatrix.xml has changed
Binary file galaxy-conf/._StripMatrix.xml has changed
Binary file galaxy-conf/._WigCorrelate.xml has changed
Binary file galaxy-conf/._ZScore.xml has changed
Binary file galaxy-conf/._Zinba.xml has changed
Binary file galaxy-conf/._galaxyToolRunner.sh has changed
--- a/galaxy-conf/BaseAlignCounts.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/BaseAlignCounts.xml	Sat May 19 10:36:45 2012 -0400
@@ -3,12 +3,13 @@
   <command interpreter="sh">galaxyToolRunner.sh ngs.BaseAlignCounts -i $input -a ${chromInfo} -x $X -o $output</command>
   <inputs>
     <param name="input" type="data" format="sam,bam,bed,bedgraph" label="Sequencing reads" />
-    <param name="X" type="integer" value="-1" label="In silico extension (-1 for read length)" />
+    <param name="X" type="integer" value="-1" label="In silico extension (-1 for fragment length)" />
   </inputs>
   <outputs>
     <data name="output" format="wig" />
   </outputs>
-  
+  <tests>
+  </tests>
   <help>
         
 This tool produces a new Wig file with the number of reads/intervals overlapping each base pair. Reads can be artificially extended to match known fragment lengths. If you wish to count the number of reads starting at each base pair, set the read extension to 1. If you wish to count the number of intervals overlapping each base pair, set the extension to -1.
@@ -19,6 +20,10 @@
 
 This tool requires sequencing reads in SAM, BAM, Bed, or BedGraph format. If you are artificially extending reads, ensure that the strand is set correctly in SAM, BAM, and Bed files.
 
+.. class:: warningmark
+
+Paired-end reads are considered to be the entire fragment (the distance from the 5' end of mate 1 to the 5' end of mate 2) if the extension is set to -1.
+
 .. class:: infomark
 
 If you would like to convert valued interval data (e.g. BedGraph files from microarrays) to Wig format, use the Converters -> Interval to Wig converter.
--- a/galaxy-conf/DNAPropertyCalculator.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/DNAPropertyCalculator.xml	Sat May 19 10:36:45 2012 -0400
@@ -81,6 +81,21 @@
       </data>
   </outputs>
   
+  <tests>
+    <test>
+      <param name="genomeSource" value="history"/>
+      <param name="ownFile" value="test.fasta"/>
+      <param name="N" value="false"/>
+      <output name="output" file="twist.wig"/>
+  	</test>
+  	<test>
+      <param name="genomeSource" value="history"/>
+      <param name="ownFile" value="test.fasta"/>
+      <param name="N" value="true"/>
+      <output name="output" file="twist.normalized.wig"/>
+  	</test>
+  </tests>
+  
   <help>
 
 This tool will create a new Wig file with genome-wide calculations of sequence-specific DNA properties determined from local n-nucleotide sequences. DNA properties are calculated using AJT_.
--- a/galaxy-conf/Downsample.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/Downsample.xml	Sat May 19 10:36:45 2012 -0400
@@ -6,8 +6,10 @@
       <param name="window" type="integer" value="100" label="Window size (bp)" />
       <param name="metric" type="select" label="Downsampling method">
       	<option value="mean">Mean</option>
-      	<option value="min">Min</option>
-      	<option value="max">Max</option>
+      	<option value="min">Minimum</option>
+      	<option value="max">Maximum</option>
+      	<option value="coverage">Coverage</option>
+      	<option value="total">Total</option>
       </param>
   </inputs>
   <outputs>
@@ -16,13 +18,23 @@
   
   <help>
 
+This tool can be used to reduce the resolution and file size of Wig files for easier upload to UCSC. Data is downsampled in non-overlapping windows starting from the beginning of each chromosome. Each window can be downsampled as the mean, minimum, maximum, total, or coverage of the original data.
+
+-----
+
+**Downsampling Methods**
+
+- **Mean:** the arithmetic mean of the values in the original data window
+- **Minimum:** the least value in the original data window
+- **Maximum:** the greatest value in the original data window
+- **Coverage:** the fraction of bases with values in the original window
+- **Total:** the sum of all values in the original data window
+
+-----
+
 .. class:: infomark
 
 **TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly.
 
------
-
-This tool can be used to reduce the resolution and file size of Wig files for easier upload to UCSC. Data is downsampled in non-overlapping moving windows starting from the beginning of each chromosome. Each window can be downsampled as the arithmetic mean, minimum, or maximum value of the original data.
-
   </help>
 </tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/galaxy-conf/FastqIlluminaToSanger.xml	Sat May 19 10:36:45 2012 -0400
@@ -0,0 +1,25 @@
+<tool id="FastqIlluminaToSanger" name="Convert Fastq qualities" version="1.0.0">
+  <description>from Illumina to Sanger</description>
+  <command interpreter="sh">galaxyToolRunner.sh converters.FastqIlluminaToSanger -i $input -o $output</command>
+  <inputs>
+      <param name="input" type="data" format="fastqillumina" label="FASTQ, Illumina qualities" />
+  </inputs>
+  <outputs>
+      <data name="output" format="fastqsanger" metadata_source="input" />
+  </outputs>
+  <tests>
+	  <test>
+	    <param name="input" value="test.fastqillumina" ftype="fastqillumina"/>
+	    <output name="output" file="test.fastqsanger"/>
+      </test>
+  </tests>
+<help>
+
+This tool will convert a FASTQ file with ASCII quality scores encoded in Illumina 1.3 format (Phred+64) to Sanger format (Phred+33). It is a simpler, faster version of the FASTQ Groomer.
+
+.. class:: warningmark
+	
+This tool requires fastqillumina formatted data. If you have tabular data that was not correctly autodetected, change the metadata by clicking on the pencil icon for the dataset.
+
+</help>
+</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/galaxy-conf/FindNMers.xml	Sat May 19 10:36:45 2012 -0400
@@ -0,0 +1,43 @@
+<tool id="FindNMers" name="Find NMers" version="1.0.0">
+  <description>in a DNA sequence</description>
+  <command interpreter="sh">galaxyToolRunner.sh dna.FindNMers -i 
+    #if $refGenomeSource.genomeSource == "history":
+      $refGenomeSource.ownFile
+    #else
+      ${refGenomeSource.index.fields.path}
+    #end if
+	-m $mismatches -n $nmer $rc -o $output
+  </command>
+  <inputs>
+    <conditional name="refGenomeSource">
+      <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options">
+        <option value="indexed">Use a built-in index</option>
+        <option value="history">Use one from the history</option>
+      </param>
+      <when value="indexed">
+        <param name="index" type="select" label="Select a reference genome" help="if your genome of interest is not listed - contact Galaxy team">
+          <options from_data_table="sam_fa_indexes">
+            <filter type="sort_by" column="1" />
+            <validator type="no_options" message="No indexes are available" />
+          </options>
+        </param>
+      </when>
+      <when value="history">
+        <param name="ownFile" type="data" format="fasta" metadata_name="dbkey" label="Select the reference genome" />
+      </when>  <!-- history -->
+    </conditional>  <!-- refGenomeSource -->
+    
+    <param name="nmer" type="text" optional="false" label="NMer to search for" />
+    <param name="mismatches" type="integer" value="0" label="Number of allowed mismatches (Hamming distance)" />
+    <param name="rc" type="boolean" checked="true" truevalue="--rc" falsevalue="" label="Search reverse-complement as well" />
+  </inputs>
+  <outputs>
+      <data format="bed" name="output"/>
+  </outputs>
+  
+  <help>
+
+This tool will find all matches of a given NMer in a DNA sequence.
+
+  </help>
+</tool>
--- a/galaxy-conf/FindOutlierRegions.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/FindOutlierRegions.xml	Sat May 19 10:36:45 2012 -0400
@@ -1,10 +1,11 @@
 <tool id="WigFindOutliers" name="Find outlier regions" version="1.0.0">
   <description>such as CNVs</description>
-  <command interpreter="sh">galaxyToolRunner.sh ngs.FindOutlierRegions -i $input -w $window -t $threshold -o $output</command>
+  <command interpreter="sh">galaxyToolRunner.sh ngs.FindOutlierRegions -i $input -w $window -t $threshold $below -o $output</command>
   <inputs>
       <param format="bigwig,wig" name="input" type="data" label="Input data" />
       <param name="window" type="integer" value="150" label="Window size" />
       <param name="threshold" type="float" value="3" label="Threshold (fold times the mean)" />
+      <param name="below" type="boolean" checked="false" truevalue="-b" falsevalue="" label="Search for outliers below the threshold" />
   </inputs>
   <outputs>
       <data format="bed" name="output" metadata_source="input" />
--- a/galaxy-conf/GeneTrackToBedGraph.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/GeneTrackToBedGraph.xml	Sat May 19 10:36:45 2012 -0400
@@ -2,12 +2,17 @@
   <description>converter</description>
   <command interpreter="sh">galaxyToolRunner.sh converters.GeneTrackToBedGraph -i $input -o $output</command>
   <inputs>
-      <param name="input" type="data" format="genetrack" label="Input GeneTrack index" />
+      <param name="input" type="data" format="tabular" label="Input GeneTrack index" />
   </inputs>
   <outputs>
       <data name="output" format="bedgraph" metadata_source="input" />
   </outputs>
-	
+	<tests>
+	  <test>
+	    <param name="input" value="test.genetrack" ftype="tabular"/>
+	    <output name="output" file="geneTrackToBedGraph.bedGraph"/>
+    </test>
+  </tests>
 <help>
 
 This tool will sum the counts from the forward and reverse strands in a GeneTrack_ index to create a BedGraph file.
--- a/galaxy-conf/GeneTrackToWig.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/GeneTrackToWig.xml	Sat May 19 10:36:45 2012 -0400
@@ -2,14 +2,29 @@
   <description>converter</description>
   <command interpreter="sh">galaxyToolRunner.sh converters.GeneTrackToWig -i $input -s $shift $zero -a ${chromInfo} -o $output</command>
   <inputs>
-      <param name="input" type="data" format="genetrack" label="Input GeneTrack index" />
+      <param name="input" type="data" format="tabular" label="Input GeneTrack index" />
       <param name="shift" type="integer" value="0" optional="true" label="Shift +/- strand counts by this amount when merging" />
   	  <param name="zero" type="boolean" checked="false" truevalue="-z" falsevalue="" label="Assume zero where there is no data (default is NaN)" />
   </inputs>
   <outputs>
       <data name="output" format="wig" metadata_source="input" />
   </outputs>
-	
+	<tests>
+	  <test>
+	    <param name="input" value="test.genetrack" ftype="tabular"/>
+	    <param name="shift" value="73"/>
+	    <param name="zero" value="true"/>
+	    <param name="chromInfo" value="sacCer2"/>
+	    <output name="output" file="geneTrackToWig1.wig"/>
+    </test>
+    <test>
+	    <param name="input" value="test.genetrack" ftype="tabular"/>
+	    <param name="shift" value="0"/>
+	    <param name="zero" value="false"/>
+	    <param name="chromInfo" value="sacCer2"/>
+	    <output name="output" file="geneTrackToWig2.wig"/>
+    </test>
+  </tests>
 <help>
   
 This tool will convert GeneTrack_ format files into Wig files, optionally offsetting the + and - strand counts by a specified value before merging them.
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/galaxy-conf/InterpolateDiscontinuousData.xml	Sat May 19 10:36:45 2012 -0400
@@ -0,0 +1,40 @@
+<tool id="WigInterpolate" name="Interpolate" version="1.0.0">
+  <description>missing values in a (Big)Wig file</description>
+  <command interpreter="sh">galaxyToolRunner.sh converters.InterpolateDiscontinousData -i $input -t $type -m $max -o $output</command>
+  <inputs>
+      <param format="bigwig,wig" name="input" type="data" label="Interpolate missing values in" />
+      <param name="type" type="select" label="Interpolation type">
+      	<option value="nearest">Nearest</option>
+      	<option value="linear">Linear</option>
+      	<option value="cubic">Cubic</option>
+      </param>
+      <param name="max" type="integer" value="1000" label="Maximum span of missing values to interpolate (bp)"/>
+  </inputs>
+  <outputs>
+      <data format="wig" name="output" metadata_source="input" />
+  </outputs>
+  
+  <help>
+
+This tool will attempt to interpolate missing values (NaN) in a Wig file that result when converting discontinuous microarray probe data to Wig format. Stretches of missing data that extend longer than the allowed maximum will be left as NaN.
+
+-----
+
+**Interpolation types**
+
+- **Nearest** uses the value of the nearest base pair that has data
+- **Linear** uses a linear interpolant between the values of the nearest two probes
+- **Cubic** uses a cubic interpolant between the values of the nearest two probes
+
+For more information, see Wikipedia_.
+
+.. _Wikipedia: http://en.wikipedia.org/wiki/Interpolation
+
+-----
+
+.. class:: infomark
+
+**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use the Converters -> IntervalToWig tool to convert Bed, BedGraph, or GFF-formatted microarray data to Wig format, then use this tool to interpolate the missing values between probes.
+
+  </help>
+</tool>
--- a/galaxy-conf/IntervalAverager.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/IntervalAverager.xml	Sat May 19 10:36:45 2012 -0400
@@ -1,8 +1,16 @@
 <tool id="IntervalAverager" name="Average intervals" version="1.0.0">
   <description>that have been aligned</description>
-  <command interpreter="sh">galaxyToolRunner.sh visualization.IntervalAverager -i $input -l $loci -o $output</command>
+  <command interpreter="sh">
+    galaxyToolRunner.sh visualization.IntervalAverager -l $loci -o $output $file1
+      #for $input in $inputs
+        ${input.file}
+      #end for
+  </command>
   <inputs>
-      <param format="wig,bigwig" name="input" type="data" label="Sequencing data" />
+      <param name="file1" label="Sequencing data" type="data" format="bigwig,wig" />
+      <repeat name="inputs" title="Additional sequencing data">
+        <param name="file" type="data" format="bigwig,wig" />
+      </repeat>
       <param format="bed" name="loci" type="data" label="List of intervals (with alignment points)" />
   </inputs>
   <outputs>
--- a/galaxy-conf/IntervalLengthDistribution.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/IntervalLengthDistribution.xml	Sat May 19 10:36:45 2012 -0400
@@ -1,8 +1,9 @@
 <tool id="IntervalLengthDistribution" name="Make histogram" version="1.0.0">
   <description>of read lengths</description>
-  <command interpreter="sh">galaxyToolRunner.sh ngs.IntervalLengthDistribution -i $input -o $output</command>
+  <command interpreter="sh">galaxyToolRunner.sh ngs.IntervalLengthDistribution -i $input $freq -o $output</command>
   <inputs>
       <param name="input" type="data" format="sam,bam,bed,bedgraph,gff" label="Reads/Intervals" />
+      <param name="freq" type="boolean" checked="false" truevalue="-f" falsevalue="" label="Output normalized frequencies rather than counts" />
   </inputs>
   <outputs>
       <data format="tabular" name="output" />
--- a/galaxy-conf/IntervalToWig.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/IntervalToWig.xml	Sat May 19 10:36:45 2012 -0400
@@ -2,7 +2,7 @@
   <description>converter</description>
   <command interpreter="sh">galaxyToolRunner.sh converters.IntervalToWig -i $input $zero -a ${chromInfo} -o $output</command>
   <inputs>
-      <param name="input" type="data" format="bed,bedGraph,gff" label="Input Bed/BedGraph/GFF file" />
+      <param name="input" type="data" format="bed,bedgraph,gff" label="Input Bed/BedGraph/GFF file" />
   	  <param name="zero" type="boolean" checked="false" truevalue="-z" falsevalue="" label="Assume zero where there is no data (default is NaN)" />
   </inputs>
   <outputs>
--- a/galaxy-conf/LogTransform.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/LogTransform.xml	Sat May 19 10:36:45 2012 -0400
@@ -9,42 +9,36 @@
     <data format="wig" name="output" metadata_source="input" />
   </outputs>
   <tests>
-    <!--<test>
-	    <param name="input" value="wigmath.input1"/>
+	  <test>
+	    <param name="input" value="wigmath1.wig"/>
 	    <param name="base" value="2"/>
-	    <param name="dbkey" value="sacCer2"/>
-	    <output name="output" file="logger.output1"/>
+	    <output name="output" file="logger1.wig"/>
 	  </test>
 	  <test>
-	    <param name="input" value="wigmath.input1.bw"/>
-	    <param name="base" value="2"/>
-	    <param name="dbkey" value="sacCer2"/>
-	    <output name="output" file="logger.output1"/>
+	    <param name="input" value="wigmath2.wig"/>
+	    <param name="base" value="3"/>
+	    <output name="output" file="logger2.wig"/>
 	  </test>
 	  <test>
-	    <param name="input" value="wigmath.input2"/>
-	    <param name="base" value="2"/>
-	    <param name="dbkey" value="sacCer2"/>
-	    <output name="output" file="logger.output2"/>
+	    <param name="input" value="wigmath3.wig"/>
+	    <param name="base" value="10"/>
+	    <output name="output" file="logger3.wig"/>
 	  </test>
 	  <test>
-	    <param name="input" value="wigmath.input2.bw"/>
+	    <param name="input" value="wigmath1.bw"/>
 	    <param name="base" value="2"/>
-	    <param name="dbkey" value="sacCer2"/>
-	    <output name="output" file="logger.output2"/>
+	    <output name="output" file="logger4.wig"/>
 	  </test>
 	  <test>
-	    <param name="input" value="wigmath.input3"/>
-	    <param name="base" value="10"/>
-	    <param name="dbkey" value="sacCer2"/>
-	    <output name="output" file="logger.output3"/>
+	    <param name="input" value="wigmath2.bw"/>
+	    <param name="base" value="3"/>
+	    <output name="output" file="logger5.wig"/>
 	  </test>
 	  <test>
-	    <param name="input" value="wigmath.input3.bw"/>
+	    <param name="input" value="wigmath3.bw"/>
 	    <param name="base" value="10"/>
-	    <param name="dbkey" value="sacCer2"/>
-	    <output name="output" file="logger.output3"/>
-	  </test>-->
+	    <output name="output" file="logger6.wig"/>
+	  </test>
   </tests>
   
   <help>
--- a/galaxy-conf/Phasogram.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/Phasogram.xml	Sat May 19 10:36:45 2012 -0400
@@ -11,7 +11,7 @@
   
   <help>
 
-This tool calculates the phase distribution of sequencing data. It can be used to identify genome-wide periodicities. Phase counts are aggregated for each base pair across the genome. The tool is a reimplementation of the algorithm described in (Valouev et al. 2011).
+This tool calculates the phase distribution of sequencing data. It can be used to identify genome-wide periodicities. Phase counts are aggregated for each base pair across the genome. This is equivalent to summing the autocovariance of a sliding window across the genome. The tool is a reimplementation of the algorithm described in (Valouev et al. 2011).
 
 .. class:: infomark
 
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/galaxy-conf/ReadLengthDistributionMatrix.xml	Sat May 19 10:36:45 2012 -0400
@@ -0,0 +1,63 @@
+<tool id="ReadLengthDistributionMatrix" name="Create read length distribution matrix" version="1.0.0">
+  <description>across a genomic interval</description>
+  <command interpreter="sh">galaxyToolRunner.sh ngs.ReadLengthDistributionMatrix -i $input --chr $chr --start $start --stop $stop --min $min --max $max --bin $bin -o $output</command>
+  <inputs>
+      <param format="sam,bam,bed,bedgraph" name="input" type="data" label="Mapped reads" />
+      <param name="chr" type="text" label="Chromosome" />
+      <param name="start" type="integer" value="1" label="Start base pair" />
+      <param name="stop" type="integer" value="1000" label="Stop base pair" />
+      <param name="min" type="integer" value="1" label="Minimum fragment length (bp)" />
+      <param name="max" type="integer" value="200" label="Maximum fragment length (bp)" />
+      <param name="bin" type="integer" value="1" label="Fragment length bin size (bp)" />
+  </inputs>
+  <outputs>
+      <data format="tabular" name="output" />
+  </outputs>
+  
+<help>
+  
+This tool will create a matrix (in matrix2png_ format) with the distribution of read lengths over each base pair. Reads are binned by genomic location and length to create a matrix where each column represents the distribution of read lengths over that base pair. The resulting matrix can be turned into heatmap using the Visualization -> Make heatmap with matrix2png tool.
+  
+.. _matrix2png: http://bioinformatics.ubc.ca/matrix2png/dataformat.html
+  
+.. class:: warningmark
+
+This tool requires paired-end SAM, BAM, Bed, or BedGraph formatted data. Using single-end data will result in a constant read length.
+
+-----
+
+**Syntax**
+
+- **Mapped reads** are the mapped paired-end reads used to make the histograms
+- **Chromosome** a locus in the genome
+- **Start base pair** a locus in the genome
+- **Stop base pair** a locus in the genome
+- **Minimum fragment length** is the lowest fragment length bin. Reads shorter than this will be ignored.
+- **Maximum fragment length** is the highest fragment length bin. Reads longer than this will be ignored.
+- **Fragment length bin size** is the bin size used when making the fragment length histograms
+
+-----
+  
+**Example**
+
+Make a matrix with the read length distribution across the region chrI:5001-6000, looking at reads 100-200bp in length in bins of 1bp:
+
+- **Chromosome:** chrI
+- **Start:** 5001
+- **Stop:** 6000
+- **Minimum fragment length:** 100
+- **Maximum fragment length:** 200
+- **Fragment length bin size:** 1
+
+The resulting matrix will be 1000x101, with each column representing a base pair and each row representing a read length. The column headers give the base pair and the row headers give the read length.
+
+-----
+
+**Citation**
+
+This tool was inspired by the analysis and figures in 
+
+Floer M, Wang X, Prabhu V, Berrozpe G, Narayan S, Spagna D, Alvarez D, Kendall J, Krasnitz A, Stepansky A, Hicks J, Bryant GO and Ptashne M (2010) A RSC/nucleosome complex determines chromatin architecture and facilitates activator binding. Cell 141: 407–418
+
+</help>
+</tool>
--- a/galaxy-conf/StripMatrix.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/StripMatrix.xml	Sat May 19 10:36:45 2012 -0400
@@ -9,8 +9,8 @@
   </outputs>
   <tests>
     <test>
-      <param name="input" value="stripMatrix.input"/>
-	    <output name="output" file="stripMatrix.output"/>
+      <param name="input" value="test.matrix2png.txt"/>
+	    <output name="output" file="stripMatrix.txt"/>
     </test>
   </tests>
   
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/galaxy-conf/WaveletTransform.xml	Sat May 19 10:36:45 2012 -0400
@@ -0,0 +1,21 @@
+<tool id="WaveletTransform" name="Wavelet analysis" version="1.0.0">
+  <description>across a genomic interval</description>
+  <command interpreter="sh">galaxyToolRunner.sh ngs.WaveletTransform -i $input -w $wavelet --chr $chr --start $start --stop $stop --min $min --max $max --step $N -o $output</command>
+  <inputs>
+      <param format="wig,bigwig" name="input" type="data" label="Sequencing data" />
+      <param format="tabular" name="wavelet" type="data" label="Wavelet" />
+      <param name="chr" type="text" label="Chromosome" />
+      <param name="start" type="integer" value="1" label="Start base pair" />
+      <param name="stop" type="integer" value="1000" label="Stop base pair" />
+      <param name="min" type="integer" value="10" label="Minimum wavelet size (bp)" />
+      <param name="max" type="integer" value="400" label="Maximum wavelet size (bp)" />
+      <param name="N" type="integer" value="1" label="Step size (bp)" />
+  </inputs>
+  <outputs>
+      <data format="tabular" name="output" />
+  </outputs>
+  
+<help>
+  
+</help>
+</tool>
--- a/galaxy-conf/WigCorrelate.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/WigCorrelate.xml	Sat May 19 10:36:45 2012 -0400
@@ -1,7 +1,7 @@
 <tool id="WigCorrelate" name="Correlate" version="1.0.0">
   <description>multiple (Big)Wig files</description>
   <command interpreter="sh">
-    galaxyToolRunner.sh wigmath.WigCorrelate -w $window -t $type -o $output
+    galaxyToolRunner.sh wigmath.WigCorrelate -w $window -s $step -t $type -o $output
       #for $input in $inputs
         ${input.file}
       #end for
@@ -11,6 +11,7 @@
         <param name="file" type="data" format="bigwig,wig" />
       </repeat>
       <param name="window" type="integer" value="100" label="Window size (bp)" />
+      <param name="step" type="integer" value="50" label="Sliding step size (bp)" />
       <param name="type" type="select" label="Correlation metric">
       	<option value="pearson">Pearson</option>
       	<option value="spearman">Spearman</option>
@@ -22,7 +23,7 @@
   
 <help>
   
-This tool will compute a correlation matrix between the supplied Wig or BigWig files. Each row/column in the matrix is added in the order that files are added above, starting from the top left. The Wig file is downsampled into non-overlapping windows with the specified size by computing the mean value in each window. These windows are then correlated using either  Pearson_'s Product-Moment correlation coefficient or Spearman_'s rank correlation coefficient. If the window size is set to 1, the correlation is calculated between all base pairs in the genome.
+This tool will compute a correlation matrix between the supplied Wig or BigWig files. Each row/column in the matrix is added in the order that files are added above, starting from the top left. The Wig file is downsampled into sliding windows with the specified bin size and shift by computing the mean value in each window. These windows are then correlated using either Pearson_'s Product-Moment correlation coefficient or Spearman_'s rank correlation coefficient. If the window size is set to 1, the correlation is calculated between all base pairs in the genome.
   
 .. _Pearson: http://en.wikipedia.org/wiki/Pearson_product-moment_correlation_coefficient
 
@@ -30,6 +31,15 @@
   
 -----
 
+**Syntax**
+
+- **Inputs** are the genomic data to correlate
+- **Window size** is the size of the window to bin data into
+- **Sliding step size** is the shift step size of the sliding window used during binning
+- **Correlation metric** is the type of correlation to calculate
+  
+-----
+
 .. class:: warningmark
 
 **WARN:** In order to calculate the correlation coefficient, the data is loaded into entirely into memory. For large genomes, this may require a lot of RAM unless comparably larger window sizes are used.
--- a/galaxy-conf/WigSummary.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/WigSummary.xml	Sat May 19 10:36:45 2012 -0400
@@ -7,6 +7,20 @@
   <outputs>
       <data format="txt" name="output" />
   </outputs>
+  <tests>
+      <test>
+      	<param name="input" value="wigmath1.wig"/>
+      	<output name="output" file="wigsummary1.txt"/>
+      </test>
+      <test>
+      	<param name="input" value="test.wig"/>
+      	<output name="output" file="wigsummary2.txt"/>
+      </test>
+      <test>
+      	<param name="input" value="test.bw"/>
+      	<output name="output" file="wigsummary3.txt"/>
+      </test>
+  </tests>
   
 <help>
   
--- a/galaxy-conf/ZScore.xml	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/ZScore.xml	Sat May 19 10:36:45 2012 -0400
@@ -8,36 +8,30 @@
       <data format="wig" name="output" metadata_source="input" />
   </outputs>
   <tests>
-    <!--<test>
-	    <param name="input" value="wigmath.input1"/>
-	    <param name="dbkey" value="sacCer2"/>
-	    <output name="output" file="zscorer.output1"/>
+	  <test>
+	    <param name="input" value="wigmath1.wig"/>
+	    <output name="output" file="zscorer1.wig"/>
 	  </test>
 	  <test>
-	    <param name="input" value="wigmath.input1.bw"/>
-	    <param name="dbkey" value="sacCer2"/>
-	    <output name="output" file="zscorer.output1"/>
+	    <param name="input" value="wigmath2.wig"/>
+	    <output name="output" file="zscorer2.wig"/>
 	  </test>
 	  <test>
-	    <param name="input" value="wigmath.input2"/>
-	    <param name="dbkey" value="sacCer2"/>
-	    <output name="output" file="zscorer.output2"/>
+	    <param name="input" value="wigmath3.wig"/>
+	    <output name="output" file="zscorer3.wig"/>
 	  </test>
 	  <test>
-	    <param name="input" value="wigmath.input2.bw"/>
-	    <param name="dbkey" value="sacCer2"/>
-	    <output name="output" file="zscorer.output2"/>
+	    <param name="input" value="wigmath1.bw"/>
+	    <output name="output" file="zscorer4.wig"/>
 	  </test>
 	  <test>
-	    <param name="input" value="wigmath.input3"/>
-	    <param name="dbkey" value="sacCer2"/>
-	    <output name="output" file="zscorer.output3"/>
+	    <param name="input" value="wigmath2.bw"/>
+	    <output name="output" file="zscorer5.wig"/>
 	  </test>
 	  <test>
-	    <param name="input" value="wigmath.input3.bw"/>
-	    <param name="dbkey" value="sacCer2"/>
-	    <output name="output" file="zscorer.output3"/>
-	  </test>-->
+	    <param name="input" value="wigmath3.bw"/>
+	    <output name="output" file="zscorer6.wig"/>
+	  </test>
   </tests>
   
   <help>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/galaxy-conf/Zinba.xml	Sat May 19 10:36:45 2012 -0400
@@ -0,0 +1,16 @@
+<tool id="Zinba" name="Call peaks" version="1.0.0">
+  <description>with ZINBA</description>
+  <command interpreter="sh">runZINBA.sh -i $input -o $output</command>
+  <inputs>
+      <param format="bed" name="reads" type="data" label="Mapped reads (in BED format)" />
+      <param format="wig" name="basecount" type="data" label="Coverage track (base align counts)" />
+      
+  </inputs>
+  <outputs>
+      <data format="wig" name="output" metadata_source="input" />
+  </outputs>
+  <help>
+
+
+  </help>
+</tool>
--- a/galaxy-conf/galaxyToolRunner.sh	Wed Apr 25 16:53:48 2012 -0400
+++ b/galaxy-conf/galaxyToolRunner.sh	Sat May 19 10:36:45 2012 -0400
@@ -6,9 +6,12 @@
   exit;
 fi
 
-if [ "$1" = "list" ]
-then
-  find src/edu/unc/genomics/**/*.java -exec basename -s .java {} \;
+# Verify that the user has Java 7 installed
+# Otherwise there will be an obscure UnsupportedClassVersion error
+version=$(java -version 2>&1 | awk -F '"' '/version/ {print $2}')
+if [[ "$version" < "1.7" ]]; then
+    echo "Need Java 7 or greater. You have Java $version installed."
+    exit
 fi
 
 DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )"
Binary file lib/java-genomics-io.jar has changed
Binary file lib/picard-1.67.jar has changed
Binary file lib/sam-1.56.jar has changed
Binary file lib/sam-1.67.jar has changed