Mercurial > repos > timpalpant > java_genomics_toolkit
changeset 23:01d5d20eaadd draft
Deleted selected files
author | timpalpant |
---|---|
date | Tue, 19 Jun 2012 22:14:11 -0400 |
parents | 727fbba02ef7 |
children | a77e126ae856 |
files | dist/java-genomics-toolkit.jar galaxy-conf/._Add.xml galaxy-conf/._Autocorrelation.xml galaxy-conf/._Average.xml galaxy-conf/._BaseAlignCounts.xml galaxy-conf/._Correlate.xml galaxy-conf/._DNAPropertyCalculator.xml galaxy-conf/._Divide.xml galaxy-conf/._Downsample.xml galaxy-conf/._DynaPro.xml galaxy-conf/._FastqIlluminaToSanger.xml galaxy-conf/._FindAbsoluteMaxima.xml galaxy-conf/._FindBoundaryNucleosomes.xml galaxy-conf/._FindNMers.xml galaxy-conf/._FindOutlierRegions.xml galaxy-conf/._GaussianSmooth.xml galaxy-conf/._GeneTrackToBedGraph.xml galaxy-conf/._GeneTrackToWig.xml galaxy-conf/._GreedyCaller.xml galaxy-conf/._InterpolateDiscontinuousData.xml galaxy-conf/._IntervalAverager.xml galaxy-conf/._IntervalLengthDistribution.xml galaxy-conf/._IntervalStats.xml galaxy-conf/._IntervalToBed.xml galaxy-conf/._IntervalToWig.xml galaxy-conf/._KMeans.xml galaxy-conf/._LogTransform.xml galaxy-conf/._MapDyads.xml galaxy-conf/._MatrixAligner.xml galaxy-conf/._MovingAverageSmooth.xml galaxy-conf/._Multiply.xml galaxy-conf/._PercusDecomposition.xml galaxy-conf/._Phasogram.xml galaxy-conf/._PowerSpectrum.xml galaxy-conf/._ReadLengthDistributionMatrix.xml galaxy-conf/._RollingReadLength.xml galaxy-conf/._RomanNumeralize.xml galaxy-conf/._Scale.xml galaxy-conf/._Shift.xml galaxy-conf/._StripMatrix.xml galaxy-conf/._Subtract.xml galaxy-conf/._Summary.xml galaxy-conf/._ValueDistribution.xml galaxy-conf/._WaveletTransform.xml galaxy-conf/._ZScore.xml galaxy-conf/._galaxyToolRunner.sh galaxy-conf/._log4j.properties galaxy-conf/._matrix2png.xml galaxy-conf/Add.xml galaxy-conf/Autocorrelation.xml galaxy-conf/Average.xml galaxy-conf/BaseAlignCounts.xml galaxy-conf/Correlate.xml galaxy-conf/DNAPropertyCalculator.xml galaxy-conf/Divide.xml galaxy-conf/Downsample.xml galaxy-conf/DynaPro.xml galaxy-conf/ExtractDataFromRegion.xml galaxy-conf/FastqIlluminaToSanger.xml galaxy-conf/FindAbsoluteMaxima.xml galaxy-conf/FindBoundaryNucleosomes.xml galaxy-conf/FindNMers.xml 
galaxy-conf/FindOutlierRegions.xml galaxy-conf/GaussianSmooth.xml galaxy-conf/GeneTrackToBedGraph.xml galaxy-conf/GeneTrackToWig.xml galaxy-conf/GreedyCaller.xml galaxy-conf/InterpolateDiscontinuousData.xml galaxy-conf/IntervalAverager.xml galaxy-conf/IntervalLengthDistribution.xml galaxy-conf/IntervalStats.xml galaxy-conf/IntervalToBed.xml galaxy-conf/IntervalToWig.xml galaxy-conf/KMeans.xml galaxy-conf/LogTransform.xml galaxy-conf/MapDyads.xml galaxy-conf/MatrixAligner.xml galaxy-conf/MovingAverageSmooth.xml galaxy-conf/Multiply.xml galaxy-conf/PairOverlappingNucleosomes.xml galaxy-conf/PercusDecomposition.xml galaxy-conf/Phasogram.xml galaxy-conf/PowerSpectrum.xml galaxy-conf/ReadLengthDistributionMatrix.xml galaxy-conf/RollingReadLength.xml galaxy-conf/RomanNumeralize.xml galaxy-conf/Scale.xml galaxy-conf/Shift.xml galaxy-conf/StripMatrix.xml galaxy-conf/Subtract.xml galaxy-conf/Summary.xml galaxy-conf/ValueDistribution.xml galaxy-conf/WaveletTransform.xml galaxy-conf/ZScore.xml galaxy-conf/galaxyToolRunner.sh galaxy-conf/log4j.properties galaxy-conf/matrix2png.xml lib/BigWig.jar lib/commons-lang3-3.1.jar lib/commons-math3-3.0.jar lib/dnaproperties-1732.jar lib/hamcrest-core-1.1.0.jar lib/java-genomics-io.jar lib/jcommander-1.27.jar lib/jtransforms-2.4.jar lib/junit.jar lib/log4j-1.2.15.jar lib/picard-1.67.jar lib/sam-1.67.jar sam_fa_indices.loc.sample tool_data_table_conf.xml.sample |
diffstat | 111 files changed, 0 insertions(+), 2269 deletions(-) [+] |
line wrap: on
line diff
--- a/galaxy-conf/Add.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,27 +0,0 @@ -<tool id="WigAdd" name="Add" version="1.1.0"> - <description>multiple (Big)Wig files</description> - <command interpreter="sh"> - galaxyToolRunner.sh wigmath.Add -o $output - #for $input in $inputs - ${input.file} - #end for - </command> - <inputs> - <repeat name="inputs" title="(Big)Wig file"> - <param name="file" type="data" format="bigwig,wig" /> - </repeat> - </inputs> - <outputs> - <data format="wig" name="output" /> - </outputs> - -<help> - -This tool will add all values in the specified Wig files base pair by base pair. - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - -</help> -</tool>
--- a/galaxy-conf/Autocorrelation.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,40 +0,0 @@ -<tool id="Autocovariance" name="Compute the autocovariance" version="2.0.0"> - <description>of data in a Wiggle file</description> - <command interpreter="sh">galaxyToolRunner.sh ngs.Autocorrelation -i $input -l $windows -m $max -o $output</command> - <inputs> - <param format="bigwig,wig" name="input" type="data" label="Input data" /> - <param format="bed,bedgraph,gff" name="windows" type="data" label="List of intervals" /> - <param name="max" type="integer" value="200" label="Maximum shift" /> - </inputs> - <outputs> - <data format="tabular" name="output" /> - </outputs> - -<help> - -This tool computes the unnormalized autocovariance_ of intervals of data in a Wig file. - -.. _autocovariance: http://en.wikipedia.org/wiki/Autocorrelation - ------ - -**Syntax** - -- **Input data** is the genomic data on which to compute the autocorrelation. -- **List of intervals:** The autocorrelation will be computed for each genomic interval specified in this list. -- **Maximum shift:** In computing the autocorrelation, the data will be phase-shifted up to this limit. - ------ - -.. class:: infomark - -**TIP:** For more information, see Wikipedia_ (right click to open this link in another window). - -.. _Wikipedia: http://en.wikipedia.org/wiki/Autocorrelation - -.. class:: infomark - -**TIP:** If your input data does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format. Similarly, the intervals must be in either Bed, BedGraph, or GFF format. - -</help> -</tool>
--- a/galaxy-conf/Average.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,33 +0,0 @@ -<tool id="WigAvg" name="Average" version="1.1.0"> - <description>multiple (Big)Wig files</description> - <command interpreter="sh"> - galaxyToolRunner.sh wigmath.Average -o $output $file1 $file2 - #for $input in $inputs - ${input.file} - #end for - </command> - <inputs> - <param name="file1" label="(Big)Wig file 1" type="data" format="bigwig,wig" /> - <param name="file2" label="(Big)Wig file 2" type="data" format="bigwig,wig" /> - <repeat name="inputs" title="Additional (Big)Wig file"> - <param name="file" type="data" format="bigwig,wig" /> - </repeat> - </inputs> - <outputs> - <data format="wig" name="output" /> - </outputs> - <tests> - <!-- TODO --> - </tests> - - -<help> - -This tool will average the values of the provided Wig files, base pair by base pair. - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - -</help> -</tool>
--- a/galaxy-conf/BaseAlignCounts.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,43 +0,0 @@ -<tool id="BaseAlignCounts" name="Calculate coverage" version="2.0.0"> - <description>of sequencing reads</description> - <command interpreter="sh">galaxyToolRunner.sh ngs.BaseAlignCounts -i $input -a ${chromInfo} -x $X -o $output</command> - <inputs> - <param name="input" type="data" format="sam,bam,bed,bedgraph" label="Sequencing reads" /> - <param name="X" type="integer" value="-1" label="In silico extension (-1 for fragment length)" /> - </inputs> - <outputs> - <data name="output" format="wig" /> - </outputs> - <tests> - </tests> - <help> - -This tool produces a new Wig file with the number of reads/intervals overlapping each base pair. Reads can be artificially extended to match known fragment lengths. If you wish to count the number of reads starting at each base pair, set the read extension to 1. If you wish to count the number of intervals overlapping each base pair, set the extension to -1. - ------ - -.. class:: warningmark - -This tool requires sequencing reads in SAM, BAM, Bed, or BedGraph format. If you are artificially extending reads, ensure that the strand is set correctly in SAM, BAM, and Bed files. - -.. class:: warningmark - -Paired-end reads are considered to be the entire fragment (the distance from the 5' end of mate 1 to the 5' end of mate 2) if the extension is set to -1. - -.. class:: infomark - -If you would like to convert valued interval data (e.g. BedGraph files from microarrays) to Wig format, use the Converters -> Interval to Wig converter. - -.. class:: infomark - -**TIP:** If you are going to be using reads in SAM format for multiple analyses, it is often more efficient to first convert it into BAM format using NGS: SAM Tools -> SAM-to-BAM. - ------ - -**Syntax** - -- **Sequencing reads** are mapped reads from a high-throughput sequencing experiment. 
-- **In silico extension:** Reads will be artificially extended from their 5' end to be this length. - - </help> -</tool>
--- a/galaxy-conf/Correlate.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,60 +0,0 @@ -<tool id="WigCorrelate" name="Correlate" version="1.1.0"> - <description>multiple (Big)Wig files</description> - <command interpreter="sh"> - galaxyToolRunner.sh wigmath.Correlate -w $window -s $step -t $type -o $output $file1 $file2 - #for $input in $inputs - ${input.file} - #end for - </command> - <inputs> - <param name="file1" label="(Big)Wig file 1" type="data" format="bigwig,wig" /> - <param name="file2" label="(Big)Wig file 2" type="data" format="bigwig,wig" /> - <repeat name="inputs" title="Additional (Big)Wig file"> - <param name="file" type="data" format="bigwig,wig" /> - </repeat> - <param name="window" type="integer" value="100" label="Window size (bp)" /> - <param name="step" type="integer" value="50" label="Sliding step size (bp)" /> - <param name="type" type="select" label="Correlation metric"> - <option value="pearson">Pearson</option> - <option value="spearman">Spearman</option> - </param> - </inputs> - <outputs> - <data format="tabular" name="output" /> - </outputs> - -<help> - -This tool will compute a correlation matrix between the supplied Wig or BigWig files. Each row/column in the matrix is added in the order that files are added above, starting from the top left. The Wig file is downsampled into sliding windows with the specified bin size and shift by computing the mean value in each window. These windows are then correlated using either Pearson_'s Product-Moment correlation coefficient or Spearman_'s rank correlation coefficient. If the window size is set to 1, the correlation is calculated between all base pairs in the genome. - -.. _Pearson: http://en.wikipedia.org/wiki/Pearson_product-moment_correlation_coefficient - -.. 
_Spearman: http://en.wikipedia.org/wiki/Spearman%27s_rank_correlation_coefficient - ------ - -**Syntax** - -- **Inputs** are the genomic data to correlate -- **Window size** is the size of the window to bin data into -- **Sliding step size** is the shift step size of the sliding window used during binning -- **Correlation metric** is the type of correlation to calculate - ------ - -.. class:: warningmark - -**WARN:** In order to calculate the correlation coefficient, the data is loaded entirely into memory. For large genomes, this may require a lot of RAM unless comparably larger window sizes are used. - ------ - -**Citation** - -This tool was inspired by ACT_ from the Gerstein lab. - -.. _ACT: http://act.gersteinlab.org - -J Jee*, J Rozowsky*, KY Yip*, L Lochovsky, R Bjornson, G Zhong, Z Zhang, Y Fu, J Wang, Z Weng, M Gerstein. ACT: Aggregation and Correlation Toolbox for Analyses of Genome Tracks. (2011) Bioinformatics 27(8): 1152-4. - -</help> -</tool>
--- a/galaxy-conf/DNAPropertyCalculator.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,114 +0,0 @@ -<tool id="DNAPropertyCalculator" name="Calculate sequence-specific DNA properties" version="2.0.0"> - <description>for a genome</description> - <command interpreter="sh">galaxyToolRunner.sh dna.DNAPropertyCalculator -i - #if $refGenomeSource.genomeSource == "history": - $refGenomeSource.ownFile - #else - ${refGenomeSource.index.fields.path} - #end if - $N -p $property -o $output - </command> - <inputs> - <conditional name="refGenomeSource"> - <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options"> - <option value="indexed">Use a built-in index</option> - <option value="history">Use one from the history</option> - </param> - <when value="indexed"> - <param name="index" type="select" label="Select a reference genome" help="if your genome of interest is not listed - contact Galaxy team"> - <options from_data_table="sam_fa_indexes"> - <filter type="sort_by" column="1" /> - <validator type="no_options" message="No indexes are available" /> - </options> - </param> - </when> - <when value="history"> - <param name="ownFile" type="data" format="fasta" metadata_name="dbkey" label="Select the reference genome" /> - </when> <!-- history --> - </conditional> <!-- refGenomeSource --> - - <param name="property" type="select" label="Property to calculate"> - <option value="ATG-density">ATG</option> - <option value="G-content">G</option> - <option value="C-content">C</option> - <option value="T-content">T</option> - <option value="A-content">A</option> - <option value="GC-content">GC</option> - <option value="AT-content">AT</option> - <option value="Pyrimidine-content">Pyrimidine</option> - <option value="Purine-content">Purine</option> - <option value="Bendability">Bendability</option> - <option value="zDNA">zDNA</option> 
- <option value="DuplexStabilityFreeEnergy">Duplex Stability Free Energy</option> - <option value="DuplexStabilityDisruptEnergy">Duplex Stability Disrupt Energy</option> - <option value="DNADenaturation">DNA Denaturation</option> - <option value="PropellorTwist">Propellor Twist</option> - <option value="BaseStacking">Base Stacking</option> - <option value="ProteinDeformation">Protein Deformation</option> - <option value="BendingStiffness">Bending Stiffness</option> - <option value="ProteinDNATwist">Protein DNA Twist</option> - <option value="bDNATwist">bDNA Twist</option> - <option value="APhilicity">APhilicity</option> - <option value="NucleosomePosition">Nucleosome Position (trinucleotide model)</option> - <option value="Twist">Twist</option> - <option value="Tilt">Tilt</option> - <option value="Roll">Roll</option> - <option value="Slide">Slide</option> - <option value="Rise">Rise</option> - </param> - - <param name="N" type="boolean" checked="true" truevalue="-n" falsevalue="" label="Output normalized values" /> - </inputs> - <outputs> - <data format="wig" name="output" label="Calculate ${property.value_label}"> - <actions> - <conditional name="refGenomeSource.genomeSource"> - <when value="indexed"> - <action type="metadata" name="dbkey"> - <option type="from_data_table" name="sam_fa_indexes" column="1" offset="0"> - <filter type="param_value" column="0" value="#" compare="startswith" keep="False"/> - <filter type="param_value" ref="refGenomeSource.index" column="0"/> - </option> - </action> - </when> - <when value="history"> - <action type="metadata" name="dbkey"> - <option type="from_param" name="refGenomeSource.ownFile" param_attribute="dbkey" /> - </action> - </when> - </conditional> - </actions> - </data> - </outputs> - - <tests> - <test> - <param name="genomeSource" value="history"/> - <param name="ownFile" value="test.fasta"/> - <param name="property" value="Twist"/> - <param name="N" value="false"/> - <output name="output" file="twist.wig"/> - </test> - 
<test> - <param name="genomeSource" value="history"/> - <param name="ownFile" value="test.fasta"/> - <param name="property" value="Twist"/> - <param name="N" value="true"/> - <output name="output" file="twist.normalized.wig"/> - </test> - </tests> - - <help> - -This tool will create a new Wig file with genome-wide calculations of sequence-specific DNA properties determined from local n-nucleotide sequences. DNA properties are calculated using AJT_. - -.. _AJT: http://www.abeel.be/ajt - ------ - -**Example** - -To calculate GC-content, choose your genome assembly and select "GC" as the property. This will create a new Wig file in which G and C nucleotides are represented by 1, while A and T nucleotides are represented by -1. If you would like to compute GC-content in 10-bp windows, use the WigMath -> Moving average tool to compute a moving average with 10bp windows. - - </help> -</tool>
--- a/galaxy-conf/Divide.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,36 +0,0 @@ -<tool id="WigDivide" name="Divide" version="1.1.0"> - <description>two (Big)Wig files</description> - <command interpreter="sh">galaxyToolRunner.sh wigmath.Divide -n $dividend -d $divisor -o $output</command> - <inputs> - <param format="bigwig,wig" name="dividend" type="data" label="File 1 (dividend)" /> - <param format="bigwig,wig" name="divisor" type="data" label="File 2 (divisor)" /> - </inputs> - <outputs> - <data format="wig" name="output" metadata_source="dividend" /> - </outputs> - <tests> - <test> - <param name="dividend" value="wigmath1.wig"/> - <param name="divisor" value="wigmath2.wig"/> - <output name="output" file="divide1.wig"/> - </test> - <test> - <param name="dividend" value="wigmath1.wig"/> - <param name="divisor" value="wigmath3.bw"/> - <output name="output" file="divide2.wig"/> - </test> - <test> - <param name="dividend" value="wigmath3.bw"/> - <param name="divisor" value="wigmath2.bw"/> - <output name="output" file="divide3.wig"/> - </test> - </tests> - - <help> - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - - </help> -</tool>
--- a/galaxy-conf/Downsample.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,61 +0,0 @@ -<tool id="WigDownsample" name="Downsample" version="1.1.0"> - <description>a (Big)Wig file</description> - <command interpreter="sh">galaxyToolRunner.sh wigmath.Downsample -i $input -m $metric -w $window -o $output</command> - <inputs> - <param format="bigwig,wig" name="input" type="data" label="Original data" /> - <param name="window" type="integer" value="100" label="Window size (bp)" /> - <param name="metric" type="select" label="Downsampling method"> - <option value="mean">Mean</option> - <option value="min">Minimum</option> - <option value="max">Maximum</option> - <option value="coverage">Coverage</option> - <option value="total">Total</option> - </param> - </inputs> - <outputs> - <data format="wig" name="output" metadata_source="input" /> - </outputs> - - <tests> - <test> - <param name="input" value="wigmath1.wig"/> - <param name="window" value="1"/> - <param name="metric" value="mean"/> - <output name="output" file="downsample1.wig"/> - </test> - <test> - <param name="input" value="wigmath2.bw"/> - <param name="window" value="5"/> - <param name="metric" value="max"/> - <output name="output" file="downsample2.wig"/> - </test> - <test> - <param name="input" value="wigmath3.wig"/> - <param name="window" value="100"/> - <param name="metric" value="total"/> - <output name="output" file="downsample3.wig"/> - </test> - </tests> - - <help> - -This tool can be used to reduce the resolution and file size of Wig files for easier upload to UCSC. Data is downsampled in non-overlapping windows starting from the beginning of each chromosome. Each window can be downsampled as the mean, minimum, maximum, total, or coverage of the original data. 
- ------ - -**Downsampling Methods** - -- **Mean:** the arithmetic mean of the values in the original data window -- **Minimum:** the least value in the original data window -- **Maximum:** the greatest value in the original data window -- **Coverage:** the fraction of bases with values in the original window -- **Total:** the sum of all values in the original data window - ------ - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - - </help> -</tool>
--- a/galaxy-conf/DynaPro.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,48 +0,0 @@ -<tool id="DynaPro" name="Compute equilibrium nucleosome positions" version="1.1.0"> - <description>using DynaPro</description> - <command interpreter="sh">galaxyToolRunner.sh nucleosomes.DynaPro -i $input -n $N - #if str( $mean ) != '' - -m $mean - #end if - - #if str( $variance ) != '' - -v $variance - #end if - -o $output - </command> - <inputs> - <param format="bigwig,wig" name="input" type="data" label="Energy landscape" /> - <param name="N" type="integer" value="147" label="Nucleosome size (bp)" /> - <param name="mean" type="float" optional="true" label="Shift energy landscape to have mean" /> - <param name="variance" type="float" optional="true" label="Rescale energy landscape to have variance" /> - </inputs> - <outputs> - <data format="wig" name="output" metadata_source="input" /> - </outputs> - <help> - -.. class:: warningmark - -At present, this tool is only suitable for small genomes (yeast) since entire chromosomes must be loaded into memory. - ------ - -Equilibrium nucleosome distribution is modeled as a one-dimensional fluid of hard rods adsorbing and moving within an external potential. This tool provides a simplified version of the DynaPro_ algorithm for a single factor interacting with hard-core repulsion. - -.. _DynaPro: http://nucleosome.rutgers.edu/nucleosome/ - ------ - -**Syntax** - -- **Energy landscape** is the external potential function for each genomic base pair, and must be in Wig format. -- **Nucleosome size** is the hard-core interaction size. - ------ - -**Citation** - -Morozov AV, Fortney K, Gaykalova DA, Studitsky VM, Widom J and Siggia ED (2009) Using DNA mechanics to predict in vitro nucleosome positions and formation energies. Nucleic Acids Res 37: 4707–4722. - - </help> -</tool>
--- a/galaxy-conf/ExtractDataFromRegion.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,27 +0,0 @@ -<tool id="ExtractDataFromWig" name="Extract data from a Wig file" version="1.0.0"> - <description>for a genomic interval</description> - <command interpreter="sh"> - galaxyToolRunner.sh ngs.ExtractDataFromRegion --chr $chr --start $start --stop $stop -o $output $file1 - #for $input in $inputs - ${input.file} - #end for - </command> - <inputs> - <param name="file1" label="(Big)Wig file" type="data" format="bigwig,wig" /> - <repeat name="inputs" title="(Big)Wig file"> - <param name="file" type="data" format="bigwig,wig" /> - </repeat> - <param name="chr" type="text" label="Chromosome" /> - <param name="start" type="integer" value="1" label="Start base pair" /> - <param name="stop" type="integer" value="1000" label="Stop base pair" /> - </inputs> - <outputs> - <data format="tabular" name="output" /> - </outputs> - -<help> - -This tool will extract data from Wig or BigWig file(s) for a specific region of the genome. - -</help> -</tool>
--- a/galaxy-conf/FastqIlluminaToSanger.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,29 +0,0 @@ -<tool id="FastqIlluminaToSanger" name="Convert Fastq qualities" version="1.0.0"> - <description>from Illumina to Sanger</description> - <command interpreter="sh">galaxyToolRunner.sh converters.FastqIlluminaToSanger -i $input -o $output</command> - <inputs> - <param name="input" type="data" format="fastqillumina" label="FASTQ, Illumina qualities" /> - </inputs> - <outputs> - <data name="output" format="fastqsanger" metadata_source="input" /> - </outputs> - <tests> - <test> - <param name="input" value="test.fastqillumina" ftype="fastqillumina"/> - <output name="output" file="test.fastqsanger"/> - </test> - </tests> -<help> - -This tool will convert a FASTQ file with ASCII quality scores encoded in Illumina 1.3-1.7 format (Phred+64) to Sanger format (Phred+33) for use with Bowtie and other Galaxy tools. Illumina CASAVA >= 1.8 already produces FASTQ files in Sanger format, so this tool should not be used on new Illumina sequencing data. This tool is a simpler version of the FASTQ Groomer that does little error checking but runs much faster. If you are unsure what format your file is in, or need to do other conversions, use the FASTQ Groomer instead. - -For more information, read about FASTQ formats_ (right-click to open in new window). - -.. _formats: http://en.wikipedia.org/wiki/FASTQ_format - -.. class:: warningmark - -This tool requires fastqillumina formatted data. If you have fastq data that was not correctly autodetected, change the metadata by clicking on the pencil icon for the dataset. - -</help> -</tool>
--- a/galaxy-conf/FindAbsoluteMaxima.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,52 +0,0 @@ -<tool id="FindWigMaxima" name="Find absolute maxima" version="1.1.0"> - <description>in intervals</description> - <command interpreter="sh"> - galaxyToolRunner.sh ngs.FindAbsoluteMaxima -l $window -o $output - #for $input in $inputs - ${input.file} - #end for - </command> - <inputs> - <repeat name="inputs" title="(Big)Wig file"> - <param name="file" type="data" format="bigwig,wig" /> - </repeat> - <param name="window" type="data" format="bed,bedgraph,gff" label="Intervals to find maxima in" /> - </inputs> - <outputs> - <data name="output" format="tabular" /> - </outputs> - - <help> - -This tool can be used to find the location of the maximum value in genomic intervals, such as finding the peak summit inside a set of peak calls. - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. Intervals must be provided in Bed, BedGraph, or GFF format. - ------ - -**Example** - - -if **Intervals** are genes :: - - chr11 5203271 5204877 NM_000518 0 - - chr11 5210634 5212434 NM_000519 0 - - chr11 5226077 5227663 NM_000559 0 - - -and **Wig files** are :: - - Data1.wig - Data2.wig - -this tool will find the location of the maximum value in each interval for each of the provided Wig/BigWig files, and append them in columns in the order that they were added :: - - chr11 5203271 5204877 NM_000518 0 - 5203374 5204300 - chr11 5210634 5212434 NM_000519 0 - 5210638 5212450 - chr11 5226077 5227663 NM_000559 0 - 5226800 5226241 - -where column 7 is the location of the maximum value in that interval for Data1.wig, and column 8 is the location of the maximum value in that interval for Data2.wig. - - </help> -</tool>
--- a/galaxy-conf/FindBoundaryNucleosomes.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,30 +0,0 @@ -<tool id="FindNuke" name="Find boundary nucleosomes" version="2.0.0"> - <description>in windows</description> - <command interpreter="sh">galaxyToolRunner.sh nucleosomes.FindBoundaryNucleosomes -i $input -l $loci -o $output</command> - <inputs> - <param name="input" type="data" format="tabular" label="Nucleosome calls" /> - <param name="loci" type="data" format="bed,bedgraph,gff" label="List of intervals" /> - </inputs> - <outputs> - <data name="output" format="bed" metadata_source="loci" /> - </outputs> - - <help> - -.. class:: infomark - -Use the Call Nucleosomes tool to create a file of called nucleosomes, then use this tool to identify the first nucleosome's dyad position (peak maximum) from the 5' and 3' end of the gene. - -.. class:: infomark - -**TIP:** Nucleosome calls must be in tabular format of the kind produced by the Nucleosomes -> Call nucleosomes tool. Intervals must be in either Bed, BedGraph, or GFF format. - ------ - -**Syntax** - -- **Nucleosome calls** is a list of stereotypic nucleosome position calls. -- **List of intervals:** The 5' and 3' boundary nucleosomes will be found for each interval in this list - - </help> -</tool>
--- a/galaxy-conf/FindNMers.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,52 +0,0 @@ -<tool id="FindNMers" name="Find NMers" version="1.0.0"> - <description>in a DNA sequence</description> - <command interpreter="sh">galaxyToolRunner.sh dna.FindNMers -i - #if $refGenomeSource.genomeSource == "history": - $refGenomeSource.ownFile - #else - ${refGenomeSource.index.fields.path} - #end if - -m $mismatches -n $nmer $rc -o $output - </command> - <inputs> - <conditional name="refGenomeSource"> - <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options"> - <option value="indexed">Use a built-in index</option> - <option value="history">Use one from the history</option> - </param> - <when value="indexed"> - <param name="index" type="select" label="Select a reference genome" help="if your genome of interest is not listed - contact Galaxy team"> - <options from_data_table="sam_fa_indexes"> - <filter type="sort_by" column="1" /> - <validator type="no_options" message="No indexes are available" /> - </options> - </param> - </when> - <when value="history"> - <param name="ownFile" type="data" format="fasta" metadata_name="dbkey" label="Select the reference genome" /> - </when> <!-- history --> - </conditional> <!-- refGenomeSource --> - - <param name="nmer" type="text" optional="false" label="NMer to search for" /> - <param name="mismatches" type="integer" value="0" label="Number of allowed mismatches (Hamming distance)" /> - <param name="rc" type="boolean" checked="true" truevalue="--rc" falsevalue="" label="Search reverse-complement as well" /> - </inputs> - <outputs> - <data format="bed" name="output"/> - </outputs> - <tests> - <test> - <param name="genomeSource" value="history"/> - <param name="ownFile" value="test.fasta"/> - <param name="property" value="Twist"/> - <param name="N" value="false"/> - <output 
name="output" file="twist.wig"/> - </test> - </tests> - - <help> - -This tool will find all matches of a given NMer in a DNA sequence. Sequences may be provided in FASTA format or selected from available reference genomes. Mismatches are allowed, but not insertions/deletions. The output is a Bed file with the locations of matches in the reference sequence. - - </help> -</tool>
--- a/galaxy-conf/FindOutlierRegions.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,33 +0,0 @@ -<tool id="WigFindOutliers" name="Find outlier regions" version="1.1.0"> - <description>such as CNVs</description> - <command interpreter="sh">galaxyToolRunner.sh ngs.FindOutlierRegions -i $input -w $window -t $threshold $below -o $output</command> - <inputs> - <param format="bigwig,wig" name="input" type="data" label="Input data" /> - <param name="window" type="integer" value="150" label="Window size" /> - <param name="threshold" type="float" value="3" label="Threshold (fold times the mean)" /> - <param name="below" type="boolean" checked="false" truevalue="-b" falsevalue="" label="Search for outliers below the threshold" /> - </inputs> - <outputs> - <data format="bed" name="output" metadata_source="input" /> - </outputs> - - <help> - -This tool identifies regions of the genome that may be repetitive elements or CNVs by scanning for windows that have an exceptionally high mean relative to the genome-wide mean. - ------ - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - ------ - -**Syntax** - -- **Input data** is Wig or BigWig formatted data from a high-throughput sequencing experiment. -- **Window size** is the size of the moving average to use. -- **Threshold** is the fold times the genome-wide mean that a window's mean must be in order to be considered an outlier region. - - </help> -</tool>
--- a/galaxy-conf/GaussianSmooth.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,40 +0,0 @@ -<tool id="WigGaussianSmooth" name="Gaussian smooth" version="1.1.0"> - <description>a (Big)Wig file</description> - <command interpreter="sh">galaxyToolRunner.sh wigmath.GaussianSmooth -i $input -s $S -o $output</command> - <inputs> - <param name="input" type="data" format="bigwig,wig" label="Smooth the data in" /> - <param name="S" type="integer" value="20" optional="true" label="Standard deviation of the Gaussian in base pairs" /> - </inputs> - <outputs> - <data format="wig" name="output" metadata_source="input" /> - </outputs> - <tests> - <test> - <param name="input" value="wigmath1.wig"/> - <param name="S" value="20"/> - <output name="output" file="gaussian1.wig"/> - </test> - <test> - <param name="input" value="wigmath2.bw"/> - <param name="S" value="3"/> - <output name="output" file="gaussian2.wig"/> - </test> - <test> - <param name="input" value="wigmath3.wig"/> - <param name="S" value="40"/> - <output name="output" file="gaussian3.wig"/> - </test> - </tests> - -<help> - -This tool smooths genomic data with an area-preserving Gaussian_ filter. The Gaussian filter is computed out to +/- 3 standard deviations. - -.. _Gaussian: http://en.wikipedia.org/wiki/Gaussian_filter - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - -</help> -</tool>
--- a/galaxy-conf/GeneTrackToBedGraph.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,27 +0,0 @@ -<tool id="GeneTrackToBedGraph" name="GeneTrack to BedGraph" version="1.1.0"> - <description>converter</description> - <command interpreter="sh">galaxyToolRunner.sh converters.GeneTrackToBedGraph -i $input -o $output</command> - <inputs> - <param name="input" type="data" format="tabular" label="Input GeneTrack index" /> - </inputs> - <outputs> - <data name="output" format="bedgraph" metadata_source="input" /> - </outputs> - <tests> - <test> - <param name="input" value="test.genetrack" ftype="tabular"/> - <output name="output" file="geneTrackToBedGraph.bedGraph"/> - </test> - </tests> -<help> - -This tool will sum the counts from the forward and reverse strands in a GeneTrack_ index to create a BedGraph file. - -.. _GeneTrack: http://atlas.bx.psu.edu/genetrack/docs/genetrack.html - -.. class:: warningmark - -This tool requires GeneTrack formatted data. If you have tabular data that was not correctly autodetected, change the metadata by clicking on the pencil icon for the dataset. - -</help> -</tool>
--- a/galaxy-conf/GeneTrackToWig.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,39 +0,0 @@ -<tool id="GeneTrackToWig" name="GeneTrack to Wig" version="1.1.0"> - <description>converter</description> - <command interpreter="sh">galaxyToolRunner.sh converters.GeneTrackToWig -i $input -s $shift $zero -a ${chromInfo} -o $output</command> - <inputs> - <param name="input" type="data" format="tabular" label="Input GeneTrack index" /> - <param name="shift" type="integer" value="0" optional="true" label="Shift +/- strand counts by this amount when merging" /> - <param name="zero" type="boolean" checked="false" truevalue="-z" falsevalue="" label="Assume zero where there is no data (default is NaN)" /> - </inputs> - <outputs> - <data name="output" format="wig" metadata_source="input" /> - </outputs> - <tests> - <test> - <param name="input" value="test.genetrack" ftype="tabular"/> - <param name="shift" value="73"/> - <param name="zero" value="true"/> - <param name="chromInfo" value="sacCer2"/> - <output name="output" file="geneTrackToWig1.wig"/> - </test> - <test> - <param name="input" value="test.genetrack" ftype="tabular"/> - <param name="shift" value="0"/> - <param name="zero" value="false"/> - <param name="chromInfo" value="sacCer2"/> - <output name="output" file="geneTrackToWig2.wig"/> - </test> - </tests> -<help> - -This tool will convert GeneTrack_ format files into Wig files, optionally offsetting the + and - strand counts by a specified value before merging them. - -.. _GeneTrack: http://atlas.bx.psu.edu/genetrack/docs/genetrack.html - -.. class:: warningmark - -This tool requires GeneTrack formatted data. If you have tabular data that was not correctly autodetected, change the metadata by clicking on the pencil icon for the dataset. - -</help> -</tool>
--- a/galaxy-conf/GreedyCaller.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,49 +0,0 @@ -<tool id="CallNukes" name="Call Nucleosomes" version="1.1.0"> - <description>in an MNase experiment</description> - <command interpreter="sh">galaxyToolRunner.sh nucleosomes.GreedyCaller -d $dyads -s $smoothed -n $N -o $output</command> - <inputs> - <param name="dyads" type="data" format="bigwig,wig" label="Dyad counts" /> - <param name="smoothed" type="data" format="bigwig,wig" label="Smoothed dyad counts" /> - <param name="N" type="integer" value="147" optional="true" label="Assumed nucleosome size" /> - </inputs> - <outputs> - <data name="output" format="tabular" /> - </outputs> - -<help> - -Stereotypic nucleosome positions are identified from dyad density maps using an approach similar to the previously reported greedy algorithm in GeneTrack_ (Albert, et al. 2008). Nucleosome calls are identified at peak maxima (p) in the smoothed dyad density map, and then excluded in the surrounding window [p–N, p+N], where N is the assumed nucleosome size in base pairs. This process is continued until all possible sterically hindered nucleosome positions are identified. - -.. _GeneTrack: http://atlas.bx.psu.edu/genetrack/docs/genetrack.html - -.. class:: warningmark - -This tool requires dyad counts and smoothed dyad counts in Wig or BigWig format. Smoothed dyad counts can be generated from dyad counts using the WigMath -> Gaussian smooth tool. - ------ - -**Syntax** - -- **Dyad counts** is the relative number of nucleosomes positioned at each base pair. -- **Smoothed dyad counts** should correspond to a smoothed version of the **Dyad counts** -- **Assumed nucleosome size** is the window size used while identifying maxima to restrict overlapping calls. - ------ - -**Output** - -The output format has 10 columns defined as follows - -- 1. **Chromosome:** the chromosome of this nucleosome call -- 2. 
**Start:** the lower coordinate of the call window, equal to the dyad position - N/2 -- 3. **Stop:** the higher coordinate of the call window, equal to the dyad position + N/2 -- 4. **Length:** the window size (N) of the nucleosome call, equal to the value specified when the tool was run -- 5. **Length standard deviation:** the standard deviation of the nucleosome call length (equal to 0 because it is not currently calculated) -- 6. **Dyad:** the location of the peak maximum (p) in the smoothed dyad density data -- 7. **Dyad standard deviation:** the standard deviation of dyad density around the dyad mean in the dyad counts data -- 8. **Conditional position:** the probability that a nucleosome is at this exact dyad location as opposed to anywhere else in the nucleosome call window [p-N/2, p+N/2] -- 9. **Dyad mean:** the mean of the dyad counts in the window [p-N/2, p+N/2] -- 10. **Occupancy:** the sum of the dyad counts in the window [p-N/2, p+N/2] - -</help> -</tool>
--- a/galaxy-conf/InterpolateDiscontinuousData.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,40 +0,0 @@ -<tool id="WigInterpolate" name="Interpolate" version="1.1.0"> - <description>missing values in a (Big)Wig file</description> - <command interpreter="sh">galaxyToolRunner.sh converters.InterpolateDiscontinousData -i $input -t $type -m $max -o $output</command> - <inputs> - <param format="bigwig,wig" name="input" type="data" label="Interpolate missing values in" /> - <param name="type" type="select" label="Interpolation type"> - <option value="nearest">Nearest</option> - <option value="linear">Linear</option> - <option value="cubic">Cubic</option> - </param> - <param name="max" type="integer" value="1000" label="Maximum span of missing values to interpolate (bp)"/> - </inputs> - <outputs> - <data format="wig" name="output" metadata_source="input" /> - </outputs> - - <help> - -This tool will attempt to interpolate missing values (NaN) in a Wig file that result when converting discontinuous microarray probe data to Wig format. Stretches of missing data that extend longer than the allowed maximum will be left as NaN. - ------ - -**Interpolation types** - -- **Nearest** uses the value of the nearest base pair that has data -- **Linear** uses a linear interpolant between the values of the nearest two probes -- **Cubic** uses a cubic interpolant between the values of the nearest two probes - -For more information, see Wikipedia_. - -.. _Wikipedia: http://en.wikipedia.org/wiki/Interpolation - ------ - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use the Converters -> IntervalToWig tool to convert Bed, BedGraph, or GFF-formatted microarray data to Wig format, then use this tool to interpolate the missing values between probes. - - </help> -</tool>
--- a/galaxy-conf/IntervalAverager.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,40 +0,0 @@ -<tool id="IntervalAverager" name="Average intervals" version="2.1.0"> - <description>that have been aligned</description> - <command interpreter="sh"> - galaxyToolRunner.sh visualization.IntervalAverager -l $loci -o $output $file1 - #for $input in $inputs - ${input.file} - #end for - </command> - <inputs> - <param name="file1" label="Sequencing data" type="data" format="bigwig,wig" /> - <repeat name="inputs" title="Additional sequencing data"> - <param name="file" type="data" format="bigwig,wig" /> - </repeat> - <param format="bed" name="loci" type="data" label="List of intervals (with alignment points)" /> - </inputs> - <outputs> - <data format="tabular" name="output" /> - </outputs> - -<help> - -This tool calculates the average signal for a set of aligned intervals. Intervals are lined up on their alignment point (column 5 in the Bed file), flipped if on the - strand, and averaged. The output is equivalent to aligning the data in a matrix and then taking the columnwise average of the matrix. - -Intervals with alignment points must be provided in the following extended Bed format :: - - chr low high id alignment strand - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - ------ - -**Syntax** - -- **Sequencing data** is the genomic data used to create the average -- **List of intervals** is a list of intervals in Bed format with alignment points - -</help> -</tool>
--- a/galaxy-conf/IntervalLengthDistribution.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,38 +0,0 @@ -<tool id="IntervalLengthDistribution" name="Make histogram" version="1.0.0"> - <description>of read lengths</description> - <command interpreter="sh">galaxyToolRunner.sh ngs.IntervalLengthDistribution -i $input $freq -o $output</command> - <inputs> - <param name="input" type="data" format="sam,bam,bed,bedgraph,gff" label="Reads/Intervals" /> - <param name="freq" type="boolean" checked="false" truevalue="-f" falsevalue="" label="Output normalized frequencies rather than counts" /> - </inputs> - <outputs> - <data format="tabular" name="output" /> - </outputs> - <tests> - <test> - <param name="input" value="test.bed"/> - <param name="freq" value="false"/> - <output name="output" file="intervallengthdistribution1.txt"/> - </test> - <test> - <param name="input" value="test.bed"/> - <param name="freq" value="true"/> - <output name="output" file="intervallengthdistribution2.txt"/> - </test> - <test> - <param name="input" value="test2.bed"/> - <param name="freq" value="false"/> - <output name="output" file="intervallengthdistribution3.txt"/> - </test> - </tests> - -<help> - -This tool calculates the distribution of interval lengths from a list of intervals or reads in SAM, BAM, Bed, BedGraph, or GFF format. - -.. class:: warningmark - -For paired-end sequencing reads, the length is the length of the fragment (5' end of read 1 to 5' end of read 2) - -</help> -</tool>
--- a/galaxy-conf/IntervalStats.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,44 +0,0 @@ -<tool id="IntervalStats" name="Compute mean/min/max of intervals" version="1.0.0"> - <description>of data in a (Big)Wig file</description> - <command interpreter="sh"> - galaxyToolRunner.sh ngs.IntervalStats -l $windows -s $stat -o $output - #for $input in $inputs - ${input.file} - #end for - </command> - <inputs> - <repeat name="inputs" title="(Big)Wig file"> - <param name="file" type="data" format="bigwig,wig" /> - </repeat> - <param format="bed,bedgraph,gff" name="windows" type="data" label="List of intervals" /> - <param name="stat" type="select" optional="true" label="For each interval, compute the"> - <option value="mean">Mean</option> - <!-- TODO <option value="median">Median</option> --> - <option value="max">Max</option> - <option value="min">Min</option> - </param> - </inputs> - <outputs> - <data format="tabular" name="output" /> - </outputs> - -<help> - -This tool calculates the arithmetic mean, maximum, or minimum value for the Wig data in each interval. For each Wig file provided, an additional column is added to the output file in the order that they are added above. - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - ------ - -**Example** - -Calculate the mean change in nucleosome occupancy for each gene in the yeast genome: - -- 1. Create a "change in occupancy" dataset by subtracting the normalized occupancy Wig files from your two conditions using the WigMath -> Subtract tool. -- 2. Upload a list of intervals corresponding to the genes in the yeast genome, or pull the data from UCSC using Get Data -> UCSC Main. -- 3. Calculate the mean change in occupancy for each gene using this tool and the datasets from (1) and (2). - -</help> -</tool>
--- a/galaxy-conf/IntervalToBed.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,19 +0,0 @@ -<tool id="IntervalToBed" name="SAM/BAM/GFF/BedGraph/BigBed/VCF to Bed" version="1.0.0"> - <description>converter</description> - <command interpreter="sh">galaxyToolRunner.sh converters.IntervalToBed -i $input -o $output</command> - <inputs> - <param name="input" type="data" format="sam,bam,gff,bigbed,bedgraph,vcf" label="Input" /> - </inputs> - <outputs> - <data name="output" format="bed" metadata_source="input" /> - </outputs> -<help> - -This tool will convert any file in SAM, BAM, GFF, BedGraph, BigBed, or VCF format to Bed format. - -.. class:: warningmark - -For SAM/BAM data, paired-end reads are converted to Bed format as the entire fragment (5' end of mate 1 to the 5' end of mate 2). Single-end reads are converted to Bed format as the read itself, with strand information. If your SAM/BAM file contains both mate alignments from a paired-end sequencing run (i.e. two entries for each fragment), you should first filter out reads from either the + or - strand with the SAM Tools -> Filter SAM tool to avoid producing redundant entries in the output Bed file. - -</help> -</tool>
--- a/galaxy-conf/IntervalToWig.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,21 +0,0 @@ -<tool id="BedToWig" name="Bed/BedGraph/GFF to Wig" version="1.1.0"> - <description>converter</description> - <command interpreter="sh">galaxyToolRunner.sh converters.IntervalToWig -i $input $zero -a ${chromInfo} -o $output</command> - <inputs> - <param name="input" type="data" format="bed,bedgraph,gff" label="Input Bed/BedGraph/GFF file" /> - <param name="zero" type="boolean" checked="false" truevalue="-z" falsevalue="" label="Assume zero where there is no data (default is NaN)" /> - </inputs> - <outputs> - <data name="output" format="wig" metadata_source="input" /> - </outputs> - -<help> - -This tool converts data from an interval format, such as Bed, BedGraph or GFF, to Wig format. This can be used to convert data from microarrays to Wig format. The value of each interval is mapped into the Wig file. Intervals that overlap in the original file (multiple-valued base pairs) are averaged, and bases without data in the original interval file are set to NaN. - -.. class:: warningmark - -This tool requires Bed, BedGraph, or GFF formatted data. If you have tabular data that was not correctly autodetected, change the metadata by clicking on the pencil icon for the dataset. - -</help> -</tool>
--- a/galaxy-conf/KMeans.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,41 +0,0 @@ -<tool id="KMeans" name="KMeans cluster" version="1.0.0"> - <description>an aligned matrix</description> - <command interpreter="sh">galaxyToolRunner.sh visualization.KMeans -i $input -k $K -1 $min -2 $max -o $output</command> - <inputs> - <param format="tabular" name="input" type="data" label="Aligned matrix" /> - <param name="K" type="integer" value="10" label="Number of clusters" /> - <param name="min" type="integer" value="1" label="Minimum column to use for clustering" /> - <param name="max" type="integer" value="-1" label="Maximum column to use for clustering (-1 to end)" /> - </inputs> - <outputs> - <data format="tabular" name="output" metadata="input" /> - </outputs> - <tests> - </tests> - - <help> - -.. class:: warningmark - -This tool requires tabular data in matrix2png format (with column AND row headers). For more information about the required format and usage instructions, see the matrix2png_ website. - -.. _matrix2png: http://bioinformatics.ubc.ca/matrix2png/dataformat.html - -.. class:: infomark - -You can use the "Align values in a matrix" tool to create a matrix, then use this tool to cluster the matrix with k-means. - -.. class:: infomark - -**TIP:** You can use the **min** and **max** columns to cluster a large matrix based on a subset of the columns. For example, you could cluster a 4000x4000 matrix on columns 200-300 by setting min = 200 and max = 300. This will greatly increase the efficiency of distance calculations during the k-means EM, and also allows you to cluster based on specific regions, such as promoters or coding sequences. - ------ - -This tool will cluster the rows in an aligned matrix with KMeans_. The implementation builds upon the KMeansPlusPlusClusterer available in commons-math3_. - -.. _KMeans: http://en.wikipedia.org/wiki/K-means_clustering - -.. 
_commons-math3: http://commons.apache.org/math/ - - </help> -</tool>
--- a/galaxy-conf/LogTransform.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,51 +0,0 @@ -<tool id="WigLogTransform" name="Log transform" version="1.1.0"> - <description>a (Big)Wig file</description> - <command interpreter="sh">galaxyToolRunner.sh wigmath.LogTransform -i $input -b $base -o $output</command> - <inputs> - <param format="bigwig,wig" name="input" type="data" label="(Big)Wig file" /> - <param name="base" type="integer" value="2" label="Logarithm base" /> - </inputs> - <outputs> - <data format="wig" name="output" metadata_source="input" /> - </outputs> - <tests> - <test> - <param name="input" value="wigmath1.wig"/> - <param name="base" value="2"/> - <output name="output" file="logger1.wig"/> - </test> - <test> - <param name="input" value="wigmath2.wig"/> - <param name="base" value="3"/> - <output name="output" file="logger2.wig"/> - </test> - <test> - <param name="input" value="wigmath3.wig"/> - <param name="base" value="10"/> - <output name="output" file="logger3.wig"/> - </test> - <test> - <param name="input" value="wigmath1.bw"/> - <param name="base" value="2"/> - <output name="output" file="logger4.wig"/> - </test> - <test> - <param name="input" value="wigmath2.bw"/> - <param name="base" value="3"/> - <output name="output" file="logger5.wig"/> - </test> - <test> - <param name="input" value="wigmath3.bw"/> - <param name="base" value="10"/> - <output name="output" file="logger6.wig"/> - </test> - </tests> - - <help> - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - - </help> -</tool>
--- a/galaxy-conf/MapDyads.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,41 +0,0 @@ -<tool id="MapDyads" name="Map dyads" version="1.1.0"> - <description>from sequencing reads</description> - <command interpreter="sh"> - galaxyToolRunner.sh nucleosomes.MapDyads -i $input -a ${chromInfo} -o $output - #if $type.read == 'single' - -s $type.size - #end if - </command> - <inputs> - <param name="input" type="data" format="sam,bam,bed,bedGraph" label="Sequencing reads" /> - <conditional name="type"> - <param name="read" type="select" label="Type of reads"> - <option value="paired" selected="true">Paired-End</option> - <option value="single">Single-End</option> - </param> - <when value="single"> - <param name="size" type="integer" value="147" label="Estimated mononucleosome length (used to offset +/- strands)" /> - </when> - <when value="paired"> - <!-- No values here --> - </when> - </conditional> - </inputs> - <outputs> - <data name="output" format="wig" /> - </outputs> - -<help> - -This tool produces a Wig file with the number of dyads at each base pair. For paired-end MNase data, dyads are approximated using the center of the fragment. For Bed/BedGraph formatted input, this means the center of the interval; for SAM/BAM formatted input, this means the middle between the 5' end of mate 1 and the 5' end of mate 2. For single-end data, the estimated mononucleosome fragment length (N) must be specified, which will be used to offset reads from the + and - strands by +/- N/2. - -.. class:: warningmark - -This tool requires sequencing reads in SAM, BAM, Bed, or BedGraph format. - -.. class:: warningmark - -Since BedGraph format does not contain strand information, all reads in BedGraph format are considered to be on the 5' strand. - -</help> -</tool>
--- a/galaxy-conf/MatrixAligner.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,80 +0,0 @@ -<tool id="MatrixAligner" name="Align values in a matrix" version="1.0.0"> - <description>for a heatmap</description> - <command interpreter="sh">galaxyToolRunner.sh visualization.MatrixAligner -i $input -l $loci -m $M -o $output</command> - <inputs> - <param format="wig,bigwig" name="input" type="data" label="Sequencing data" /> - <param format="bed" name="loci" type="data" label="List of intervals (with alignment points)" /> - <param type="integer" name="M" value="4000" label="Maximum row length" /> - </inputs> - <outputs> - <data format="tabular" name="output" /> - </outputs> - <!-- TODO:<tests> - <test> - <param name="input" value="test.wig"/> - <param name="loci" value="test.bed"/> - <param name="M" value="4000"/> - <output name="output" file="matrixAligner.output"/> - </test> - <test> - <param name="input" value="test.bw"/> - <param name="loci" value="test.bed"/> - <param name="M" value="4000"/> - <output name="output" file="matrixAligner.output"/> - </test> - <test> - <param name="input" value="test.wig"/> - <param name="loci" value="test2.bed"/> - <param name="M" value="4000"/> - <output name="output" file="matrixAligner.output2"/> - </test> - <test> - <param name="input" value="test.bw"/> - <param name="loci" value="test2.bed"/> - <param name="M" value="4000"/> - <output name="output" file="matrixAligner.output2"/> - </test> - <test> - <param name="input" value="test.wig"/> - <param name="loci" value="test3.bed"/> - <param name="M" value="4000"/> - <output name="output" file="matrixAligner.output3"/> - </test> - <test> - <param name="input" value="test.bw"/> - <param name="loci" value="test3.bed"/> - <param name="M" value="4000"/> - <output name="output" file="matrixAligner.output3"/> - </test> - </tests>--> - -<help> - -This tool aligns sequencing data into a rectangular matrix for creating a heatmap with matrix2png. 
Data from each interval is lined up on the specified alignment point (column 5 in the Bed file), and flipped if on the - strand so that all intervals are 5'-to-3' from left-to-right. - -Intervals with alignment points must be provided in the following extended Bed format :: - - chr low high id alignment strand - -The heatmap is created by taking each interval in the **List of Intervals**, retrieving the data for that interval from the Wig file, and adding it as a new row in the matrix. Intervals are processed in their original order. - ------ - -**Syntax** - -- **Sequencing data** is the genomic data used to create the matrix -- **List of intervals** is a list of intervals in Bed format with alignment points -- **Maximum row length** is the maximum allowed width of the matrix. If aligned intervals extend outside of this width, they will be truncated. - ------ - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - -.. class:: warningmark - -Large heatmap matrices may require a long time to generate in Galaxy because it validates that the output is in correct tab-delimited format. To reduce the size of an MxN matrix with large M, rows (N) can be truncated using the maximum row length parameter. Rows are truncated from the alignment point (symmetrically) if possible, or as nearly symmetrically as possible. - -</help> -</tool>
--- a/galaxy-conf/MovingAverageSmooth.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,71 +0,0 @@ -<tool id="WigMovingAverage" name="Moving average smooth" version="1.1.0"> - <description>a (Big)Wig file</description> - <command interpreter="sh">galaxyToolRunner.sh wigmath.MovingAverageSmooth -i $input -w $W -o $output</command> - <inputs> - <param name="input" type="data" format="bigwig,wig" label="Smooth the data in" /> - <param name="W" type="integer" value="20" optional="true" label="Width of the moving average in base pairs" /> - </inputs> - <outputs> - <data format="wig" name="output" metadata_source="input" /> - </outputs> - <tests> - <!--<test> - <param name="input" value="test.wig"/> - <param name="dbkey" value="sacCer2"/> - <param name="S" value="20"/> - <param name="W" value="3"/> - <output name="output" file="smoother.output1"/> - </test> - <test> - <param name="input" value="test.bw"/> - <param name="dbkey" value="sacCer2"/> - <param name="S" value="20"/> - <param name="W" value="3"/> - <output name="output" file="smoother.output1"/> - </test> - <test> - <param name="input" value="test.wig"/> - <param name="dbkey" value="sacCer2"/> - <param name="S" value="10"/> - <param name="W" value="2"/> - <output name="output" file="smoother.output2"/> - </test> - <test> - <param name="input" value="test.bw"/> - <param name="dbkey" value="sacCer2"/> - <param name="S" value="10"/> - <param name="W" value="2"/> - <output name="output" file="smoother.output2"/> - </test> - <test> - <param name="input" value="test.wig"/> - <param name="dbkey" value="sacCer2"/> - <param name="S" value="50"/> - <param name="W" value="1"/> - <output name="output" file="smoother.output3"/> - </test> - <test> - <param name="input" value="test.bw"/> - <param name="dbkey" value="sacCer2"/> - <param name="S" value="5"/> - <param name="W" value="1"/> - <output name="output" file="smoother.output3"/> - </test>--> - </tests> - -<help> - -This tool smooths 
genomic data with a mean_ filter of the specified width. - -.. _mean: http://en.wikipedia.org/wiki/Moving_average - -.. class:: warningmark - -Note that for the moving average to be perfectly symmetric, the window should be an odd number of base pairs. - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - -</help> -</tool>
--- a/galaxy-conf/Multiply.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,27 +0,0 @@ -<tool id="WigMultiply" name="Multiply" version="1.1.0"> - <description>(Big)Wig files</description> - <command interpreter="sh"> - galaxyToolRunner.sh wigmath.Multiply -o $output - #for $input in $inputs - ${input.file} - #end for - </command> - <inputs> - <repeat name="inputs" title="(Big)Wig file"> - <param name="file" type="data" format="bigwig,wig" /> - </repeat> - </inputs> - <outputs> - <data format="wig" name="output" /> - </outputs> - -<help> - -This tool multiplies Wig or BigWig files base pair by base pair. - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - -</help> -</tool>
--- a/galaxy-conf/PairOverlappingNucleosomes.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,18 +0,0 @@ -<tool id="PairNukes" name="Pair nucleosomes" version="1.0.0"> - <description>by overlap</description> - <command interpreter="sh">galaxyToolRunner.sh nucleosomes.PairOverlappingNucleosomes -a $input1 -b $input2 -m $N -o $output</command> - <inputs> - <param name="input1" type="data" format="tabular" label="Nucleosome calls 1" /> - <param name="input2" type="data" format="tabular" label="Nucleosome calls 2" /> - <param name="N" type="integer" value="73" label="Minimum overlap (bp)" /> - </inputs> - <outputs> - <data name="output" format="tabular" /> - </outputs> - -<help> - -This tool will pair overlapping nucleosomes from two sets of nucleosome calls. In the event that multiple calls overlap, the one with the largest overlap is selected as a match. - -</help> -</tool>
--- a/galaxy-conf/PercusDecomposition.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,25 +0,0 @@ -<tool id="PercusDecomposition" name="Derive Percus energy landscape" version="1.1.0"> - <description>from occupancy data</description> - <command interpreter="sh">galaxyToolRunner.sh nucleosomes.PercusDecomposition -d $dyads -n $N -o $output</command> - <inputs> - <param name="dyads" type="data" format="bigwig,wig" label="Dyad counts (smoothed)" /> - <param name="N" type="integer" value="147" optional="true" label="Assumed nucleosome size" /> - </inputs> - <outputs> - <data name="output" format="wig" /> - </outputs> - -<help> - -This tool derives an external potential energy function from experimental nucleosome positioning data by assuming that nucleosomes interact with DNA like a fluid of hard rods. This energy function can then be used to derive sequence-specific nucleosome formation preferences, while accounting for hard-core steric restriction by adjacent nucleosomes. This tool is a reimplementation of the algorithm described in (Locke et al. 2010). - ------ - -**Citations** - -Locke G, Tolkunov D, Moqtaderi Z, Struhl K and Morozov AV (2010) High-throughput sequencing reveals a simple model of nucleosome energetics. Proceedings of the National Academy of Sciences 107: 20998–21003 - -Percus JK (1976) Equilibrium state of a classical fluid of hard rods in an external field. J Stat Phys 15: 505–511 - -</help> -</tool>
--- a/galaxy-conf/Phasogram.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,27 +0,0 @@ -<tool id="Phasogram" name="Make phasogram" version="1.0.0"> - <description>of dyads</description> - <command interpreter="sh">galaxyToolRunner.sh nucleosomes.Phasogram -i $input -m $max -o $output</command> - <inputs> - <param name="input" type="data" format="bigwig,wig" label="Dyads (Big)Wig file" /> - <param name="max" type="integer" value="1000" label="Maximum phase shift (bp)" /> - </inputs> - <outputs> - <data name="output" format="tabular" /> - </outputs> - - <help> - -This tool calculates the phase distribution of sequencing data. It can be used to identify genome-wide periodicities. Phase counts are aggregated for each base pair across the genome. This is equivalent to summing the autocovariance of a sliding window across the genome. The tool is a reimplementation of the algorithm described in (Valouev et al. 2011). - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - ------ - -**Citation** - -Valouev A, Johnson SM, Boyd SD, Smith CL, Fire AZ and Sidow A (2011) Determinants of nucleosome organization in primary human cells. Nature 474: 516–520 - - </help> -</tool>
--- a/galaxy-conf/PowerSpectrum.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,59 +0,0 @@ -<tool id="PowerSpectrum" name="Compute the power spectrum" version="1.0.0"> - <description>of data in a Wiggle file</description> - <command interpreter="sh">galaxyToolRunner.sh ngs.PowerSpectrum -i $input -l $windows -m $max -o $output</command> - <inputs> - <param format="bigwig,wig" name="input" type="data" label="Input data" /> - <param format="bed,bedgraph,gff" name="windows" type="data" label="List of intervals" /> - <param name="max" type="integer" value="40" label="Number of frequencies to output" /> - </inputs> - <outputs> - <data format="tabular" name="output" /> - </outputs> - -<help> - -This tool computes the power spectrum of intervals of sequencing data. For each interval provided, the normalized power spectrum is calculated, representing the relative power in each frequency. Power spectra are normalized to have total power 1, with the DC component (0 frequency) removed. Power spectra are computed using the FFT_ implementation in JTransforms_. - -.. _FFT: http://en.wikipedia.org/wiki/Fast_Fourier_transform - -.. _JTransforms: http://sites.google.com/site/piotrwendykier/software/jtransforms - ------ - -**Syntax** - -- **Input data** is the genomic data on which to compute the power spectrum. -- **List of intervals:** The power spectrum will be computed for each genomic interval specified in this list. -- **Number of frequencies:** The power spectrum will be truncated at this frequency in the output - ------ - -**Output** - -The output has the following format :: - - chr start stop id alignment strand freq1 freq2 ... - -up to the maximum frequency specified. Frequencies are truncated to reduce the size of the output since signals are often band-limited. - ------ - -.. 
class:: warningmark - -**NOTE:** Even though frequencies may be truncated in the output, all frequencies in the power spectrum are computed and used for normalization. - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. Intervals must be provided in Bed, BedGraph, or GFF format. - ------ - -This tool is equivalent to the following Matlab commands, where x is a vector with the interval of sequencing data :: - - N = length(x); - f = fft(x); - p = abs(f(2:N/2)).^2; - p = p / sum(p); - -</help> -</tool>
--- a/galaxy-conf/ReadLengthDistributionMatrix.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,63 +0,0 @@ -<tool id="ReadLengthDistributionMatrix" name="Create read length distribution matrix" version="1.0.0"> - <description>across a genomic interval</description> - <command interpreter="sh">galaxyToolRunner.sh ngs.ReadLengthDistributionMatrix -i $input --chr $chr --start $start --stop $stop --min $min --max $max --bin $bin -o $output</command> - <inputs> - <param format="sam,bam,bed,bedgraph" name="input" type="data" label="Mapped reads" /> - <param name="chr" type="text" label="Chromosome" /> - <param name="start" type="integer" value="1" label="Start base pair" /> - <param name="stop" type="integer" value="1000" label="Stop base pair" /> - <param name="min" type="integer" value="1" label="Minimum fragment length (bp)" /> - <param name="max" type="integer" value="200" label="Maximum fragment length (bp)" /> - <param name="bin" type="integer" value="1" label="Fragment length bin size (bp)" /> - </inputs> - <outputs> - <data format="tabular" name="output" /> - </outputs> - -<help> - -This tool will create a matrix (in matrix2png_ format) with the distribution of read lengths over each base pair. Reads are binned by genomic location and length to create a matrix where each column represents the distribution of read lengths over that base pair. The resulting matrix can be turned into heatmap using the Visualization -> Make heatmap with matrix2png tool. - -.. _matrix2png: http://bioinformatics.ubc.ca/matrix2png/dataformat.html - -.. class:: warningmark - -This tool requires paired-end SAM, BAM, Bed, or BedGraph formatted data. Using single-end data will result in a constant read length. 
- ------ - -**Syntax** - -- **Mapped reads** are the mapped paired-end reads used to make the histograms -- **Chromosome** a locus in the genome -- **Start base pair** a locus in the genome -- **Stop base pair** a locus in the genome -- **Minimum fragment length** is the lowest fragment length bin. Reads shorter than this will be ignored. -- **Maximum fragment length** is the highest fragment length bin. Reads longer than this will be ignored. -- **Fragment length bin size** is the bin size used when making the fragment length histograms - ------ - -**Example** - -Make a matrix with the read length distribution across the region chrI:5001-6000, looking at reads 100-200bp in length in bins of 1bp: - -- **Chromosome:** chrI -- **Start:** 5001 -- **Stop:** 6000 -- **Minimum fragment length:** 100 -- **Maximum fragment length:** 200 -- **Fragment length bin size:** 1 - -The resulting matrix will be 1000x101, with each column representing a base pair and each row representing a read length. The column headers give the base pair and the row headers give the read length. - ------ - -**Citation** - -This tool was inspired by the analysis and figures in - -Floer M, Wang X, Prabhu V, Berrozpe G, Narayan S, Spagna D, Alvarez D, Kendall J, Krasnitz A, Stepansky A, Hicks J, Bryant GO and Ptashne M (2010) A RSC/nucleosome complex determines chromatin architecture and facilitates activator binding. Cell 141: 407–418 - -</help> -</tool>
--- a/galaxy-conf/RollingReadLength.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,20 +0,0 @@ -<tool id="RollingReadLength" name="Compute mean fragment length" version="1.1.0"> - <description>over each locus</description> - <command interpreter="sh">galaxyToolRunner.sh ngs.RollingReadLength -i $input -a ${chromInfo} -o $output</command> - <inputs> - <param format="sam,bam,bed,bedgraph" name="input" type="data" label="Mapped reads" /> - </inputs> - <outputs> - <data format="wig" name="output" /> - </outputs> - -<help> - -This tool will compute the mean length of all fragments overlapping a given locus, and can be used to identify sites with exceptionally long or short reads. - -.. class:: warningmark - -This tool requires paired-end SAM, BAM, Bed, or BedGraph formatted data. Using single-end data will result in a constant read length. - -</help> -</tool>
--- a/galaxy-conf/RomanNumeralize.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,22 +0,0 @@ -<tool id="RomanNumeralize" name="Convert Arabic to Roman numerals" version="1.0.0"> - <description>on any file</description> - <command interpreter="sh">galaxyToolRunner.sh converters.RomanNumeralize -i $input -o $output</command> - <inputs> - <param name="input" type="data" label="Convert Arabic integer chromosome coordinates in" /> - </inputs> - <outputs> - <data name="output" format="input" /> - </outputs> - <tests> - <test> - <param name="input" value="romanNumeralize.input"/> - <output name="output" file="romanNumeralize.output"/> - </test> - </tests> - -<help> - -This tool scans any file with chromosomal coordinates of the form "chr5" and replaces them with "chrV". - -</help> -</tool>
--- a/galaxy-conf/Scale.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,60 +0,0 @@ -<tool id="WigScale" name="Scale" version="1.2.0"> - <description>a (Big)Wig file</description> - <command interpreter="sh">galaxyToolRunner.sh wigmath.Scale -i $input -m $M $chr -o $output</command> - <inputs> - <param format="bigwig,wig" name="input" type="data" label="Scale the data in" /> - <param name="M" type="float" value="0" label="Multiply by (leave 0 to scale by 1/mean)" /> - <param name="chr" type="boolean" checked="false" truevalue="--bychr" falsevalue="" label="Scale chromosomes to 1/mean individually (no effect if scale factor is specified)" /> - </inputs> - <outputs> - <data format="wig" name="output" metadata_source="input" /> - </outputs> - <tests> - <!--<test> - <param name="input" value="wigmath.input1"/> - <param name="T" value="0"/> - <param name="dbkey" value="sacCer2"/> - <output name="output" file="percenter.output1"/> - </test> - <test> - <param name="input" value="wigmath.input1.bw"/> - <param name="T" value="0"/> - <param name="dbkey" value="sacCer2"/> - <output name="output" file="percenter.output1"/> - </test> - <test> - <param name="input" value="wigmath.input2"/> - <param name="T" value="2"/> - <param name="dbkey" value="sacCer2"/> - <output name="output" file="percenter.output2"/> - </test> - <test> - <param name="input" value="wigmath.input2.bw"/> - <param name="T" value="2"/> - <param name="dbkey" value="sacCer2"/> - <output name="output" file="percenter.output2"/> - </test> - <test> - <param name="input" value="wigmath.input3"/> - <param name="T" value="1000000"/> - <param name="dbkey" value="sacCer2"/> - <output name="output" file="percenter.output3"/> - </test> - <test> - <param name="input" value="wigmath.input3.bw"/> - <param name="T" value="1000000"/> - <param name="dbkey" value="sacCer2"/> - <output name="output" file="percenter.output3"/> - </test>--> - </tests> - - <help> - -This tool will multiply all 
values in a Wig file by a scale factor. For example, this can be used to normalize to read depth by multiplying by 1/(# reads). By default, the tool will scale to 1/(mean value), which is equivalent to dividing by coverage and multiplying by the size of the genome. The resulting output file should have mean 1. - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - - </help> -</tool>
--- a/galaxy-conf/Shift.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,21 +0,0 @@ -<tool id="WigShift" name="Mean shift" version="1.2.0"> - <description>a (Big)Wig file</description> - <command interpreter="sh">galaxyToolRunner.sh wigmath.Shift -i $input -m $M $chr -o $output</command> - <inputs> - <param format="bigwig,wig" name="input" type="data" label="Shift the data in" /> - <param name="M" type="float" value="0" label="To have mean" /> - <param name="chr" type="boolean" checked="false" truevalue="--bychr" falsevalue="" label="Mean-shift chromosomes individually" /> - </inputs> - <outputs> - <data format="wig" name="output" metadata_source="input" /> - </outputs> - <help> - -This tool will shift all values in a Wig file by a scalar so that the output has the desired mean. - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - - </help> -</tool>
--- a/galaxy-conf/StripMatrix.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,37 +0,0 @@ -<tool id="StripMatrix" name="Strip headers" version="1.1.0"> - <description>from an aligned matrix</description> - <command interpreter="sh">galaxyToolRunner.sh visualization.StripMatrix -i $input -o $output</command> - <inputs> - <param format="tabular" name="input" type="data" label="Aligned matrix" /> - </inputs> - <outputs> - <data format="tabular" name="output" metadata="input" /> - </outputs> - <tests> - <test> - <param name="input" value="test.matrix2png.txt"/> - <output name="output" file="stripMatrix.txt"/> - </test> - </tests> - - <help> - -This tool is intended to strip the column/row headers off of an aligned matrix (in matrix2png format) for easy import into Matlab or other software where only the data values are required. It removes the first row and first column from a tabular file. - ------ - -**Example** - -If the following tabular matrix is used as input :: - - ID col1 col2 col3 - row1 2 4 5 - row2 5 1 1 - -then the following tabular matrix will be produced as output :: - - 2 4 5 - 5 1 1 - - </help> -</tool>
--- a/galaxy-conf/Subtract.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,47 +0,0 @@ -<tool id="WigSubtract" name="Subtract" version="1.1.0"> - <description>two (Big)Wig files</description> - <command interpreter="sh">galaxyToolRunner.sh wigmath.Subtract -m $minuend -s $subtrahend -o $output</command> - <inputs> - <param format="bigwig,wig" name="minuend" type="data" label="File 1 (minuend / top)" /> - <param format="bigwig,wig" name="subtrahend" type="data" label="File 2 (subtrahend / bottom)" /> - </inputs> - <outputs> - <data format="wig" name="output" metadata_source="minuend" /> - </outputs> - <tests> - <!--<test> - <param name="minuend" value="wigmath.input1"/> - <param name="subtrahend" value="wigmath.input2"/> - <param name="dbkey" value="sacCer2"/> - <output name="output" file="difference.output"/> - </test> - <test> - <param name="minuend" value="wigmath.input1.bw"/> - <param name="subtrahend" value="wigmath.input2"/> - <param name="dbkey" value="sacCer2"/> - <output name="output" file="difference.output"/> - </test> - <test> - <param name="minuend" value="wigmath.input1"/> - <param name="subtrahend" value="wigmath.input2.bw"/> - <param name="dbkey" value="sacCer2"/> - <output name="output" file="difference.output"/> - </test> - <test> - <param name="minuend" value="wigmath.input1.bw"/> - <param name="subtrahend" value="wigmath.input2.bw"/> - <param name="dbkey" value="sacCer2"/> - <output name="output" file="difference.output"/> - </test>--> - </tests> - - <help> - -This tool will subtract the values in one Wig file from another, base pair by base pair. - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. Use "edit attributes" to set the correct format if it was not detected correctly. - - </help> -</tool>
--- a/galaxy-conf/Summary.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,83 +0,0 @@ -<tool id="WigSummary" name="Output a summary" version="1.1.0"> - <description>of a (Big)Wig file</description> - <command interpreter="sh">galaxyToolRunner.sh wigmath.Summary -i $input -o $output</command> - <inputs> - <param format="bigwig,wig" name="input" type="data" label="(Big)Wig file" /> - </inputs> - <outputs> - <data format="txt" name="output" /> - </outputs> - <tests> - <test> - <param name="input" value="wigmath1.wig"/> - <output name="output" file="wigsummary1.txt"/> - </test> - <test> - <param name="input" value="test.wig"/> - <output name="output" file="wigsummary2.txt"/> - </test> - <test> - <param name="input" value="test.bw"/> - <output name="output" file="wigsummary3.txt"/> - </test> - </tests> - -<help> - -This tool will output a summary of a Wig or BigWig file, including information about the chromosomes and types of contigs in the Wig file, as well as basic descriptive statistics. 
- ------ - -**Example:** - -The following is an example of the output of this tool :: - - ASCII Text Wiggle file: track type=wiggle_0 - Chromosomes: - 2micron start=1 stop=6318 - chrVI start=1 stop=270148 - chrI start=1 stop=230208 - chrIII start=1 stop=316617 - chrXII start=1 stop=1078175 - chrXV start=1 stop=1091289 - chrXVI start=1 stop=948062 - chrII start=1 stop=813178 - chrVIII start=1 stop=562643 - chrX start=1 stop=745742 - chrXIII start=1 stop=924429 - chrV start=1 stop=576869 - chrXIV start=1 stop=784333 - chrIV start=1 stop=1531919 - chrXI start=1 stop=666454 - chrIX start=1 stop=439885 - chrM start=1 stop=85779 - chrVII start=1 stop=1090947 - Contigs: - fixedStep chrom=2micron start=1 span=1 step=1 - fixedStep chrom=chrVI start=1 span=1 step=1 - fixedStep chrom=chrI start=1 span=1 step=1 - fixedStep chrom=chrIII start=1 span=1 step=1 - fixedStep chrom=chrXII start=1 span=1 step=1 - fixedStep chrom=chrXVI start=1 span=1 step=1 - fixedStep chrom=chrXV start=1 span=1 step=1 - fixedStep chrom=chrII start=1 span=1 step=1 - fixedStep chrom=chrVIII start=1 span=1 step=1 - fixedStep chrom=chrXIII start=1 span=1 step=1 - fixedStep chrom=chrX start=1 span=1 step=1 - fixedStep chrom=chrV start=1 span=1 step=1 - fixedStep chrom=chrXIV start=1 span=1 step=1 - fixedStep chrom=chrIV start=1 span=1 step=1 - fixedStep chrom=chrXI start=1 span=1 step=1 - fixedStep chrom=chrIX start=1 span=1 step=1 - fixedStep chrom=chrM start=1 span=1 step=1 - fixedStep chrom=chrVII start=1 span=1 step=1 - Basic Statistics: - Mean: 1.000000164913575 - Standard Deviation: 1.8843731523620193 - Total: 1.2162997005843896E7 - Bases Covered: 12162995 - Min value: 0.0 - Max value: 277.98996 - -</help> -</tool>
--- a/galaxy-conf/ValueDistribution.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,53 +0,0 @@ -<tool id="WigValueDistribution" name="Compute the value distribution" version="1.1.0"> - <description>of a (Big)Wig file</description> - <command interpreter="sh">galaxyToolRunner.sh wigmath.ValueDistribution -i $input - #if str( $min ) != '' - --min $min - #end if - - #if str( $max ) != '' - --max $max - #end if - - -n $bins -o $output - </command> - <inputs> - <param format="bigwig,wig" name="input" type="data" label="(Big)Wig file" /> - <param name="min" type="float" optional="true" label="Minimum bin value (optional)" /> - <param name="max" type="float" optional="true" label="Maximum bin value (optional)" /> - <param name="bins" type="integer" value="40" label="Number of bins" /> - </inputs> - <outputs> - <data format="txt" name="output" /> - </outputs> - -<help> - -This tool computes a histogram of the values in a Wig file, as well as the moments of the distribution. - ------ - -**Syntax** - -- **Input data** is the genomic data used to compute the histogram. -- **Minimum bin value** is the smallest bin. If unset, it is equal to the minimum value in the input data -- **Maximum bin value** is the largest bin. If unset, it is equal to the maximum value in the input data -- **Number of bins** is the number of bins to use. The bin size will be equal to (max - min) / (# bins). - ------ - -**Output** - -The output is in 2-column tabular format, where the first column represents the lower edge of a bin interval and the second column represents the number of values that fell in that bin. For example if the **minimum bin value** is 0, the **maximum bin value** is 0.3, and the **number of bins** is 3, then the following output might be produced :: - - bin count - <0 3 - 0 1 - 0.1 10 - 0.2 4 - >0.3 12 - -where there were 3 values in (-inf, 0), 1 value in [0, 0.1), 10 values in [0.1, 0.2), 4 values in [0.2, 0.3), and 12 values in [0.3, inf).
- -</help> -</tool>
--- a/galaxy-conf/WaveletTransform.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,40 +0,0 @@ -<tool id="WaveletTransform" name="Wavelet analysis" version="1.0.0"> - <description>across a genomic interval</description> - <command interpreter="sh">galaxyToolRunner.sh ngs.WaveletTransform -i $input -w $wavelet --chr $chr --start $start --stop $stop --min $min --max $max --step $N -o $output</command> - <inputs> - <param format="wig,bigwig" name="input" type="data" label="Sequencing data" /> - <param format="tabular" name="wavelet" type="data" label="Wavelet" /> - <param name="chr" type="text" label="Chromosome" /> - <param name="start" type="integer" value="1" label="Start base pair" /> - <param name="stop" type="integer" value="1000" label="Stop base pair" /> - <param name="min" type="integer" value="10" label="Minimum wavelet size (bp)" /> - <param name="max" type="integer" value="400" label="Maximum wavelet size (bp)" /> - <param name="N" type="integer" value="1" label="Scaling step size (bp)" /> - </inputs> - <outputs> - <data format="tabular" name="output" /> - </outputs> - -<help> - -This tool will perform a Wavelet_ scaling_ analysis on an interval of genomic data. For each base pair in the interval, the similarity (correlation) is calculated between the data and the wavelet over a range of scales. This can be used to identify high-frequency and low-frequency features in the data. The output is a matrix in matrix2png format that can be used to generate a heatmap: along the x-axis (columns) are the base pairs in the interval, along the y-axis (rows) are the correlation coefficients for each Wavelet size, with the largest Wavelet scale at the top and the smallest scale at the bottom. - -.. _Wavelet: http://en.wikipedia.org/wiki/Wavelet - -.. _scaling: http://en.wikipedia.org/wiki/Scaleogram - ------ - -**Syntax** - -- **Input data** is the genomic data on which to compute the Wavelet scaling analysis. 
-- **Wavelet** a single column of values representing a discrete Wavelet. -- **Chromosome** a locus in the genome -- **Start base pair** a locus in the genome -- **Stop base pair** a locus in the genome -- **Minimum wavelet size** the smallest Wavelet to analyze -- **Maximum wavelet size** the largest Wavelet to analyze -- **Scaling step size** the step size for the range of wavelet scales. The provided wavelet will be scaled to each size in the set min:step:max by interpolating the provided wavelet. - -</help> -</tool>
--- a/galaxy-conf/ZScore.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,51 +0,0 @@ -<tool id="WigZScore" name="Z-Score" version="1.2.0"> - <description>a (Big)Wig file</description> - <command interpreter="sh">galaxyToolRunner.sh wigmath.ZScore -i $input $chr -o $output</command> - <inputs> - <param format="bigwig,wig" name="input" type="data" label="Z-score the data in" /> - <param name="chr" type="boolean" checked="false" truevalue="--bychr" falsevalue="" label="Z-score chromosomes individually" /> - </inputs> - <outputs> - <data format="wig" name="output" metadata_source="input" /> - </outputs> - <tests> - <test> - <param name="input" value="wigmath1.wig"/> - <output name="output" file="zscorer1.wig"/> - </test> - <test> - <param name="input" value="wigmath2.wig"/> - <output name="output" file="zscorer2.wig"/> - </test> - <test> - <param name="input" value="wigmath3.wig"/> - <output name="output" file="zscorer3.wig"/> - </test> - <test> - <param name="input" value="wigmath1.bw"/> - <output name="output" file="zscorer4.wig"/> - </test> - <test> - <param name="input" value="wigmath2.bw"/> - <output name="output" file="zscorer5.wig"/> - </test> - <test> - <param name="input" value="wigmath3.bw"/> - <output name="output" file="zscorer6.wig"/> - </test> - </tests> - - <help> - -This tool will compute normal scores (Z-scores) for each of the values in a Wig file. For each base pair, the Z-scored value is equal to the deviance from the mean divided by the standard deviation (i.e. the number of standard deviations a value is away from the mean). The output file should have mean 0 and standard deviation 1. - -.. class:: infomark - -This tool is equivalent to using the **Mean Shift** tool to shift a Wig file to mean 0, then using the **Scale** tool to scale by 1/(standard deviation). - -.. class:: infomark - -**TIP:** If your dataset does not appear in the pulldown menu, it means that it is not in Wig or BigWig format. 
Use "edit attributes" to set the correct format if it was not detected correctly. - - </help> -</tool>
--- a/galaxy-conf/galaxyToolRunner.sh Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,18 +0,0 @@ -#!/usr/bin/env bash - -if [ $# -eq 0 ] -then - echo "USAGE: galaxyToolRunner.sh APPNAME [ARGS]"; - exit; -fi - -# Verify that the user has Java 7 installed -# Otherwise there will be an obscure UnsupportedClassVersion error -version=$(java -version 2>&1 | awk -F '"' '/version/ {print $2}') -if [[ "$version" < "1.7" ]]; then - echo "Need Java 7 or greater. You have Java $version installed." - exit -fi - -DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )" -java -Dlog4j.configuration=log4j.properties -cp $DIR:$DIR/../build:$DIR/../dist/*:$DIR/../lib/* edu.unc.genomics."$@" \ No newline at end of file
--- a/galaxy-conf/log4j.properties Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,12 +0,0 @@ -log4j.rootLogger=info, stdout - -log4j.appender.stdout=org.apache.log4j.ConsoleAppender -log4j.appender.stdout.layout=org.apache.log4j.PatternLayout - -# Pattern to output only the log message followed by a line separator. -log4j.appender.stdout.layout.ConversionPattern=%m%n - -# Only output errors from the BigWig library -log4j.logger.org.broad.igv.bbfile=ERROR -# Only output errors from java-genomics-io -log4j.logger.edu.unc.genomics.io=ERROR \ No newline at end of file
--- a/galaxy-conf/matrix2png.xml Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,114 +0,0 @@ -<tool id="matrix2png" name="Make heatmap" version="1.0.0"> - <description>using matrix2png</description> - <requirement type='package'>matrix2png</requirement> - <command>matrix2png -data $input - #if str( $range ) != '' - -range $range - #end if - - -con $con - -size $size - -numcolors $numcolors - -minsize $minsize - -mincolor $mincolor - -maxcolor $maxcolor - -bkgcolor $bkgcolor - -missingcolor $missingcolor - - #if str( $map ) != '' - -map $map - #end if - - #if str( $discrete_color_maps.discrete ) != 'false' - -discrete - -dmap $dmap - #end if - - #if str( $numr ) != '' - -numr $numr - #end if - - #if str( $numc ) != '' - -numc $numc - #end if - - -startrow $startrow - -startcol $startcol - - #if str( $trim ) != '0' - -trim $trim - #end if - - #if str( $title ) != '' - -title '$title' - #end if - - $z $b $d $s $r $c $f $e $l $u - - > $output</command> - <inputs> - <param name="input" type="data" format="tabular" label="Input data" /> - <param name="title" type="text" optional="true" size="30" label="Add a title" /> - <param name="size" type="text" optional="true" value="1:1" label="Pixel dimensions per value as x:y" /> - <param name="minsize" type="text" optional="true" value="800:600" label="Minimum image size as x:y pixels" /> - <!-- Not sure what this is, so exclude for now - <param name="desctext" type="data" label="Description Text?" 
/> --> - <param name="range" type="text" optional="true" label="Values assigned to mincolor and maxcolor as min:max (default is data range)" /> - <param name="con" type="float" optional="true" value="1.0" label="Contrast (only applies when not using -range option)" /> - <param name="numcolors" type="integer" optional="true" value="64" label="Number of colors" /> - <param name="mincolor" type="text" optional="true" value="blue" label="Color used at lowest value (name or r:g:b triplet)" /> - <param name="maxcolor" type="text" optional="true" value="yellow" label="Color used at highest value (name or r:g:b triplet)" /> - <param name="bkgcolor" type="text" optional="true" value="white" label="Color used as background (name or r:g:b triplet)" /> - <param name="missingcolor" type="text" optional="true" value="grey" label="Color used for missing values (name or r:g:b triplet)" /> - <param name="map" type="text" optional="true" label="Color choices from preset maps: overrides min/max colors and -b (default = 0 (none))" /> - <conditional name="discrete_color_maps"> - <param name="discrete" type="select" label="Use discretized mapping of values to colors"> - <option value="true">Yes</option> - <option value="false" selected="true">No</option> - </param> - <when value="true"> - <param name="dmap" type="data" label="Discrete color mapping file to use for discrete mapping (default = preset)" /> - </when> - <when value="false"> - <!-- No values here --> - </when> - </conditional> - <param name="numr" type="text" optional="true" label="Number of rows to process (default = all)" /> - <param name="numc" type="text" optional="true" label="Number of columns to process (default = all)" /> - <param name="startrow" type="integer" optional="true" value="1" label="Index of the first row to be processed" /> - <param name="startcol" type="integer" optional="true" value="1" label="Index of the first column to be processed" /> - <param name="trim" type="integer" optional="true" value="0" 
label="Trim this percent of data extremes when determining data range (only without the -range option)" /> - <param name="z" type="boolean" checked="false" truevalue="-z" falsevalue="" label="Row-normalize the data to mean 0 and variance 1" /> - <param name="b" type="boolean" checked="true" truevalue="-b" falsevalue="" label="Middle of color range is black" /> - <param name="d" type="boolean" checked="false" truevalue="-d" falsevalue="" label="Add cell dividers" /> - <param name="s" type="boolean" checked="true" truevalue="-s" falsevalue="" label="Add scale bar" /> - <param name="r" type="boolean" checked="false" truevalue="-r" falsevalue="" label="Add row names" /> - <param name="c" type="boolean" checked="false" truevalue="-c" falsevalue="" label="Add column names" /> - <param name="f" type="boolean" checked="false" truevalue="-f" falsevalue="" label="Data file has a format line" /> - <param name="e" type="boolean" checked="false" truevalue="-e" falsevalue="" label="Draw ellipses instead of rectangles" /> - <param name="l" type="boolean" checked="false" truevalue="-l" falsevalue="" label="Log transform the data (base 2)" /> - <param name="u" type="boolean" checked="false" truevalue="-u" falsevalue="" label="Put the column labels under the picture instead of above (ignored unless column names)" /> - <param name="g" type="boolean" checked="false" truevalue="-g" falsevalue="" label="Put the row labels to the left instead of the right (ignored unless row names)" /> - </inputs> - <outputs> - <data name="output" format="png" /> - </outputs> - - <help> - -.. class:: warningmark - -This tool requires that matrix2png be installed and available in Galaxy's PATH. - -.. class:: warningmark - -This tool requires tabular data with column AND row headers. For more information about the required format and usage instructions, see the matrix2png_ website. - -.. _matrix2png: http://bioinformatics.ubc.ca/matrix2png/dataformat.html - -.. 
class:: warningmark - -It is recommended to specify the colorspace range since outliers will often skew it otherwise. - - </help> -</tool>
--- a/sam_fa_indices.loc.sample Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,28 +0,0 @@ -#This is a sample file distributed with Galaxy that enables tools -#to use a directory of Samtools indexed sequences data files. You will need -#to create these data files and then create a sam_fa_indices.loc file -#similar to this one (store it in this directory) that points to -#the directories in which those files are stored. The sam_fa_indices.loc -#file has this format (white space characters are TAB characters): -# -#index <seq> <location> -# -#So, for example, if you had hg18 indexed stored in -#/depot/data2/galaxy/sam/, -#then the sam_fa_indices.loc entry would look like this: -# -#index hg18 /depot/data2/galaxy/sam/hg18.fa -# -#and your /depot/data2/galaxy/sam/ directory -#would contain hg18.fa and hg18.fa.fai files: -# -#-rw-r--r-- 1 james universe 830134 2005-09-13 10:12 hg18.fa -#-rw-r--r-- 1 james universe 527388 2005-09-13 10:12 hg18.fa.fai -# -#Your sam_fa_indices.loc file should include an entry per line for -#each index set you have stored. The file in the path does actually -#exist, but it should never be directly used. Instead, the name serves -#as a prefix for the index file. For example: -# -#index hg18 /depot/data2/galaxy/sam/hg18.fa -#index hg19 /depot/data2/galaxy/sam/hg19.fa
--- a/tool_data_table_conf.xml.sample Tue Jun 19 22:09:23 2012 -0400 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,118 +0,0 @@ -<!-- Use the file tool_data_table_conf.xml.oldlocstyle if you don't want to update your loc files as changed in revision 4550:535d276c92bc--> -<tables> - <!-- Locations of all fasta files under genome directory --> - <table name="all_fasta" comment_char="#"> - <columns>value, dbkey, name, path</columns> - <file path="tool-data/all_fasta.loc" /> - </table> - <!-- Locations of indexes in the BFAST mapper format --> - <table name="bfast_indexes" comment_char="#"> - <columns>value, dbkey, formats, name, path</columns> - <file path="tool-data/bfast_indexes.loc" /> - </table> - <!-- Locations of nucleotide (mega)blast databases --> - <table name="blastdb" comment_char="#"> - <columns>value, name, path</columns> - <file path="tool-data/blastdb.loc" /> - </table> - <!-- Locations of protein (mega)blast databases --> - <table name="blastdb_p" comment_char="#"> - <columns>value, name, path</columns> - <file path="tool-data/blastdb_p.loc" /> - </table> - <!-- Locations of indexes in the Bowtie mapper format --> - <table name="bowtie_indexes" comment_char="#"> - <columns>value, dbkey, name, path</columns> - <file path="tool-data/bowtie_indices.loc" /> - </table> - <!-- Locations of indexes in the Bowtie2 mapper format --> - <table name="bowtie2_indexes" comment_char="#"> - <columns>value, dbkey, name, path</columns> - <file path="tool-data/bowtie2_indices.loc" /> - </table> - <!-- Locations of indexes in the Bowtie color-space mapper format --> - <table name="bowtie_indexes_color" comment_char="#"> - <columns>value, dbkey, name, path</columns> - <file path="tool-data/bowtie_indices_color.loc" /> - </table> - <!-- Locations of indexes in the BWA mapper format --> - <table name="bwa_indexes" comment_char="#"> - <columns>value, dbkey, name, path</columns> - <file path="tool-data/bwa_index.loc" /> - </table> - <!-- Locations of indexes in the BWA 
color-space mapper format --> - <table name="bwa_indexes_color" comment_char="#"> - <columns>value, dbkey, name, path</columns> - <file path="tool-data/bwa_index_color.loc" /> - </table> - <!-- Locations of MAF files that have been indexed with bx-python --> - <table name="indexed_maf_files"> - <columns>name, value, dbkey, species</columns> - <file path="tool-data/maf_index.loc" /> - </table> - <!-- Locations of fasta files appropriate for NGS simulation --> - <table name="ngs_sim_fasta" comment_char="#"> - <columns>value, dbkey, name, path</columns> - <file path="tool-data/ngs_sim_fasta.loc" /> - </table> - <!-- Locations of 2bit sequence files for use in Lastz --> - <table name="lastz_seqs" comment_char="#"> - <columns>value, name, path</columns> - <file path="tool-data/lastz_seqs.loc" /> - </table> - <!-- Locations of PerM base index files --> - <table name="perm_base_indexes" comment_char="#"> - <columns>value, name, path</columns> - <file path="tool-data/perm_base_index.loc" /> - </table> - <!-- Locations of PerM color-space index files --> - <table name="perm_color_indexes" comment_char="#"> - <columns>value, name, path</columns> - <file path="tool-data/perm_color_index.loc" /> - </table> - <!-- Location of SAMTools indexes and other files --> - <table name="sam_fa_indexes" comment_char="#"> - <columns>line_type, value, path</columns> - <file path="tool-data/sam_fa_indices.loc" /> - </table> - <!-- Location of Picard dict file and other files --> - <table name="picard_indexes" comment_char="#"> - <columns>value, dbkey, name, path</columns> - <file path="tool-data/picard_index.loc" /> - </table> - <!-- Location of Picard dict files valid for GATK --> - <table name="gatk_picard_indexes" comment_char="#"> - <columns>value, dbkey, name, path</columns> - <file path="tool-data/gatk_sorted_picard_index.loc" /> - </table> - <!-- Available of GATK references --> - <table name="gatk_annotations" comment_char="#"> - <columns>value, name, gatk_value, 
tools_valid_for</columns> - <file path="tool-data/gatk_annotations.txt" /> - </table> - <!-- Location of SRMA dict file and other files --> - <table name="srma_indexes" comment_char="#"> - <columns>value, dbkey, name, path</columns> - <file path="tool-data/picard_index.loc" /> - </table> - <!-- Locations of indexes in the Bowtie mapper format for TopHat to use --> - <table name="tophat_indexes" comment_char="#"> - <columns>value, dbkey, name, path</columns> - <file path="tool-data/bowtie_indices.loc" /> - </table> - <!-- Locations of indexes in the Bowtie color-space mapper format for TopHat to use --> - <table name="tophat_indexes_color" comment_char="#"> - <columns>value, dbkey, name, path</columns> - <file path="tool-data/bowtie_indices_color.loc" /> - </table> - <!-- Locations of configurations in the CCAT peak/region caller format --> - <table name="ccat_configurations" comment_char="#"> - <columns>value, name, path</columns> - <file path="tool-data/ccat_configurations.loc" /> - </table> - <!-- Location of Mosaik files --> - <table name="mosaik_indexes" comment_char="#"> - <columns>value, dbkey, name, path</columns> - <file path="tool-data/mosaik_index.loc" /> - </table> -</tables>