view plotFingerprint.xml @ 8:449dc21ee4e9 draft

planemo upload for repository commit 2c5f94de9ddf6798e49b7e9c340c841ca2bfbcfe
author bgruening
date Mon, 19 Sep 2016 17:38:54 -0400
parents b9660f621e82
children 314348664620
line wrap: on
line source

<tool id="deeptools_plot_fingerprint" name="plotFingerprint" version="@WRAPPER_VERSION@.0">
    <!-- Short summary displayed next to the tool name. -->
    <description>plots profiles of BAM files; useful for assessing ChIP signal strength</description>
        <!-- @BINARY@ expands to the text "plotFingerprint" wherever the token is referenced. -->
        <token name="@BINARY@">plotFingerprint</token>
    <!-- Software requirements are provided by the macro named "requirements". -->
    <expand macro="requirements" />
            ## Input BAM files, their labels, and the destination of the plot.
            ## NOTE(review): the files and labels variables are not assigned anywhere
            ## in this excerpt; presumably a macro token sets them earlier. Confirm.
            --bamfiles #echo " ".join($files)
            --labels #echo " ".join($labels)
            --plotFile '$outFileName'

            ## Image format: the user's selection when the advanced output settings
            ## are shown, PNG otherwise. Exactly one plotFileFormat flag is emitted.
            #if $output.showOutputSettings == "yes":
                --plotFileFormat '$output.outFileFormat'
                ## The raw bin counts are only written on request.
                #if $output.saveRawCounts:
                    --outRawCounts '$outFileRawCounts'
                #end if
            #else:
                --plotFileFormat 'png'
            #end if

            ## Restrict the analysis to a region only when one was entered.
            #if str($region).strip() != '':
                --region '$region'
            #end if

            #if $advancedOpt.showAdvancedOpt == "yes":
                --binSize '$advancedOpt.binSize'
                --numberOfSamples '$advancedOpt.numberOfSamples'

                ## NOTE(review): the read-processing, skipZeros and blacklist inputs
                ## are declared in the advanced section of the form, but no matching
                ## flags are emitted here. Confirm whether they are passed elsewhere.

                #if $advancedOpt.minMappingQuality:
                --minMappingQuality '$advancedOpt.minMappingQuality'
                #end if

                ## Skip the title flag when the field is unset or empty.
                #if $advancedOpt.plotTitle and str($advancedOpt.plotTitle.value) != "":
                    --plotTitle '$advancedOpt.plotTitle'
                #end if
            #end if

        <expand macro="multiple_input_bams" />
        <expand macro="region_limit_operation" />

        <!-- Advanced options: the parameters under "yes" are only offered when the user opts in. -->
        <conditional name="advancedOpt">
            <param name="showAdvancedOpt" type="select" label="Show advanced options" >
                <option value="no" selected="true">no</option>
                <option value="yes">yes</option>
            </param>
            <when value="no" />
            <when value="yes">
                <!-- Width of each sampled window, in bases. -->
                <param argument="--binSize" type="integer" value="500" min="1"
                   label="Bin size in bases"
                   help="Length in bases for a window used to sample the genome."/>
                <!-- How many windows are sampled. -->
                <param argument="--numberOfSamples" type="integer" value="100000" min="1"
                   label="Number of samples"
                   help="Number of bins sampled from the genome for which the overlapping reads are counted."/>
                <expand macro="read_processing_options" />
                <expand macro="skipZeros" />
                <expand macro="plotTitle" />
                <expand macro="blacklist" />
            </when>
        </conditional>

        <!-- Advanced output settings: image format and optional raw bin-count table. -->
        <conditional name="output">
            <param name="showOutputSettings" type="select" label="Show advanced output settings">
                <option value="no" selected="true">no</option>
                <option value="yes">yes</option>
            </param>
            <when value="no" />
            <when value="yes">
                <expand macro="input_image_file_format" />
                <!-- When checked, the command template passes the outRawCounts flag. -->
                <param name="saveRawCounts" type="boolean" label="Save the bin counts" help="(--outRawCounts)"/>
            </when>
        </conditional>
        <expand macro="output_image_file_format" />
        <!-- Tabular bin counts; kept only when the advanced output settings are shown
             and "Save the bin counts" is checked. The filter is a single-line Python
             expression so it evaluates without needing enclosing parentheses. -->
        <data format="tabular" name="outFileRawCounts" label="${tool.name} on ${on_string}: bin counts">
            <filter>output['showOutputSettings'] == 'yes' and output['saveRawCounts'] is True</filter>
        </data>
            <!-- Case 1: default settings; only the PNG plot is produced. -->
            <test>
                <param name="bamfiles" value="bowtie2 test1.bam,bowtie2 test1.bam" ftype="bam" />
                <param name="showAdvancedOpt" value="no" />
                <param name="showOutputSettings" value="no" />
                <output name="outFileName" file="plotFingerprint_result1.png" ftype="png" compare="sim_size" />
            </test>
            <!-- Case 2: advanced options with a custom title, plus the raw bin-count table. -->
            <test>
                <param name="bamfiles" value="bowtie2 test1.bam,bowtie2 test1.bam" ftype="bam" />
                <param name="showAdvancedOpt" value="yes" />
                <param name="showOutputSettings" value="yes" />
                <param name="saveRawCounts" value="True" />
                <param name="plotTitle" value="Test Fingerprint Plot" />
                <output name="outFileName" file="plotFingerprint_result2.png" ftype="png" compare="sim_size" />
                <output name="outFileRawCounts" file="plotFingerprint_result2.tabular" ftype="tabular" />
            </test>

**What it does**

This tool is useful for assessing the strength of a ChIP (i.e. how clearly the enrichment signal can be separated from the background)
and is based on a method described in Diaz et al. (2012) Stat Appl Genet Mol Biol 11(3).


The default output is a diagnostic plot (see below for an example and further down for some background information).

Optionally, you can obtain the table of raw counts that was used to generate the plot.

.. image:: $PATH_TO_IMAGES/plotFingerprint_output.png
  :width: 600
  :height: 395

**Example plot**

What follows is the output of ``plotFingerprint`` with our test ChIP-Seq data sets, limiting the analysis to chromosome X. Single-end reads were extended to
200 bp (advanced options).

.. image:: $PATH_TO_IMAGES/bamFP_galaxy_output.png
   :width: 600
   :height: 450


**Theoretical Background**

The tool first samples indexed BAM files and counts all reads overlapping a window (bin) of the specified length.
These counts are then sorted according to their rank (the bin with the highest number of reads has the highest rank)
and the cumulative sum of read counts is plotted. An ideal input (control) with a uniform distribution of read alignments
results in a diagonal line. A very specific and strong ChIP enrichment, on the other hand, would result in a large portion
of reads accumulating in just a few bins and the resulting plot showing a steep rise toward the right-most edge. Such results are
most commonly seen with transcription factors.

.. image:: $PATH_TO_IMAGES/QC_fingerprint.png
   :width: 600
   :height: 294


    <!-- Citation entries are pulled in from the macro named "citations". -->
    <expand macro="citations" />