annotate rgFastQC.xml @ 2:2611a96c30b7 draft

Deleted selected files
author iuc
date Sat, 18 Jan 2014 22:33:36 -0500
parents 39b1c10532a4
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
1 <tool name="FastQC: Comprehensive QC" id="fastqc" version="0.53">
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
2 <description>reporting for short read sequence</description>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
3 <command interpreter="python">
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
4 rgFastQC.py -i "$input_file" -d "$html_file.files_path" -o "$html_file" -n "$out_prefix" -f "$input_file.ext" -j "$input_file.name"
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
5 #if $contaminants.dataset and str($contaminants) > ''
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
6 -c "$contaminants"
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
7 #end if
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
8 -e fastqc
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
9 </command>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
10 <requirements>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
11 <requirement type="package" version="0.10.1">fastqc_dist_0_10_1</requirement>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
12 </requirements>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
13 <inputs>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
14 <param format="fastqsanger,fastq,bam,sam" name="input_file" type="data" label="Short read data from your current history" />
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
15 <param name="out_prefix" value="FastQC" type="text" label="Title for the output file - to remind you what the job was for" size="80"
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
16 help="Letters and numbers only please - other characters will be removed">
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
17 <sanitizer invalid_char="">
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
18 <valid initial="string.letters,string.digits"/>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
19 </sanitizer>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
20 </param>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
21 <param name="contaminants" type="data" format="tabular" optional="true" label="Contaminant list"
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
22 help="tab delimited file with 2 columns: name and sequence. For example: Illumina Small RNA RT Primer CAAGCAGAAGACGGCATACGA"/>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
23 </inputs>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
24 <outputs>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
25 <data format="html" name="html_file" label="${out_prefix}_${input_file.name}.html" />
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
26 </outputs>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
27 <tests>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
28 <test>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
29 <param name="input_file" value="1000gsample.fastq" />
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
30 <param name="out_prefix" value="fastqc_out" />
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
31 <param name="contaminants" value="fastqc_contaminants.txt" ftype="tabular" />
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
32 <output name="html_file" file="fastqc_report.html" ftype="html" lines_diff="100"/>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
33 </test>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
34 </tests>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
35 <help>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
36
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
37 .. class:: infomark
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
38
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
39 **Purpose**
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
40 Quote from FastQC_:
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
41
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
42 FastQC aims to provide a simple way to do some quality control checks on raw
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
43 sequence data coming from high throughput sequencing pipelines.
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
44 It provides a modular set of analyses which you can use to give a quick
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
45 impression of whether your data has any problems of
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
46 which you should be aware before doing any further analysis.
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
47
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
48 The main functions of FastQC are:
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
49
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
50 - Import of data from BAM, SAM or FastQ files (any variant)
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
51 - Providing a quick overview to tell you in which areas there may be problems
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
52 - Summary graphs and tables to quickly assess your data
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
53 - Export of results to an HTML based permanent report
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
54 - Offline operation to allow automated generation of reports without running the interactive application
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
55
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
56 FastQC_ is the best place to look for documentation - it's very good.
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
57 Some features of the Galaxy wrapper you are using are described below.
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
58
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
59 -----
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
60
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
61 .. class:: infomark
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
62
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
63 **This Galaxy Tool**
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
64 You are using FastQC_ in Galaxy.
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
65 This is easy because it has been packaged into a Galaxy tool by the Intergalactic Utilities Commission.
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
66 It exposes the external package FastQC_, which is documented at the FastQC_ website.
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
67 Kindly acknowledge it as well as this tool if you use it.
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
68 FastQC incorporates the Picard-tools_ libraries for sam/bam processing.
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
69
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
70 The contaminants file parameter was borrowed from the independently developed
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
71 fastqcwrapper contributed to the Galaxy Community Tool Shed by Jim Johnson.
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
72
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
73 -----
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
74
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
75 .. class:: infomark
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
76
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
77 **Inputs and outputs**
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
78
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
79 This wrapper will accept a Galaxy fastq, sam or bam as the input read file to check.
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
80 It will also take an optional file containing a list of contaminants, in the form of
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
81 a tab-delimited file with 2 columns, name and sequence.
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
82
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
83 FastQC_ produces a single HTML output file, slightly adjusted so that it looks good in Galaxy, which contains all of the results, including the following:
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
84
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
85 - Basic Statistics
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
86 - Per base sequence quality
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
87 - Per sequence quality scores
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
88 - Per base sequence content
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
89 - Per base GC content
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
90 - Per sequence GC content
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
91 - Per base N content
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
92 - Sequence Length Distribution
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
93 - Sequence Duplication Levels
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
94 - Overrepresented sequences
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
95 - Kmer Content
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
96
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
97 All except Basic Statistics and Overrepresented sequences are plots.
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
98 .. _FastQC: http://www.bioinformatics.bbsrc.ac.uk/projects/fastqc/
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
99 .. _Picard-tools: http://picard.sourceforge.net/index.shtml
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
100
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
101 </help>
39b1c10532a4 Remove intermediate directory
iuc
parents:
diff changeset
102 </tool>