# HG changeset patch # User devteam # Date 1415303549 18000 # Node ID 86c73f0eb389c11350915bed75c8d7c1ea6727de # Parent d04dfa7de2dc3d83587a0922c9fa8cab9da6df4b Uploaded diff -r d04dfa7de2dc -r 86c73f0eb389 bwa-mem.xml --- a/bwa-mem.xml Thu Nov 06 14:52:14 2014 -0500 +++ b/bwa-mem.xml Thu Nov 06 14:52:29 2014 -0500 @@ -1,5 +1,10 @@ - + + + + bwa_macros.xml + + bwa samtools @@ -56,8 +61,8 @@ #if str( $fastq_input.fastq_input_selector ) == "paired_iv": ## For interleaved fastq files set -p option -p - #if str( $fastq_input.iv_stats.iv_stats_selector ) == "True": ## check that insert statistics is used - -I "${fastq_input.iv_stats.iset_stats}" + #if str( $fastq_input.iset_stats ): ## check that insert statistics is used + -I "${fastq_input.iset_stats}" #end if #end if @@ -118,23 +123,37 @@ #if str( $fastq_input.fastq_input_selector ) == "paired": - #if str( $fastq_input.paired_stats.paired_stats_selector ) == "True": ## check that insert statistics is used - -I "${fastq_input.paired_stats.iset_stats}" + #if str( $fastq_input.iset_stats ): ## check that insert statistics is used + -I "${fastq_input.iset_stats}" #end if "${reference_fasta_filename}" "${fastq_input.fastq_input1}" "${fastq_input.fastq_input2}" + #elif str( $fastq_input.fastq_input_selector ) == "paired_collection": + + #if str( $fastq_input.iset_stats ): ## check that insert statistics is used + -I "${fastq_input.iset_stats}" + #end if + + + "${reference_fasta_filename}" + + "${fastq_input.fastq_input1.forward}" "${fastq_input.fastq_input1.reverse}" + #else: - + + "${reference_fasta_filename}" "${fastq_input.fastq_input1}" #end if - | samtools view -Sb - > $bam_output + | samtools view -Sb - > temporary_bam_file.bam && + + samtools sort -f temporary_bam_file.bam ${bam_output} @@ -155,71 +174,52 @@ - + + - - - - - - - - - - - - - - - - - - - - - + + + + + + + + + + + + + - - - - - - - - - - - - - - - - - - - - - - + + + + + + + - + + + + @@ -252,7 +252,10 @@ - + + + + @@ -271,8 +274,12 @@ + - + + + + @@ -297,8 +304,12 @@ + - + + + + @@ -418,31 +429,13 @@ (4 sigma from the mean if absent) and min of the insert size distribution. FR orientation only. [inferred] ------- -.. class:: warningmark - -**An important note on Read Groups** - -One of the recommended best practices in NGS analysis is adding read group information to BAM files. You can do thid directly in BWA MEM interface using the -**Specify readgroup information?** widget. If you are not familiar with readgroups you shold know that this is effectively a way to tag reads with an additional ID. -This allows you to combine BAM files from, for example, multiple BWA MEM runs into a single dataset. This significantly simplifies downstream processing as -instead of dealing with multiple datasets you only have to handle only one. This is possible because the readgroup information allows you to identify -data from different experiments even if they are combined in one file. Many downstream analysis tools such as varinat callers (e.g., FreeBayes or Naive Varinat Caller -present in Galaxy) are aware of readgtroups and will automatically generate calls for each individual sample even if they are combined within a single file. +@dataset_collections@ ------ - -.. class:: infomark - -**More info** +@RG@ -To obtain more information about BWA MEM and ask questions use these resources: +@info@ - 1. https://biostar.usegalaxy.org/ - 2. https://www.biostars.org/ - 3. https://github.com/lh3/bwa - 4. http://bio-bwa.sourceforge.net/