# HG changeset patch # User jjohnson # Date 1614171746 0 # Node ID b7795c2f0b811aeed6f252b08532af4c4537e1c0 # Parent 0ad5327b80cc1ff86306a7d66370a365a9c1abbf "planemo upload commit 692ea558cbbefee93859dc2b005fab5ac4970eb8" diff -r 0ad5327b80cc -r b7795c2f0b81 fgbio_call_molecular_consensus_reads.xml --- a/fgbio_call_molecular_consensus_reads.xml Sun Feb 21 23:40:53 2021 +0000 +++ b/fgbio_call_molecular_consensus_reads.xml Wed Feb 24 13:02:26 2021 +0000 @@ -24,8 +24,8 @@ --min-input-base-quality=$filter_options.min_input_base_quality #end if - #if $bam_options.read-name-prefix - --read-name-prefix='$bam_options.read-name-prefix' + #if $bam_options.read_name_prefix + --read-name-prefix='$bam_options.read_name_prefix' #end if #if $bam_options.tag --tag=$bam_options.tag @@ -41,20 +41,18 @@ #end if ]]> - + -

- - - - + + +

- - + + @@ -64,13 +62,16 @@

- + - + output_rejects == True + - + + + diff -r 0ad5327b80cc -r b7795c2f0b81 macros.xml --- a/macros.xml Sun Feb 21 23:40:53 2021 +0000 +++ b/macros.xml Wed Feb 24 13:02:26 2021 +0000 @@ -17,22 +17,33 @@ + + + + + + + + + + + pairs much like the CIGAR string in BAM files. Four kinds of operators are recognized: - T identifies a template read - B identifies a sample barcode read - M identifies a unique molecular index read - S identifies a set of bases that should be skipped or ignored + - T identifies a template read + - B identifies a sample barcode read + - M identifies a unique molecular index read + - S identifies a set of bases that should be skipped or ignored The last pair may be specified using a + sign instead of number to denote “all remaining bases”. This is useful if, e.g., fastqs have been trimmed and contain reads of varying length. For example to convert a paired-end run with an index read and where the first 5 bases of R1 are a UMI and the second five bases are monotemplate you might specify: diff -r 0ad5327b80cc -r b7795c2f0b81 macros.xml.bak --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/macros.xml.bak Wed Feb 24 13:02:26 2021 +0000 @@ -0,0 +1,56 @@ + + 1.3.0 + 0 + + + fgbio + + + + (([1-9][0-9]*[TBMS])*([+]|[1-9][0-9]*)[TBMS]) + @READ_STRUCTURE_PATTERN@(\s@READ_STRUCTURE_PATTERN@)* + + ^@READ_STRUCTURES_PATTERN@$ + + + ^[A-Za-z][A-Za-z]$ + + + + + + + + + + + pairs much like the CIGAR string in BAM files. Four kinds of operators are recognized: + + - T identifies a template read + - B identifies a sample barcode read + - M identifies a unique molecular index read + - S identifies a set of bases that should be skipped or ignored + +The last pair may be specified using a + sign instead of number to denote “all remaining bases”. This is useful if, e.g., fastqs have been trimmed and contain reads of varying length. For example to convert a paired-end run with an index read and where the first 5 bases of R1 are a UMI and the second five bases are monotemplate you might specify: + +:: + + --input r1.fq r2.fq i1.fq --read-structures 5M5S+T +T +B + +Alternative if you know your reads are of fixed length you could specify: + +:: + + --input r1.fq r2.fq i1.fq --read-structures 5M5S65T 75T 8B + + +]]> + + + + + +