Mercurial > repos > iuc > data_manager_star_index_builder
comparison data_manager/macros.xml @ 12:71c994a11f71 draft default tip
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/data_managers/data_manager_star_index_builder commit 57d05675396f0b44265fb4dbc8f9f891c6073219
| author | iuc |
|---|---|
| date | Thu, 05 Dec 2024 06:49:40 +0000 |
| parents | d63c1442407f |
| children |
comparison
equal
deleted
inserted
replaced
| 11:d63c1442407f | 12:71c994a11f71 |
|---|---|
| 2 <!-- REMEMBER to bump the version of @IDX_VERSION_SUFFIX@ | 2 <!-- REMEMBER to bump the version of @IDX_VERSION_SUFFIX@ |
| 3 whenever you make changes to the @TOOL_VERSION@ token! | 3 whenever you make changes to the @TOOL_VERSION@ token! |
| 4 The data manager uses a symlink to this macro file to keep the STAR and | 4 The data manager uses a symlink to this macro file to keep the STAR and |
| 5 the index versions in sync, but you should manually update @IDX_VERSION_SUFFIX@ --> | 5 the index versions in sync, but you should manually update @IDX_VERSION_SUFFIX@ --> |
| 6 <!-- STAR version to be used --> | 6 <!-- STAR version to be used --> |
| 7 <token name="@TOOL_VERSION@">2.7.10b</token> | 7 <token name="@TOOL_VERSION@">2.7.11a</token> |
| 8 <token name="@VERSION_SUFFIX@">3</token> | 8 <token name="@VERSION_SUFFIX@">1</token> |
| 9 <token name="@PROFILE@">21.01</token> | 9 <token name="@PROFILE@">21.01</token> |
| 10 <!-- STAR index version compatible with this version of STAR | 10 <!-- STAR index version compatible with this version of STAR |
| 11 This is the STAR version that introduced the index structure expected | 11 This is the STAR version that introduced the index structure expected |
| 12 by the current version. | 12 by the current version. |
| 13 It can be found for any specific version of STAR with: | 13 It can be found for any specific version of STAR with: |
| 14 STAR -h | grep versionGenome | 14 STAR -h | grep versionGenome |
| 15 or by looking for the versionGenome parameter in source/parametersDefault | 15 or by looking for the versionGenome parameter in source/parametersDefault |
| 16 of STAR's source code --> | 16 of STAR's source code --> |
| 17 <token name="@IDX_VERSION@">2.7.4a</token> | 17 <token name="@IDX_VERSION@">2.7.4a</token> |
| 18 <token name="@IDX_VERSION_SUFFIX@">1</token> | 18 <token name="@IDX_VERSION_SUFFIX@">3</token> |
| 19 <token name="@IDX_DATA_TABLE@">rnastar_index2x_versioned</token> | 19 <token name="@IDX_DATA_TABLE@">rnastar_index2x_versioned</token> |
| 20 | |
| 21 <xml name="requirements"> | 20 <xml name="requirements"> |
| 22 <requirements> | 21 <requirements> |
| 23 <requirement type="package" version="@TOOL_VERSION@">star</requirement> | 22 <requirement type="package" version="@TOOL_VERSION@">star</requirement> |
| 24 <requirement type="package" version="1.16.1">samtools</requirement> | 23 <requirement type="package" version="1.18">samtools</requirement> |
| 25 <requirement type="package" version="1.12">gzip</requirement> | 24 <requirement type="package" version="1.13">gzip</requirement> |
| 26 <yield /> | 25 <yield/> |
| 27 </requirements> | 26 </requirements> |
| 28 </xml> | 27 </xml> |
| 29 | |
| 30 <xml name="edam"> | 28 <xml name="edam"> |
| 31 <edam_topics> | 29 <edam_topics> |
| 32 <edam_topic>topic_3170</edam_topic> | 30 <edam_topic>topic_3170</edam_topic> |
| 33 <edam_topic>topic_3308</edam_topic> | 31 <edam_topic>topic_3308</edam_topic> |
| 34 </edam_topics> | 32 </edam_topics> |
| 35 <edam_operations> | 33 <edam_operations> |
| 36 <edam_operation>operation_0292</edam_operation> | 34 <edam_operation>operation_0292</edam_operation> |
| 37 </edam_operations> | 35 </edam_operations> |
| 38 </xml> | 36 </xml> |
| 39 | |
| 40 <xml name="index_selection" token_with_gene_model="0"> | 37 <xml name="index_selection" token_with_gene_model="0"> |
| 41 <param argument="--genomeDir" type="select" | 38 <param argument="--genomeDir" type="select" label="Select reference genome" help="If your genome of interest is not listed, contact the Galaxy team"> |
| 42 label="Select reference genome" | |
| 43 help="If your genome of interest is not listed, contact the Galaxy team"> | |
| 44 <options from_data_table="@IDX_DATA_TABLE@"> | 39 <options from_data_table="@IDX_DATA_TABLE@"> |
| 45 <filter type="static_value" column="4" value="@WITH_GENE_MODEL@" /> | 40 <filter type="static_value" column="4" value="@WITH_GENE_MODEL@"/> |
| 46 <filter type="static_value" column="5" value="@IDX_VERSION@" /> | 41 <filter type="static_value" column="5" value="@IDX_VERSION@"/> |
| 47 <filter type="sort_by" column="2" /> | 42 <filter type="sort_by" column="2"/> |
| 48 <validator type="no_options" message="No indexes are available for the selected input dataset" /> | 43 <validator type="no_options" message="No indexes are available for the selected input dataset"/> |
| 49 </options> | 44 </options> |
| 50 </param> | 45 </param> |
| 51 </xml> | 46 </xml> |
| 52 | |
| 53 <token name="@FASTQ_GZ_OPTION@"> | 47 <token name="@FASTQ_GZ_OPTION@"> |
| 54 --readFilesCommand zcat | 48 --readFilesCommand zcat |
| 55 </token> | 49 </token> |
| 56 <xml name="citations"> | 50 <xml name="citations"> |
| 57 <citations> | 51 <citations> |
| 58 <citation type="doi">10.1093/bioinformatics/bts635</citation> | 52 <citation type="doi">10.1093/bioinformatics/bts635</citation> |
| 59 </citations> | 53 </citations> |
| 60 </xml> | 54 </xml> |
| 61 <xml name="SJDBOPTIONS"> | 55 <xml name="SJDBOPTIONS"> |
| 62 <param argument="--sjdbGTFfile" type="data" format="gff3,gtf" label="Gene model (gff3,gtf) file for splice junctions" optional="false" help="Exon junction information for mapping splices"/> | 56 <param argument="--sjdbGTFfile" type="data" format="gff3,gtf" label="Gene model (gff3,gtf) file for splice junctions" optional="false" help="Exon junction information for mapping splices"/> |
| 63 <param argument="--sjdbOverhang" type="integer" min="1" value="100" label="Length of the genomic sequence around annotated junctions" help="Used in constructing the splice junctions database. Ideal value is ReadLength-1"/> | 57 <param argument="--sjdbGTFfeatureExon" type="text" value="exon" label="Elements to use from the gene model to use for splice junctions" help="By default and for almost all cases: 'exon', referring to finding junctions at the RNA splice sites. This can optionally be changed to allow splicing at other levels, such as 'gene', 'transcript', 'CDS'."/> |
| 58 <param argument="--sjdbOverhang" type="integer" min="1" value="100" label="Length of the genomic sequence around annotated junctions" help="Used in constructing the splice junctions database. Ideal value is ReadLength-1"/> | |
| 64 </xml> | 59 </xml> |
| 65 <xml name="dbKeyActions"> | 60 <xml name="dbKeyActions"> |
| 66 <actions> | 61 <actions> |
| 67 <expand macro="dbKeyAction"/> | 62 <expand macro="dbKeyAction"/> |
| 68 </actions> | 63 </actions> |
| 77 </option> | 72 </option> |
| 78 </action> | 73 </action> |
| 79 </when> | 74 </when> |
| 80 <when value="history"> | 75 <when value="history"> |
| 81 <action type="metadata" name="dbkey"> | 76 <action type="metadata" name="dbkey"> |
| 82 <option type="from_param" name="refGenomeSource.genomeFastaFiles" param_attribute="dbkey" /> | 77 <option type="from_param" name="refGenomeSource.genomeFastaFiles" param_attribute="dbkey"/> |
| 83 </action> | 78 </action> |
| 84 </when> | 79 </when> |
| 85 </conditional> | 80 </conditional> |
| 86 </xml> | 81 </xml> |
| 87 <token name="@TEMPINDEX@"><![CDATA[ | 82 <token name="@TEMPINDEX@"><![CDATA[ |
| 101 #if 'GTFconditional' in $refGenomeSource: | 96 #if 'GTFconditional' in $refGenomeSource: |
| 102 ## GTFconditional exists only in STAR, but not STARsolo | 97 ## GTFconditional exists only in STAR, but not STARsolo |
| 103 #if str($refGenomeSource.GTFconditional.GTFselect) == 'with-gtf': | 98 #if str($refGenomeSource.GTFconditional.GTFselect) == 'with-gtf': |
| 104 --sjdbOverhang '${refGenomeSource.GTFconditional.sjdbOverhang}' | 99 --sjdbOverhang '${refGenomeSource.GTFconditional.sjdbOverhang}' |
| 105 --sjdbGTFfile '${refGenomeSource.GTFconditional.sjdbGTFfile}' | 100 --sjdbGTFfile '${refGenomeSource.GTFconditional.sjdbGTFfile}' |
| 101 --sjdbGTFfeatureExon '${refGenomeSource.GTFconditional.sjdbGTFfeatureExon}' | |
| 106 #if str($refGenomeSource.GTFconditional.sjdbGTFfile.ext) == 'gff3': | 102 #if str($refGenomeSource.GTFconditional.sjdbGTFfile.ext) == 'gff3': |
| 107 --sjdbGTFtagExonParentTranscript Parent | 103 --sjdbGTFtagExonParentTranscript Parent |
| 108 #end if | 104 #end if |
| 109 #end if | 105 #end if |
| 110 #else: | 106 #else: |
| 111 ## ref genome selection is less complex for STARsolo cause | 107 ## ref genome selection is less complex for STARsolo because |
| 112 ## with-gtf is mandatory there | 108 ## with-gtf is mandatory there |
| 113 --sjdbOverhang '${refGenomeSource.sjdbOverhang}' | 109 --sjdbOverhang '${refGenomeSource.sjdbOverhang}' |
| 114 --sjdbGTFfile '${refGenomeSource.sjdbGTFfile}' | 110 --sjdbGTFfile '${refGenomeSource.sjdbGTFfile}' |
| 111 --sjdbGTFfeatureExon '${refGenomeSource.sjdbGTFfeatureExon}' | |
| 115 #if str($refGenomeSource.sjdbGTFfile.ext) == 'gff3': | 112 #if str($refGenomeSource.sjdbGTFfile.ext) == 'gff3': |
| 116 --sjdbGTFtagExonParentTranscript Parent | 113 --sjdbGTFtagExonParentTranscript Parent |
| 117 #end if | 114 #end if |
| 118 #end if | 115 #end if |
| 119 #if str($refGenomeSource.genomeSAindexNbases): | 116 #if str($refGenomeSource.genomeSAindexNbases): |
| 120 --genomeSAindexNbases ${refGenomeSource.genomeSAindexNbases} | 117 --genomeSAindexNbases ${refGenomeSource.genomeSAindexNbases} |
| 118 #end if | |
| 119 ## Diploid mode | |
| 120 #if 'diploidconditional' in $refGenomeSource: | |
| 121 #if str($refGenomeSource.diploidconditional.diploid) == 'Yes': | |
| 122 --genomeTransformVCF '${refGenomeSource.diploidconditional.genomeTransformVCF}' | |
| 123 --genomeTransformType Diploid | |
| 124 #end if | |
| 121 #end if | 125 #end if |
| 122 --runThreadN \${GALAXY_SLOTS:-4} | 126 --runThreadN \${GALAXY_SLOTS:-4} |
| 123 ## in bytes | 127 ## in bytes |
| 124 --limitGenomeGenerateRAM \$((\${GALAXY_MEMORY_MB:-31000} * 1000000)) | 128 --limitGenomeGenerateRAM \$((\${GALAXY_MEMORY_MB:-31000} * 1000000)) |
| 125 && | 129 && |
| 126 #end if | 130 #end if |
| 127 ]]></token> | 131 ]]></token> |
| 128 <token name="@REFGENOMEHANDLING@" ><![CDATA[ | 132 <token name="@REFGENOMEHANDLING@"><![CDATA[ |
| 129 --runThreadN \${GALAXY_SLOTS:-4} | 133 --runThreadN \${GALAXY_SLOTS:-4} |
| 130 --genomeLoad NoSharedMemory | 134 --genomeLoad NoSharedMemory |
| 131 --genomeDir | 135 --genomeDir |
| 132 #if str($refGenomeSource.geneSource) == 'history': | 136 #if str($refGenomeSource.geneSource) == 'history': |
| 133 tempstargenomedir | 137 tempstargenomedir |
| 135 '${refGenomeSource.GTFconditional.genomeDir.fields.path}' | 139 '${refGenomeSource.GTFconditional.genomeDir.fields.path}' |
| 136 ## Handle difference between indices with/without annotations | 140 ## Handle difference between indices with/without annotations |
| 137 #if str($refGenomeSource.GTFconditional.GTFselect) == 'without-gtf-with-gtf': | 141 #if str($refGenomeSource.GTFconditional.GTFselect) == 'without-gtf-with-gtf': |
| 138 --sjdbOverhang $refGenomeSource.GTFconditional.sjdbOverhang | 142 --sjdbOverhang $refGenomeSource.GTFconditional.sjdbOverhang |
| 139 --sjdbGTFfile '${refGenomeSource.GTFconditional.sjdbGTFfile}' | 143 --sjdbGTFfile '${refGenomeSource.GTFconditional.sjdbGTFfile}' |
| 144 --sjdbGTFfeatureExon '${refGenomeSource.GTFconditional.sjdbGTFfeatureExon}' | |
| 140 #if str($refGenomeSource.GTFconditional.sjdbGTFfile.ext) == 'gff3': | 145 #if str($refGenomeSource.GTFconditional.sjdbGTFfile.ext) == 'gff3': |
| 141 --sjdbGTFtagExonParentTranscript Parent | 146 --sjdbGTFtagExonParentTranscript Parent |
| 142 #end if | 147 #end if |
| 143 #end if | 148 #end if |
| 144 #end if | 149 #end if |
| 145 ]]></token> | 150 ]]></token> |
| 146 <token name="@READSHANDLING@" ><![CDATA[ | 151 <token name="@READSHANDLING@"><![CDATA[ |
| 147 ## Check that the input pairs are of the same type | 152 ## Check that the input pairs are of the same type |
| 148 ## otherwise STARsolo will run for a long time and then error out. | 153 ## otherwise STARsolo will run for a long time and then error out. |
| 149 ## We consume either repeats of two inputs R1 + R2 | 154 ## We consume either repeats of two inputs R1 + R2 |
| 150 ## or a collection of paired reads. | 155 ## or a collection of paired reads. |
| 151 #if str($sc.input_types.use) == "repeat": | 156 #if str($sc.input_types.use) == "repeat": |
| 170 --soloCBmatchWLtype $sc.soloCBmatchWLtype | 175 --soloCBmatchWLtype $sc.soloCBmatchWLtype |
| 171 #if $r1.is_of_type('fastq.gz', 'fastqsanger.gz'): | 176 #if $r1.is_of_type('fastq.gz', 'fastqsanger.gz'): |
| 172 @FASTQ_GZ_OPTION@ | 177 @FASTQ_GZ_OPTION@ |
| 173 #end if | 178 #end if |
| 174 ]]></token> | 179 ]]></token> |
| 175 <token name="@LIMITS@" ><![CDATA[ | 180 <token name="@LIMITS@"><![CDATA[ |
| 176 --limitOutSJoneRead $getVar('algo.params.junction_limits.limitOutSJoneRead', $getVar('solo.junction_limits.limitOutSJoneRead', 1000)) | 181 --limitOutSJoneRead $getVar('algo.params.junction_limits.limitOutSJoneRead', $getVar('solo.junction_limits.limitOutSJoneRead', 1000)) |
| 177 --limitOutSJcollapsed $getVar('algo.params.junction_limits.limitOutSJcollapsed', $getVar('solo.junction_limits.limitOutSJcollapsed', 1000000)) | 182 --limitOutSJcollapsed $getVar('algo.params.junction_limits.limitOutSJcollapsed', $getVar('solo.junction_limits.limitOutSJcollapsed', 1000000)) |
| 178 --limitSjdbInsertNsj $getVar('algo.params.junction_limits.limitSjdbInsertNsj', $getVar('solo.junction_limits.limitSjdbInsertNsj', 1000000)) | 183 --limitSjdbInsertNsj $getVar('algo.params.junction_limits.limitSjdbInsertNsj', $getVar('solo.junction_limits.limitSjdbInsertNsj', 1000000)) |
| 179 ]]></token> | 184 ]]></token> |
| 180 <xml name="ref_selection"> | 185 <xml name="ref_selection"> |
| 181 <param argument="--genomeFastaFiles" type="data" format="fasta,fasta.gz" label="Select a reference genome" /> | 186 <param argument="--genomeFastaFiles" type="data" format="fasta,fasta.gz" label="Select a reference genome"/> |
| 182 <param argument="--genomeSAindexNbases" type="integer" min="2" max="16" value="14" label="Length of the SA pre-indexing string" help="Typically between 10 and 15. Longer strings will use much more memory, but allow faster searches. For small genomes, the parameter --genomeSAindexNbases must be scaled down to min(14, log2(GenomeLength)/2 - 1)"/> | 187 <param argument="--genomeSAindexNbases" type="integer" min="2" max="16" value="14" label="Length of the SA pre-indexing string" help="Typically between 10 and 15. Longer strings will use much more memory, but allow faster searches. For small genomes, the parameter --genomeSAindexNbases must be scaled down to min(14, log2(GenomeLength)/2 - 1)"/> |
| 183 </xml> | 188 </xml> |
| 184 <xml name="stdio" > | 189 <xml name="stdio"> |
| 185 <stdio> | 190 <stdio> |
| 186 <regex match="FATAL error" source="both" level="fatal"/> | 191 <regex match="FATAL error" source="both" level="fatal"/> |
| 187 <regex match="EXITING: FATAL INPUT ERROR:" source="both" level="fatal"/> | 192 <regex match="EXITING: FATAL INPUT ERROR:" source="both" level="fatal"/> |
| 188 <regex match="EXITING: fatal error trying to allocate genome arrays, exception thrown: std::bad_alloc" source="both" level="fatal"/> | 193 <regex match="EXITING: fatal error trying to allocate genome arrays, exception thrown: std::bad_alloc" source="both" level="fatal"/> |
| 189 <regex match="\[sam_read1\] missing header\? Abort!" source="both" level="fatal"/> | 194 <regex match="\[sam_read1\] missing header\? Abort!" source="both" level="fatal"/> |
| 190 <yield /> | 195 <yield/> |
| 191 </stdio> | 196 </stdio> |
| 192 </xml> | 197 </xml> |
| 193 <xml name="input_selection"> | 198 <xml name="input_selection"> |
| 194 <conditional name="input_types" > | 199 <conditional name="input_types"> |
| 195 <param name="use" type="select" label="Input Type" > | 200 <param name="use" type="select" label="Input Type"> |
| 196 <option value="repeat" >Separate barcode and cDNA reads</option> | 201 <option value="repeat">Separate barcode and cDNA reads</option> |
| 197 <option value="list_paired" >Paired collection of barcode and cDNA reads</option> | 202 <option value="list_paired">Paired collection of barcode and cDNA reads</option> |
| 198 </param> | 203 </param> |
| 199 <when value="repeat"> | 204 <when value="repeat"> |
| 200 <param format="fastq,fasta,fastq.gz,fastqsanger.gz" name="input1" type="data" multiple="true" | 205 <param format="fastq,fasta,fastq.gz,fastqsanger.gz" name="input1" type="data" multiple="true" label="RNA-Seq FASTQ/FASTA file, Barcode reads"/> |
| 201 label="RNA-Seq FASTQ/FASTA file, Barcode reads" /> | 206 <param format="fastq,fasta,fastq.gz,fastqsanger.gz" name="input2" type="data" multiple="true" label="RNA-Seq FASTQ/FASTA file, cDNA reads"/> |
| 202 <param format="fastq,fasta,fastq.gz,fastqsanger.gz" name="input2" type="data" multiple="true" | |
| 203 label="RNA-Seq FASTQ/FASTA file, cDNA reads"/> | |
| 204 </when> | 207 </when> |
| 205 <when value="list_paired"> | 208 <when value="list_paired"> |
| 206 <param name="input_collection" collection_type="paired" type="data_collection" format="fastq,fasta,fastq.gz,fastqsanger.gz" label="Collection of Pairs" /> | 209 <param name="input_collection" collection_type="paired" type="data_collection" format="fastq,fasta,fastq.gz,fastqsanger.gz" label="Collection of Pairs"/> |
| 207 </when> | 210 </when> |
| 208 </conditional> | 211 </conditional> |
| 209 </xml> | 212 </xml> |
| 210 <xml name="input_selection_smart_seq"> | 213 <xml name="input_selection_smart_seq"> |
| 211 <conditional name="input_types_smart_seq" > | 214 <conditional name="input_types_smart_seq"> |
| 212 <param name="use" type="select" label="Input Type" > | 215 <param name="use" type="select" label="Input Type"> |
| 213 <option value="list_single_end" >Single-end FASTQ collection</option> | 216 <option value="list_single_end">Single-end FASTQ collection</option> |
| 214 <option value="list_paired_end" >Paired FASTQ collection</option> | 217 <option value="list_paired_end">Paired FASTQ collection</option> |
| 215 </param> | 218 </param> |
| 216 <when value="list_single_end"> | 219 <when value="list_single_end"> |
| 217 <param name="single_end_collection" collection_type="list" type="data_collection" format="fastq,fasta,fastq.gz,fastqsanger.gz" label="List of single-end FASTQ files" /> | 220 <param name="single_end_collection" collection_type="list" type="data_collection" format="fastq,fasta,fastq.gz,fastqsanger.gz" label="List of single-end FASTQ files"/> |
| 218 </when> | 221 </when> |
| 219 <when value="list_paired_end"> | 222 <when value="list_paired_end"> |
| 220 <param name="paired_end_collection" collection_type="list:paired" type="data_collection" format="fastq,fasta,fastq.gz,fastqsanger.gz" label="List of paired-end FASTQ files" /> | 223 <param name="paired_end_collection" collection_type="list:paired" type="data_collection" format="fastq,fasta,fastq.gz,fastqsanger.gz" label="List of paired-end FASTQ files"/> |
| 221 </when> | 224 </when> |
| 222 </conditional> | 225 </conditional> |
| 223 </xml> | 226 </xml> |
| 224 <xml name="umidedup_options"> | 227 <xml name="umidedup_options"> |
| 225 <option value="1MM_All" selected="true">Collapse all UMIs with 1 mismatch distance to each other (1MM_All)</option> | 228 <option value="1MM_All" selected="true">Collapse all UMIs with 1 mismatch distance to each other (1MM_All)</option> |
| 226 <option value="1MM_Directional_UMItools" >Directional method from the UMI-tool</option> | 229 <option value="1MM_Directional_UMItools">Directional method from the UMI-tool</option> |
| 227 <option value="1MM_Directional" >Directional with stringent UMI deduplication</option> | 230 <option value="1MM_Directional">Directional with stringent UMI deduplication</option> |
| 228 </xml> | 231 </xml> |
| 229 <xml name="anchor_types"> | 232 <xml name="anchor_types"> |
| 230 <option value="0">Read start</option> | 233 <option value="0">Read start</option> |
| 231 <option value="1">Read end</option> | 234 <option value="1">Read end</option> |
| 232 <option value="2">Adapter start</option> | 235 <option value="2">Adapter start</option> |
| 233 <option value="3">Adapter end</option> | 236 <option value="3">Adapter end</option> |
| 234 </xml> | 237 </xml> |
| 235 <xml name="cb_match_wl_common"> | 238 <xml name="cb_match_wl_common"> |
| 236 <option value="Exact" >Exact</option> | 239 <option value="Exact">Exact</option> |
| 237 <option value="1MM" >Single match (1MM)</option> | 240 <option value="1MM">Single match (1MM)</option> |
| 238 </xml> | 241 </xml> |
| 239 <xml name="cb_match_wl_cellranger"> | 242 <xml name="cb_match_wl_cellranger"> |
| 240 <option value="1MM_multi" selected="true" >Multiple matches (CellRanger 2, 1MM_multi)</option> | 243 <option value="1MM_multi" selected="true">Multiple matches (CellRanger 2, 1MM_multi)</option> |
| 241 <option value="1MM_multi_pseudocounts" >Multiple matches (CellRanger 3, 1MM_multi_pseudocounts)</option> | 244 <option value="1MM_multi_pseudocounts">Multiple matches (CellRanger 3, 1MM_multi_pseudocounts)</option> |
| 242 <option value="1MM_multi_Nbase_pseudocounts" >Multimatching to WL is allowed for CBs with N-bases (CellRanger 3, 1MM_multi_Nbase_pseudocounts)</option> | 245 <option value="1MM_multi_Nbase_pseudocounts">Multimatching to WL is allowed for CBs with N-bases (CellRanger 3, 1MM_multi_Nbase_pseudocounts)</option> |
| 243 </xml> | 246 </xml> |
| 244 <xml name="solo_adapter_params"> | 247 <xml name="solo_adapter_params"> |
| 245 <param argument="--soloAdapterSequence" type="text" value="-" label="Adapter sequence to anchor barcodes." > | 248 <param argument="--soloAdapterSequence" type="text" value="-" label="Adapter sequence to anchor barcodes."> |
| 246 <sanitizer> | 249 <sanitizer> |
| 247 <valid initial="string.digits"> | 250 <valid initial="string.digits"> |
| 248 <add value="-"/> | 251 <add value="-"/> |
| 249 <add value="A"/> | 252 <add value="A"/> |
| 250 <add value="T"/> | 253 <add value="T"/> |
| 252 <add value="G"/> | 255 <add value="G"/> |
| 253 <add value="N"/> | 256 <add value="N"/> |
| 254 </valid> | 257 </valid> |
| 255 </sanitizer> | 258 </sanitizer> |
| 256 </param> | 259 </param> |
| 257 <param argument="--soloAdapterMismatchesNmax" type="integer" min="1" value="1" label="Maximum number of mismatches allowed in adapter sequence" /> | 260 <param argument="--soloAdapterMismatchesNmax" type="integer" min="1" value="1" label="Maximum number of mismatches allowed in adapter sequence"/> |
| 258 <param argument="--clipAdapterType" type="select" > | 261 <param argument="--clipAdapterType" type="select"> |
| 259 <option value="Hamming" selected="true" >Adapter clipping based on Hamming distance</option> | 262 <option value="Hamming" selected="true">Adapter clipping based on Hamming distance</option> |
| 260 <option value="CellRanger4" >5p and 3p adapter clipping similar to CellRanger4</option> | 263 <option value="CellRanger4">5p and 3p adapter clipping similar to CellRanger4</option> |
| 261 <option value="None" >No adapter clipping</option> | 264 <option value="None">No adapter clipping</option> |
| 262 </param> | 265 </param> |
| 263 </xml> | 266 </xml> |
| 264 <xml name="common_SAM_attributes"> | 267 <xml name="common_SAM_attributes"> |
| 265 <option value="NH" selected="true">NH (number of reported alignments/hits for the read)</option> | 268 <option value="NH" selected="true">NH (number of reported alignments/hits for the read)</option> |
| 266 <option value="HI" selected="true">HI (query hit index)</option> | 269 <option value="HI" selected="true">HI (query hit index)</option> |
| 271 <option value="jM">jM (intron motifs for all junctions)</option> | 274 <option value="jM">jM (intron motifs for all junctions)</option> |
| 272 <option value="jI">jI (1-based start and end of introns for all junctions)</option> | 275 <option value="jI">jI (1-based start and end of introns for all junctions)</option> |
| 273 </xml> | 276 </xml> |
| 274 <xml name="limits"> | 277 <xml name="limits"> |
| 275 <section name="junction_limits" title="Junction Limits" expanded="false"> | 278 <section name="junction_limits" title="Junction Limits" expanded="false"> |
| 276 <param argument="--limitOutSJoneRead" type="integer" min="1" value="1000" label="Maximum number of junctions for one read (including all multimappers)" /> | 279 <param argument="--limitOutSJoneRead" type="integer" min="1" value="1000" label="Maximum number of junctions for one read (including all multimappers)"/> |
| 277 <param argument="--limitOutSJcollapsed" type="integer" min="1" value="1000000" label="Maximum number of collapsed junctions" /> | 280 <param argument="--limitOutSJcollapsed" type="integer" min="1" value="1000000" label="Maximum number of collapsed junctions"/> |
| 278 <param argument="--limitSjdbInsertNsj" type="integer" min="0" value="1000000" label="Maximum number of inserts to be inserted into the genome on the fly." /> | 281 <param argument="--limitSjdbInsertNsj" type="integer" min="0" value="1000000" label="Maximum number of inserts to be inserted into the genome on the fly."/> |
| 279 </section> | 282 </section> |
| 280 </xml> | 283 </xml> |
| 281 <xml name="outCountActions"> | 284 <xml name="outCountActions"> |
| 282 <actions> | 285 <actions> |
| 283 <action name="column_names" type="metadata" default="GeneID,Counts_unstrand,Counts_firstStrand,Counts_secondStrand" /> | 286 <action name="column_names" type="metadata" default="GeneID,Counts_unstrand,Counts_firstStrand,Counts_secondStrand"/> |
| 284 <expand macro="dbKeyAction"/> | 287 <expand macro="dbKeyAction"/> |
| 285 </actions> | 288 </actions> |
| 286 </xml> | 289 </xml> |
| 287 <xml name="outWig"> | 290 <xml name="outWig"> |
| 288 <conditional name="outWig"> | 291 <conditional name="outWig"> |
| 291 <option value="bedGraph">Yes in bedgraph format</option> | 294 <option value="bedGraph">Yes in bedgraph format</option> |
| 292 <option value="wiggle">Yes in wiggle format</option> | 295 <option value="wiggle">Yes in wiggle format</option> |
| 293 </param> | 296 </param> |
| 294 <when value="None"> | 297 <when value="None"> |
| 295 <!-- This is necessary for the filtering of output --> | 298 <!-- This is necessary for the filtering of output --> |
| 296 <param name="outWigStrand" type="hidden" value="false" /> | 299 <param name="outWigStrand" type="hidden" value="false"/> |
| 297 </when> | 300 </when> |
| 298 <when value="bedGraph"> | 301 <when value="bedGraph"> |
| 299 <expand macro="outWigParams"/> | 302 <expand macro="outWigParams"/> |
| 300 </when> | 303 </when> |
| 301 <when value="wiggle"> | 304 <when value="wiggle"> |
| 339 #end if | 342 #end if |
| 340 ]]></token> | 343 ]]></token> |
| 341 <xml name="outWigOutputs"> | 344 <xml name="outWigOutputs"> |
| 342 <data format="bedgraph" name="signal_unique_str1" label="${tool.name} on ${on_string}: Coverage Uniquely mapped strand 1" from_work_dir="Signal.Unique.str1.out"> | 345 <data format="bedgraph" name="signal_unique_str1" label="${tool.name} on ${on_string}: Coverage Uniquely mapped strand 1" from_work_dir="Signal.Unique.str1.out"> |
| 343 <filter>outWig['outWigType'] != "None"</filter> | 346 <filter>outWig['outWigType'] != "None"</filter> |
| 344 <expand macro="dbKeyActions" /> | 347 <expand macro="dbKeyActions"/> |
| 345 <change_format> | 348 <change_format> |
| 346 <when input="outWig.outWigType" value="wiggle" format="wig" /> | 349 <when input="outWig.outWigType" value="wiggle" format="wig"/> |
| 347 </change_format> | 350 </change_format> |
| 348 </data> | 351 </data> |
| 349 <data format="bedgraph" name="signal_uniquemultiple_str1" label="${tool.name} on ${on_string}: Coverage Uniquely + Multiple mapped strand 1" from_work_dir="Signal.UniqueMultiple.str1.out"> | 352 <data format="bedgraph" name="signal_uniquemultiple_str1" label="${tool.name} on ${on_string}: Coverage Uniquely + Multiple mapped strand 1" from_work_dir="Signal.UniqueMultiple.str1.out"> |
| 350 <filter>outWig['outWigType'] != "None"</filter> | 353 <filter>outWig['outWigType'] != "None"</filter> |
| 351 <expand macro="dbKeyActions" /> | 354 <expand macro="dbKeyActions"/> |
| 352 <change_format> | 355 <change_format> |
| 353 <when input="outWig.outWigType" value="wiggle" format="wig" /> | 356 <when input="outWig.outWigType" value="wiggle" format="wig"/> |
| 354 </change_format> | 357 </change_format> |
| 355 </data> | 358 </data> |
| 356 <data format="bedgraph" name="signal_unique_str2" label="${tool.name} on ${on_string}: Coverage Uniquely mapped strand 2" from_work_dir="Signal.Unique.str2.out"> | 359 <data format="bedgraph" name="signal_unique_str2" label="${tool.name} on ${on_string}: Coverage Uniquely mapped strand 2" from_work_dir="Signal.Unique.str2.out"> |
| 357 <filter>outWig['outWigType'] != "None" and outWig['outWigStrand']</filter> | 360 <filter>outWig['outWigType'] != "None" and outWig['outWigStrand']</filter> |
| 358 <expand macro="dbKeyActions" /> | 361 <expand macro="dbKeyActions"/> |
| 359 <change_format> | 362 <change_format> |
| 360 <when input="outWig.outWigType" value="wiggle" format="wig" /> | 363 <when input="outWig.outWigType" value="wiggle" format="wig"/> |
| 361 </change_format> | 364 </change_format> |
| 362 </data> | 365 </data> |
| 363 <data format="bedgraph" name="signal_uniquemultiple_str2" label="${tool.name} on ${on_string}: Coverage Uniquely + Multiple mapped strand 2" from_work_dir="Signal.UniqueMultiple.str2.out"> | 366 <data format="bedgraph" name="signal_uniquemultiple_str2" label="${tool.name} on ${on_string}: Coverage Uniquely + Multiple mapped strand 2" from_work_dir="Signal.UniqueMultiple.str2.out"> |
| 364 <filter>outWig['outWigType'] != "None" and outWig['outWigStrand']</filter> | 367 <filter>outWig['outWigType'] != "None" and outWig['outWigStrand']</filter> |
| 365 <expand macro="dbKeyActions" /> | 368 <expand macro="dbKeyActions"/> |
| 366 <change_format> | 369 <change_format> |
| 367 <when input="outWig.outWigType" value="wiggle" format="wig" /> | 370 <when input="outWig.outWigType" value="wiggle" format="wig"/> |
| 368 </change_format> | 371 </change_format> |
| 369 </data> | 372 </data> |
| 370 </xml> | 373 </xml> |
| 371 <xml name="quantMode"> | 374 <xml name="quantMode"> |
| 372 <conditional name="quantmode_output"> | 375 <conditional name="quantmode_output"> |
| 373 <param argument="--quantMode" type="select" | 376 <param argument="--quantMode" type="select" label="Per gene/transcript output" help="STAR can provide analysis results not only with respect to the reference genome, but also with respect to genes and transcripts described by a gene model. Note: This functionality requires either the selection above of a cached index with a gene model, or a gene model provided alongside the index/reference genome in GTF or GFF3 format!"> |
| 374 label="Per gene/transcript output" | |
| 375 help="STAR can provide analysis results not only with respect to the reference genome, but also with respect to genes and transcripts described by a gene model. Note: This functionality requires either the selection above of a cached index with a gene model, or a gene model provided alongside the index/reference genome in GTF or GFF3 format!"> | |
| 376 <option value="-">No per gene or transcript output</option> | 377 <option value="-">No per gene or transcript output</option> |
| 377 <option value="GeneCounts">Per gene read counts (GeneCounts)</option> | 378 <option value="GeneCounts">Per gene read counts (GeneCounts)</option> |
| 378 <option value="TranscriptomeSAM">Transcript-based BAM output (TranscriptomeSAM)</option> | 379 <option value="TranscriptomeSAM">Transcript-based BAM output (TranscriptomeSAM)</option> |
| 379 <option value="TranscriptomeSAM GeneCounts">Both per gene read counts and transcript-based BAM output (TranscriptomeSAM GeneCounts)</option> | 380 <option value="TranscriptomeSAM GeneCounts">Both per gene read counts and transcript-based BAM output (TranscriptomeSAM GeneCounts)</option> |
| 380 </param> | 381 </param> |
| 381 <when value="-" /> | 382 <when value="-"/> |
| 382 <when value="GeneCounts" /> | 383 <when value="GeneCounts"/> |
| 383 <when value="TranscriptomeSAM"> | 384 <when value="TranscriptomeSAM"> |
| 384 <param argument="--quantTranscriptomeBan" type="boolean" truevalue="IndelSoftclipSingleend" falsevalue="Singleend" | 385 <param argument="--quantTranscriptomeBan" type="boolean" truevalue="IndelSoftclipSingleend" falsevalue="Singleend" label="Exclude alignments with indels or soft clipping from the transcriptome BAM output?" help="You will need to exclude alignments with indels and soft-clipped bases from the transcriptome BAM output for compatibility with certain transcript quantification tools, most notably RSEM. If you are using a tool, like eXpress, that can deal with indels and soft-clipped bases, you can achieve better results by leaving this option disabled."/> |
| 385 label="Exclude alignments with indels or soft clipping from the transcriptome BAM output?" | |
| 386 help="You will need to exclude alignments with indels and soft-clipped bases from the transcriptome BAM output for compatibility with certain transcript quantification tools, most notably RSEM. If you are using a tool, like eXpress, that can deal with indels and soft-clipped bases, you can achieve better results by leaving this option disabled." /> | |
| 387 </when> | 386 </when> |
| 388 <when value="TranscriptomeSAM GeneCounts"> | 387 <when value="TranscriptomeSAM GeneCounts"> |
| 389 <param argument="--quantTranscriptomeBan" type="boolean" truevalue="IndelSoftclipSingleend" falsevalue="Singleend" | 388 <param argument="--quantTranscriptomeBan" type="boolean" truevalue="IndelSoftclipSingleend" falsevalue="Singleend" label="Exclude alignments with indels or soft clipping from the transcriptome BAM output?" help="You will need to exclude alignments with indels and soft-clipped bases from the transcriptome BAM output for compatibility with certain transcript quantification tools, most notably RSEM. If you are using a tool, like eXpress, that can deal with indels and soft-clipped bases, you can achieve better results by leaving this option disabled."/> |
| 390 label="Exclude alignments with indels or soft clipping from the transcriptome BAM output?" | |
| 391 help="You will need to exclude alignments with indels and soft-clipped bases from the transcriptome BAM output for compatibility with certain transcript quantification tools, most notably RSEM. If you are using a tool, like eXpress, that can deal with indels and soft-clipped bases, you can achieve better results by leaving this option disabled." /> | |
| 392 </when> | 389 </when> |
| 393 </conditional> | 390 </conditional> |
| 394 </xml> | 391 </xml> |
| 395 <xml name="quantModeNoGTF"> | 392 <xml name="quantModeNoGTF"> |
| 396 <conditional name="quantmode_output"> | 393 <conditional name="quantmode_output"> |
| 397 <param argument="--quantMode" type="select" | 394 <param argument="--quantMode" type="select" label="Per gene/transcript output"> |
| 398 label="Per gene/transcript output"> | |
| 399 <option value="-">No per gene or transcript output as no GTF was provided</option> | 395 <option value="-">No per gene or transcript output as no GTF was provided</option> |
| 400 </param> | 396 </param> |
| 401 <when value="-" /> | 397 <when value="-"/> |
| 402 </conditional> | 398 </conditional> |
| 403 </xml> | 399 </xml> |
| 404 <xml name="outSAMmapqUnique"> | 400 <xml name="outSAMmapqUnique"> |
| 405 <!-- MAPQ 255 is the default in STAR (coming from tophat behaviour and compatibility for Cufflinks) but it is a problematic value | 401 <!-- MAPQ 255 is the default in STAR (coming from tophat behaviour and compatibility for Cufflinks) but it is a problematic value |
| 406 - according to SAM/BAM specs it means "undefined". | 402 - according to SAM/BAM specs it means "undefined". |
| 407 - Using 255 as the max mapq causes problem with modern downstream tools like mutect2: https://sites.duke.edu/workblog/2021/08/18/star-rnaseq-gatk-mutect2/ and 60 has become an inofficial replacement for 255. --> | 403 - Using 255 as the max mapq causes problem with modern downstream tools like mutect2: https://sites.duke.edu/workblog/2021/08/18/star-rnaseq-gatk-mutect2/ and 60 has become an inofficial replacement for 255. --> |
| 408 <param argument="--outSAMmapqUnique" type="integer" value="60" min="0" max="255" | 404 <param argument="--outSAMmapqUnique" type="integer" value="60" min="0" max="255" label="MAPQ value for unique mappers" help="STAR bases the mapping quality scores of alignment records in its BAM output on the number of alternative mappings for the read. If a read maps to multiple locations on the reference genome, the following MAPQ scoring scheme is used: >=5 mappings => MAPQ=0; 3-4 mappings => MAPQ=1; 2 mappings => MAPQ=3. This setting lets you control the MAPQ used for reads mapped to a single location. Set to 255 for compatibility with Cufflink (default in STAR) but keep to 60 for modern downstream tools like mutect2."/> |
| 409 label="MAPQ value for unique mappers" | 405 </xml> |
| 410 help="STAR bases the mapping quality scores of alignment records in its BAM output on the number of alternative mappings for the read. If a read maps to multiple locations on the reference genome, the following MAPQ scoring scheme is | 406 <xml name="wasp"> |
| 411 used: >=5 mappings => MAPQ=0; 3-4 mappings => MAPQ=1; 2 mappings => MAPQ=3. This setting lets you control the MAPQ used for reads mapped to a single location. Set to 255 for compatibility with Cufflink (default in STAR) but keep to 60 for modern downstream tools like mutect2." /> | 407 <!-- |
| 408 This is re-implementation of the original WASP algorithm by Bryce van de Geijn, Graham McVicker, | |
| 409 Yoav Gilad and Jonathan K Pritchard. Please cite the original WASP paper: Nature Methods 12, | |
| 410 1061–1063 (2015) https://www.nature.com/articles/nmeth.3582. WASP filtering is activated | |
| 411 with "waspOutputMode SAMtag". | |
| 412 --> | |
| 413 <conditional name="wasp_conditional"> | |
| 414 <param argument="--waspOutputMode" type="select" label="Actiavte WASP filtering"> | |
| 415 <help><![CDATA[This is a reimplementation of the original WASP algorithm by Bryce van de Geijn, Graham McVicker, | |
| 416 Yoav Gilad and Jonathan K Pritchard. https://doi.org/10.1038/nmeth.3582. This option will add the vW tag to the SAM output. vW:i:1 means | |
| 417 alignment passed WASP filtering, and all other values mean it did not:<br/> | |
| 418 - vW:i:2 = multi-mapping read<br/> | |
| 419 - vW:i:3 = variant base in the read is N (non-ACGT)<br/> | |
| 420 - vW:i:4 = remapped read did not map <br/> | |
| 421 - vW:i:5 = remapped read multi-maps <br/> | |
| 422 - vW:i:6 = remapped read maps to a different locus <br/> | |
| 423 - vW:i:7 = read overlaps too many variants <br/> | |
| 424 ]]> | |
| 425 </help> | |
| 426 <option value="" selected="true">No WASP filtering</option> | |
| 427 <option value="wasp_mode">Activate WASP filtering</option> | |
| 428 </param> | |
| 429 <when value="wasp_mode"> | |
| 430 <param argument="--varVCFfile" type="data" format="vcf" label="VCF file with personal variants" help="Each variant is expected to have a genotype with two alleles. The VCF file needs to have the 10th column with genotype recorded as 0/1, 1/0, 1/1 (or | instead of /)"/> | |
| 431 </when> | |
| 432 <when value=""/> | |
| 433 </conditional> | |
| 412 </xml> | 434 </xml> |
| 413 </macros> | 435 </macros> |
