12
|
1 <tool id="cnvsim" name="Simulate CNV" version="0.9.2">
|
8
|
2 <description>in NGS short reads </description>
|
|
3 <command interpreter="python" detect_errors="exit_code">
|
|
4 #if $type.simulation_type=="whole_genome"
|
12
|
5 cnv-sim.py -n $number_of_reads -l $read_length -g $regions_count -a $amplifications_percentage -d $deletions_percentage -cn_min $minimum_copy_number -cn_max $maximum_copy_number -r_min $minimum_region_length -r_max $maximum_region_length genome $reference
|
8
|
6 #else
|
12
|
7 cnv-sim.py -n $number_of_reads -l $read_length -g $regions_count -a $amplifications_percentage -d $deletions_percentage -cn_min $minimum_copy_number -cn_max $maximum_copy_number -r_min $minimum_region_length -r_max $maximum_region_length exome $reference $target
|
8
|
8 #end if
|
|
9 </command>
|
|
10 <inputs>
|
|
11 <conditional name="type">
|
|
12 <param name="simulation_type" type="select" label="Simulation Type">
|
12
|
13 <option value="whole_genome">CNV Simulation in Whole Genome Sequencing</option>
|
|
14 <option value="targeted_exome">CNV Simulation in Targeted Exome Sequencing</option>
|
8
|
15 </param>
|
|
16 <when value="whole_genome">
|
|
17 <param format="fasta" name="reference" type="data" label="Reference Genome" help="Reference genome to generate reads from"/>
|
|
18 </when>
|
12
|
19 <when value="targeted_exome">
|
8
|
20 <param format="fasta" name="reference" type="data" label="Reference Genome" help="Reference genome to generate reads from"/>
|
|
21 <param format="bed" name="target" type="data" label="Target Regions" help="a list of exonic regions"/>
|
|
22 </when>
|
|
23 </conditional>
|
|
24 <param name="number_of_reads" type="integer" value="100000" label="Number of Reads" help="determines the number of reads to be generated for the control and simulated CNV (approximately)"/>
|
|
25 <param name="read_length" type="integer" value="100" label="Read Length (bp)" help="determines the read length fot the generated FASTQ files"/>
|
|
26
|
|
27 <param name="regions_count" type="integer" value="30" label="Regions Count" help="determines how many randomly-generated regions will show CNVs"/>
|
12
|
28 <param name="minimum_region_length" type="integer" value="1000" label="Minimum Region Length" help="Minimum length of each CNV region"/>
|
|
29 <param name="maximum_region_length" type="integer" value="100000" label="Maximum Region Length" help="Minimum length of each CNV region"/>
|
|
30 <param name="amplifications_percentage" type="float" value="0.5" label="Percentage of amplifications" help="determines what fraction of the regions will show amplifications (range: 0.0-1.0)"/>
|
|
31 <param name="deletions_percentage" type="float" value="0.5" label="Percentage of deletions" help="determines what fraction of the regions will show deletions (range: 0.0-1.0)"/>
|
|
32 <param name="minimum_copy_number" type="integer" value="3" label="Variation minimum" help="determines the minumum number of amplifications/deletions introduced in each region"/>
|
|
33 <param name="maximum_copy_number" type="integer" value="10" label="Variation maximum" help="determines the maximum number of amplifications/deletions introduced in each region"/>
|
8
|
34
|
|
35 </inputs>
|
|
36 <outputs>
|
12
|
37 <data format="bed" name="cnv_list" from_work_dir="simulation_output/copynumber.bed" label="CNV List from ${tool.name} on ${on_string}"/>
|
|
38 <data format="fastq" name="control_1" from_work_dir="simulation_output/control_1.fastq" label="Control reads 1 from ${tool.name} on ${on_string}"/>
|
|
39 <data format="fastq" name="control_2" from_work_dir="simulation_output/control_2.fastq" label="Control reads 2 from ${tool.name} on ${on_string}"/>
|
|
40 <data format="fastq" name="cnv_1" from_work_dir="simulation_output/cnv_1.fastq" label="CNV reads 1 from ${tool.name} on ${on_string}"/>
|
|
41 <data format="fastq" name="cnv_2" from_work_dir="simulation_output/cnv_2.fastq" label="CNV reads 2 from ${tool.name} on ${on_string}"/>
|
8
|
42 </outputs>
|
|
43 <help><![CDATA[
|
|
44 .. class:: infomark
|
|
45 '''TIP''' This tool requires *fasta* format.
|
|
46 ----
|
|
47 **CNV Simulator**
|
12
|
48 In genomics, Copy Number Variations (CNVs) is a type of structural variation in a genome where sections of the genome are duplicated or deleted. The number of variations (duplications/deletions) varies between individuals in the human population.
|
8
|
49
|
12
|
50 The Copy Number Variation Simulator (CNV-Sim) is a simulation tool that extends the functionality of existing next-generation sequencing read simulators to introduce copy number variations in the generated reads. The resulting reads encompass amplifications as well as deletions according to a predefined list of variant regions.
|
|
51
|
|
52 CNV-Sim aids testing and benchmarking tools for copy number variation detection and analysis. The tool offers two types of simulation:
|
8
|
53
|
|
54 CNV-Sim offers two types of simulation:
|
12
|
55 1. CNV simulation in whole genome. CNV-Sim utilizes the functionality of ART to introduce variations in the genome.
|
|
56 2. CNV simulation in targeted exome. CNV-Sim utilizes the functionality of Wessim to introduce variations in the targets.
|
8
|
57
|
|
58 Homepage: http://nabavilab.github.io/CNV-Sim/
|
|
59 ]]></help>
|
|
60 </tool> |