Mercurial > repos > iuc > snpsift_dbnsfp
changeset 1:13191d4914f7 draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tool_collections/snpsift/snpsift_dbnsfp commit 21b46ae2c90ba7e569b2b3a9eaf938f8dedb2c31
author | iuc |
---|---|
date | Tue, 07 Jun 2016 10:04:48 -0400 |
parents | dc480609d9c1 |
children | c838e7136a40 |
files | repository_dependencies.xml snpSift_dbnsfp.xml snpSift_macros.xml tool-data/snpsift_dbnsfps.loc.sample tool_data_table_conf.xml.sample tool_dependencies.xml |
diffstat | 6 files changed, 59 insertions(+), 42 deletions(-) [+] |
line wrap: on
line diff
--- a/repository_dependencies.xml Thu Jan 22 08:53:21 2015 -0500 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,4 +0,0 @@ -<?xml version="1.0"?> -<repositories description="This requires the SnpEff dbnsfp datatype definitions."> - <repository changeset_revision="0c4372b93e85" name="snpsift_dbnsfp_datatypes" owner="iuc" toolshed="https://toolshed.g2.bx.psu.edu" /> -</repositories>
--- a/snpSift_dbnsfp.xml Thu Jan 22 08:53:21 2015 -0500 +++ b/snpSift_dbnsfp.xml Tue Jun 07 10:04:48 2016 -0400 @@ -1,24 +1,27 @@ -<tool id="snpSift_dbnsfp" name="SnpSift dbNSFP" version="4.0.0"> - <description>Add Annotations from dbNSFP</description> - <expand macro="requirements" /> +<tool id="snpSift_dbnsfp" name="SnpSift dbNSFP" version="@WRAPPER_VERSION@.0"> + <description>Add Annotations from dbNSFP or similar annotation DBs</description> <macros> <import>snpSift_macros.xml</import> </macros> - <command> - java -Xmx6G -jar \$SNPEFF_JAR_PATH/SnpSift.jar dbnsfp -v - #if $db.dbsrc == 'cached' : - -db $db.dbnsfp - #if $db.annotations and $db.annotations.__str__ != '': + <expand macro="requirements" /> + <expand macro="stdio" /> + <expand macro="version_command" /> + <command><![CDATA[ + java -Xmx6G -jar "\$SNPEFF_JAR_PATH/SnpSift.jar" dbnsfp -v + #if $db.dbsrc == 'cached': + -db "$db.dbnsfp" + #if $db.annotations and str($db.annotations) != '': -f "$db.annotations" #end if - #else : + #else: -db "${db.dbnsfpdb.extra_files_path}/${db.dbnsfpdb.metadata.bgzip}" - #if $db.annotations and $db.annotations.__str__ != '': + #if $db.annotations and str($db.annotations) != '': -f "$db.annotations" #end if - #end if - $input > $output - 2> tmp.err && grep -v file tmp.err + #end if + "$input" > "$output" + 2> tmp.err && grep -v file tmp.err +]]> </command> <inputs> <param name="input" type="data" format="vcf" label="Variant input file in VCF format"/> @@ -29,17 +32,17 @@ </param> <when value="cached"> <param name="dbnsfp" type="select" label="Genome"> - <options from_data_table="snpsift_dbnsfp"> - <column name="name" index="1"/> - <column name="value" index="2"/> + <options from_data_table="snpsift_dbnsfps"> + <column name="name" index="2"/> + <column name="value" index="3"/> </options> </param> <param name="annotations" type="select" multiple="true" display="checkboxes" label="Annotate with"> - <options from_data_table="snpsift_dbnsfp"> - <column name="name" index="3"/> - 
<column name="value" index="3"/> - <filter type="param_value" ref="dbnsfp" column="2" /> - <filter type="multiple_splitter" column="3" separator=","/> + <options from_data_table="snpsift_dbnsfps"> + <column name="name" index="4"/> + <column name="value" index="4"/> + <filter type="param_value" ref="dbnsfp" column="3" /> + <filter type="multiple_splitter" column="4" separator=","/> </options> </param> </when> @@ -53,7 +56,6 @@ </when> </conditional> </inputs> - <expand macro="stdio" /> <outputs> <data format="vcf" name="output" /> </outputs> @@ -70,9 +72,10 @@ </output> </test> </tests> - <help> + <help><![CDATA[ The dbNSFP is an integrated database of functional predictions from multiple algorithms (SIFT, Polyphen2, LRT and MutationTaster, PhyloP and GERP++, etc.). +It contains variant annotations such as: 1000Gp1_AC @@ -124,7 +127,7 @@ ESP6500_EA_AF Alternative allele frequency in the European American samples of the NHLBI GO Exome Sequencing Project (ESP6500 data set) FATHMM_pred - If a FATHMM_score is <=-1.5 (or rankscore <=0.81415) the corresponding non-synonymous SNP is predicted as "D(AMAGING)"; otherwise it is predicted as "T(OLERATED)". Multiple predictions separated by ";" + If a FATHMM_score is <=-1.5 (or rankscore <=0.81415) the corresponding non-synonymous SNP is predicted as "D(AMAGING)"; otherwise it is predicted as "T(OLERATED)". Multiple predictions separated by ";" FATHMM_rankscore FATHMMori scores were ranked among all FATHMMori scores in dbNSFP. The rankscore is the ratio of the rank of the score over the total number of FATHMMori scores in dbNSFP. If there are multiple scores, only the most damaging (largest) rankscore is presented. The scores range from 0 to 1 FATHMM_score @@ -152,7 +155,7 @@ LRT_Omega Estimated nonsynonymous-to-synonymous-rate ratio (Omega, reported by LRT) LRT_converted_rankscore - LRTori scores were first converted as LRTnew=1-LRTori*0.5 if Omega<1, or LRTnew=LRTori*0.5 if Omega>=1. 
Then LRTnew scores were ranked among all LRTnew scores in dbNSFP. The rankscore is the ratio of the rank over the total number of the scores in dbNSFP. The scores range from 0.00166 to 0.85682 + LRTori scores were first converted as LRTnew=1-LRTori*0.5 if Omega<1, or LRTnew=LRTori*0.5 if Omega>=1. Then LRTnew scores were ranked among all LRTnew scores in dbNSFP. The rankscore is the ratio of the rank over the total number of the scores in dbNSFP. The scores range from 0.00166 to 0.85682 LRT_pred LRT prediction, D(eleterious), N(eutral) or U(nknown), which is not solely determined by the score LRT_score @@ -222,7 +225,7 @@ SIFT_converted_rankscore SIFTori scores were first converted to SIFTnew=1-SIFTori, then ranked among all SIFTnew scores in dbNSFP. The rankscore is the ratio of the rank the SIFTnew score over the total number of SIFTnew scores in dbNSFP. If there are multiple scores, only the most damaging (largest) rankscore is presented. The rankscores range from 0.02654 to 0.87932 SIFT_pred - If SIFTori is smaller than 0.05 (rankscore>0.55) the corresponding non-synonymous SNP is predicted as "D(amaging)"; otherwise it is predicted as "T(olerated)". Multiple predictions separated by ";" + If SIFTori is smaller than 0.05 (rankscore>0.55) the corresponding non-synonymous SNP is predicted as "D(amaging)"; otherwise it is predicted as "T(olerated)". Multiple predictions separated by ";" SIFT_score SIFT score (SIFTori). Scores range from 0 to 1. The smaller the score the more likely the SNP has damaging effect. Multiple scores separated by ";" SiPhy_29way_logOdds @@ -241,7 +244,11 @@ rs numbers from UniSNP, which is a cleaned version of dbSNP build 129, in format: rs number1;rs number2;... -The website for dbNSFP database is https://sites.google.com/site/jpopgen/dbNSFP and there is only annotation for human hg18 and hg19 genome builds. 
+The website for dbNSFP database is https://sites.google.com/site/jpopgen/dbNSFP and there is only annotation for human genome builds. + +The procedure for preparing the dbNSFP data for use in SnpSift dbnsfp is in the SnpSift documentation: +*( It also provides links for dbNSFP databases prebuilt for SnpSift )* +http://snpeff.sourceforge.net/SnpSift.html#dbNSFP However, any dbNSFP-like tabular file can be used with SnpSift dbnsfp if it has:: @@ -265,10 +272,9 @@ 4 100239319 T G H P ADH1B 0 -The uploaded tabular file should be set to datatype: "dbnsfp.tabular" -Using "Convert Format" the "dbnsfp.tabular" can be converted to the correct format for SnpSift dbnsfp. - -The procedure for preparing the dbNSFP data for use in SnpSift dbnsfp is in the SnpSift documentation. +The galaxy datatypes for dbNSFP can automatically convert the specially formatted tabular file for use by SnpSift dbNSFP: + 1. Upload the tabular file, set the datatype as: **"dbnsfp.tabular"** + 2. Edit the history dataset attributes (pencil icon): Use "Convert Format" to convert the **"dbnsfp.tabular"** to the correct format for SnpSift dbnsfp: **"snpsiftdbnsfp"**. @EXTERNAL_DOCUMENTATION@ @@ -276,6 +282,14 @@ @CITATION_SECTION@ - +]]> </help> + <expand macro="citations"> + <citation type="doi">DOI: 10.1002/humu.21517</citation> + <citation type="doi">DOI: 10.1002/humu.22376</citation> + <citation type="doi">DOI: 10.1002/humu.22932</citation> + <citation type="doi">doi: 10.1093/hmg/ddu733</citation> + <citation type="doi">doi: 10.1093/nar/gku1206</citation> + <citation type="doi">doi: 10.3389/fgene.2012.00035</citation> + </expand> </tool>
--- a/snpSift_macros.xml Thu Jan 22 08:53:21 2015 -0500 +++ b/snpSift_macros.xml Tue Jun 07 10:04:48 2016 -0400 @@ -1,7 +1,7 @@ <macros> <xml name="requirements"> <requirements> - <requirement type="package" version="4.0">snpEff</requirement> + <requirement type="package" version="4.1">snpEff</requirement> </requirements> </xml> <xml name="stdio"> @@ -10,6 +10,10 @@ <exit_code range="1:" level="fatal" description="Error" /> </stdio> </xml> + <xml name="version_command"> + <version_command>java -jar "$SNPEFF_JAR_PATH/snpEff.jar" -version</version_command> + </xml> + <token name="@WRAPPER_VERSION@">4.1</token> <token name="@EXTERNAL_DOCUMENTATION@"> For details about this tool, please go to:
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool-data/snpsift_dbnsfps.loc.sample Tue Jun 07 10:04:48 2016 -0400 @@ -0,0 +1,3 @@ +#key build description path annotations +#GRCh37_dbNSFP2.4 GRCh37 GRCh37 dbNSFP2.4 /depot/snpeff/dbNSFP2.4.txt.gz SIFT_pred,Uniprot_acc +#GRCh38_dbNSFP3.1c GRCh38 GRCh38 dbNSFP3.1c /depot/snpeff/dbNSFP3.1c.txt.gz SIFT_pred,Uniprot_acc
--- a/tool_data_table_conf.xml.sample Thu Jan 22 08:53:21 2015 -0500 +++ b/tool_data_table_conf.xml.sample Tue Jun 07 10:04:48 2016 -0400 @@ -1,7 +1,7 @@ <tables> - <table name="snpsift_dbnsfp" comment_char="#"> - <columns>dbkey, name, value, annotations</columns> - <file path="tool-data/snpsift_dbnsfp.loc" /> + <table name="snpsift_dbnsfps" comment_char="#"> + <columns>key, build, name, value, annotations</columns> + <file path="tool-data/snpsift_dbnsfps.loc" /> </table> </tables>
--- a/tool_dependencies.xml Thu Jan 22 08:53:21 2015 -0500 +++ b/tool_dependencies.xml Tue Jun 07 10:04:48 2016 -0400 @@ -1,6 +1,6 @@ <?xml version="1.0"?> <tool_dependency> - <package name="snpEff" version="4.0"> - <repository changeset_revision="6bc55957927b" name="package_snpeff_4_0" owner="iuc" toolshed="https://toolshed.g2.bx.psu.edu" /> + <package name="snpEff" version="4.1"> + <repository changeset_revision="374c7f8421fb" name="package_snpeff_4_1" owner="iuc" toolshed="https://toolshed.g2.bx.psu.edu" /> </package> </tool_dependency>