# HG changeset patch # User proteore # Date 1524229643 14400 # Node ID c6ba1e6f686955126f67e085adeab232604f1357 # Parent 1e99111901424e224aacebb860a816858257b19e planemo upload commit 74b6a02a2e64d02551c05b52d571b888ac73cac9 diff -r 1e9911190142 -r c6ba1e6f6869 README.rst --- a/README.rst Wed Mar 14 10:24:54 2018 -0400 +++ b/README.rst Fri Apr 20 09:07:23 2018 -0400 @@ -13,7 +13,7 @@ ------------------------------------------------------- -This tool allows to filter out data according to your specific needs (e.g. contaminants, non-significant values or related to a particular annotation) from a proteomics results file (e.g. MaxQuant or Proline output). +This tool allows to remove unneeded data (e.g. contaminants, non-significant values) from a proteomics results file (e.g. MaxQuant or Proline output). **For each row, if there are more than one protein IDs/protein names/gene names, only the first one will be considered in the output** @@ -31,17 +31,17 @@ ALDOA_RABBIT -**The line that contains these keywords will be filtered from input file and provided in a separate file.** +**The line that contains these keywords will be eliminated from input file.** **Keywords search can be applied by performing either exact match or partial one by using the following option** -- If you choose **Yes**, only the fields that contains exactly the same content will be filtered. +- If you choose **Yes**, only the fields that contains exactly the same content will be removed. -- If you choose **No**, all the fields containing the keyword will be filtered. +- If you choose **No**, all the fields containing the keyword will be removed. For example: -**Yes** option (exact match) selected using the keyword "kinase": only lines which contain exactly "kinase" is filtered (and not "Kinase"). +**Yes** option (exact match) selected using the keyword "kinase": only lines which contain exactly "kinase" is removed. **No** option (partial match) for "kinase": not only lines which contain "kinase" but also lines with "alpha-kinase" (and so on) are removed. @@ -57,4 +57,4 @@ * A text file containing the resulting filtered input file. -* A text file containing the rows that have been filtered from the input file. +* A text file containing the rows removed from the input file. \ No newline at end of file diff -r 1e9911190142 -r c6ba1e6f6869 filter_kw_val.py --- a/filter_kw_val.py Wed Mar 14 10:24:54 2018 -0400 +++ b/filter_kw_val.py Fri Apr 20 09:07:23 2018 -0400 @@ -33,8 +33,8 @@ """ Check if a variable is a float or an integer """ - float_format = re.compile(r"^[-]?[1-9][0-9]*.?[0-9]+$") - int_format = re.compile(r"^[-]?[1-9][0-9]*$") + float_format = re.compile(r"^[-]?[0-9][0-9]*.?[0-9]+$") + int_format = re.compile(r"^[-]?[0-9][0-9]*$") test = "" if number_format == "int": test = re.match(int_format, n) diff -r 1e9911190142 -r c6ba1e6f6869 filter_kw_val.xml diff -r 1e9911190142 -r c6ba1e6f6869 test-data/FKW_Lacombe_et_al_2017_OK.txt diff -r 1e9911190142 -r c6ba1e6f6869 test-data/Lacombe_et_al_2017_OK.txt diff -r 1e9911190142 -r c6ba1e6f6869 test-data/Trash_FKW_Lacombe_et_al_2017_OK.txt