Mercurial > repos > computational-metabolomics > mspurity_createdatabase
annotate dimsPredictPuritySingle.R @ 0:f52287a06c02 draft
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
| author | computational-metabolomics | 
|---|---|
| date | Wed, 27 Nov 2019 13:44:58 -0500 | 
| parents | |
| children | 2f71b3495221 | 
| rev | line source | 
|---|---|
| 0 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 1 library(msPurity) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 2 library(optparse) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 3 print(sessionInfo()) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 4 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 5 option_list <- list( | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 6 make_option(c("--mzML_file"), type="character"), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 7 make_option(c("--mzML_files"), type="character"), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 8 make_option(c("--mzML_filename"), type="character", default=''), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 9 make_option(c("--mzML_galaxy_names"), type="character", default=''), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 10 make_option(c("--peaks_file"), type="character"), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 11 make_option(c("-o", "--out_dir"), type="character"), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 12 make_option("--minoffset", default=0.5), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 13 make_option("--maxoffset", default=0.5), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 14 make_option("--ilim", default=0.05), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 15 make_option("--ppm", default=4), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 16 make_option("--dimspy", action="store_true"), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 17 make_option("--sim", action="store_true"), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 18 make_option("--remove_nas", action="store_true"), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 19 make_option("--iwNorm", default="none", type="character"), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 20 make_option("--file_num_dimspy", default=1), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 21 make_option("--exclude_isotopes", action="store_true"), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 22 make_option("--isotope_matrix", type="character") | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 23 ) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 24 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 25 # store options | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 26 opt<- parse_args(OptionParser(option_list=option_list)) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 27 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 28 print(sessionInfo()) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 29 print(opt) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 30 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 31 print(opt$mzML_files) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 32 print(opt$mzML_galaxy_names) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 33 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 34 str_to_vec <- function(x){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 35 print(x) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 36 x <- trimws(strsplit(x, ',')[[1]]) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 37 return(x[x != ""]) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 38 } | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 39 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 40 find_mzml_file <- function(mzML_files, galaxy_names, mzML_filename){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 41 mzML_filename <- trimws(mzML_filename) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 42 mzML_files <- str_to_vec(mzML_files) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 43 galaxy_names <- str_to_vec(galaxy_names) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 44 if (mzML_filename %in% galaxy_names){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 45 return(mzML_files[galaxy_names==mzML_filename]) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 46 }else{ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 47 stop(paste("mzML file not found - ", mzML_filename)) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 48 } | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 49 } | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 50 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 51 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 52 if (is.null(opt$dimspy)){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 53 df <- read.table(opt$peaks_file, header = TRUE, sep='\t') | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 54 if (file.exists(opt$mzML_file)){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 55 mzML_file <- opt$mzML_file | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 56 }else if (!is.null(opt$mzML_files)){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 57 mzML_file <- find_mzml_file(opt$mzML_files, opt$mzML_galaxy_names, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 58 opt$mzML_filename) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 59 }else{ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 60 mzML_file <- file.path(opt$mzML_file, filename) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 61 } | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 62 }else{ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 63 indf <- read.table(opt$peaks_file, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 64 header = TRUE, sep='\t', stringsAsFactors = FALSE) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 65 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 66 filename <- colnames(indf)[8:ncol(indf)][opt$file_num_dimspy] | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 67 print(filename) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 68 # check if the data file is mzML or RAW (can only use mzML currently) so | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 69 # we expect an mzML file of the same name in the same folder | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 70 indf$i <- indf[,colnames(indf)==filename] | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 71 indf[,colnames(indf)==filename] <- as.numeric(indf[,colnames(indf)==filename]) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 72 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 73 filename = sub("raw", "mzML", filename, ignore.case = TRUE) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 74 print(filename) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 75 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 76 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 77 if (file.exists(opt$mzML_file)){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 78 mzML_file <- opt$mzML_file | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 79 }else if (!is.null(opt$mzML_files)){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 80 mzML_file <- find_mzml_file(opt$mzML_files, opt$mzML_galaxy_names, filename) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 81 }else{ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 82 mzML_file <- file.path(opt$mzML_file, filename) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 83 } | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 84 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 85 # Update the dimspy output with the correct information | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 86 df <- indf[4:nrow(indf),] | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 87 if ('blank_flag' %in% colnames(df)){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 88 df <- df[df$blank_flag==1,] | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 89 } | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 90 colnames(df)[colnames(df)=='m.z'] <- 'mz' | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 91 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 92 if ('nan' %in% df$mz){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 93 df[df$mz=='nan',]$mz <- NA | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 94 } | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 95 df$mz <- as.numeric(df$mz) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 96 } | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 97 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 98 if (!is.null(opt$remove_nas)){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 99 df <- df[!is.na(df$mz),] | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 100 } | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 101 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 102 if (is.null(opt$isotope_matrix)){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 103 im <- NULL | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 104 }else{ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 105 im <- read.table(opt$isotope_matrix, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 106 header = TRUE, sep='\t', stringsAsFactors = FALSE) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 107 } | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 108 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 109 if (is.null(opt$exclude_isotopes)){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 110 isotopes <- FALSE | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 111 }else{ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 112 isotopes <- TRUE | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 113 } | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 114 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 115 if (is.null(opt$sim)){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 116 sim=FALSE | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 117 }else{ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 118 sim=TRUE | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 119 } | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 120 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 121 minOffset = as.numeric(opt$minoffset) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 122 maxOffset = as.numeric(opt$maxoffset) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 123 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 124 if (opt$iwNorm=='none'){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 125 iwNorm = FALSE | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 126 iwNormFun = NULL | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 127 }else if (opt$iwNorm=='gauss'){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 128 iwNorm = TRUE | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 129 iwNormFun = msPurity::iwNormGauss(minOff=-minOffset, maxOff=maxOffset) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 130 }else if (opt$iwNorm=='rcosine'){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 131 iwNorm = TRUE | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 132 iwNormFun = msPurity::iwNormRcosine(minOff=-minOffset, maxOff=maxOffset) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 133 }else if (opt$iwNorm=='QE5'){ | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 134 iwNorm = TRUE | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 135 iwNormFun = msPurity::iwNormQE.5() | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 136 } | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 137 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 138 print('FIRST ROWS OF PEAK FILE') | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 139 print(head(df)) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 140 print(mzML_file) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 141 predicted <- msPurity::dimsPredictPuritySingle(df$mz, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 142 filepth=mzML_file, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 143 minOffset=minOffset, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 144 maxOffset=maxOffset, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 145 ppm=opt$ppm, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 146 mzML=TRUE, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 147 sim = sim, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 148 ilim = opt$ilim, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 149 isotopes = isotopes, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 150 im = im, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 151 iwNorm = iwNorm, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 152 iwNormFun = iwNormFun | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 153 ) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 154 predicted <- cbind(df, predicted) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 155 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 156 print(head(predicted)) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 157 print(file.path(opt$out_dir, 'dimsPredictPuritySingle_output.tsv')) | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 158 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 159 write.table(predicted, | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 160 file.path(opt$out_dir, 'dimsPredictPuritySingle_output.tsv'), | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 161 row.names=FALSE, sep='\t') | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 162 | 
| 
f52287a06c02
"planemo upload for repository https://github.com/computational-metabolomics/mspurity-galaxy commit cb903cd93f9378cfb5eeb68512a54178dcea7bbc-dirty"
 computational-metabolomics parents: diff
changeset | 163 | 
