annotate rrBLUP.R @ 103:e7115e44d8d8 draft default tip

Uploaded
author nicolas
date Mon, 31 Oct 2016 07:20:49 -0400
parents 2f423d8656ae
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
87
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
1
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
2 ########################################################
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
3 #
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
4 # creation date : 05/01/16
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
5 # last modification : 25/10/16
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
6 # author : Dr Nicolas Beaume
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
7 #
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
8 ########################################################
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
9
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
10
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
11 library(rrBLUP)
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
12 ############################ helper functions #######################
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
13
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
14
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
15 ################################## main function ###########################
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
16 # do rrBLUP evaluation of classification.
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
17 # optimization of parameters is included in rrBLUP package
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
# Fit a model with mixed.solve() and save the result to "<outFile>.rds".
#
# Arguments:
#   genotype   : two-dimensional table (matrix or data.frame) passed to
#                mixed.solve() as Z; its rows are the observations selected
#                by `folds`.
#   phenotype  : vector of responses, indexed in parallel with the rows of
#                `genotype`.
#   outFile    : output path without extension; ".rds" is appended.
#   evaluation : if TRUE, run cross-validation over `folds` and save the
#                list of per-fold predictions; if FALSE, fit a single model
#                on all the data and save the model object.
#   folds      : list of row-index vectors, one per fold, giving the rows
#                held out as test set. Only read when `evaluation` is TRUE.
#
# Returns the (invisible) value of saveRDS(); called for its side effect.
rrBLUP <- function(genotype, phenotype, outFile, evaluation = FALSE, folds) {
  outPath <- paste0(outFile, ".rds")
  if (evaluation) {
    # Evaluation mode: one prediction vector per fold, preallocated.
    # seq_along() makes an empty `folds` yield an empty result rather than
    # iterating over 1:0.
    prediction <- vector("list", length(folds))
    for (i in seq_along(folds)) {
      testIdx <- folds[[i]]
      # drop = FALSE keeps the 2-D shape, so single-row folds and
      # single-column tables still multiply correctly below.
      train <- genotype[-testIdx, , drop = FALSE]
      test <- genotype[testIdx, , drop = FALSE]
      phenoTrain <- phenotype[-testIdx]
      # create model on the training part
      model <- mixed.solve(phenoTrain, Z = train, K = NULL,
                           SE = FALSE, return.Hinv = FALSE)
      # predict current test set: Z_test %*% u + beta
      pred <- as.matrix(test) %*% as.matrix(model$u)
      prediction[[i]] <- pred[, 1] + model$beta
    }
    # save results
    saveRDS(prediction, file = outPath)
  } else {
    # Model mode: fit on everything and save the model itself.
    model <- mixed.solve(phenotype, Z = genotype, K = NULL,
                         SE = FALSE, return.Hinv = FALSE)
    saveRDS(model, file = outPath)
  }
}
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
45
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
46
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
47 ############################ main #############################
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
48 # get argument from xml file
2f423d8656ae Uploaded
nicolas
parents:
diff changeset
# Script entry point.
# The first command-line argument is the path of an R file that is source()d
# here; the code below reads the variables `evaluation`, `genotype`,
# `phenotype`, `out` and (in evaluation mode) `folds`, which are therefore
# expected to be defined by that file.
cmd <- commandArgs(trailingOnly = TRUE)
if (length(cmd) < 1L) {
  stop("missing argument: path of the R configuration file to source",
       call. = FALSE)
}
source(cmd[1])

# Evaluation mode: normalise `evaluation` to a logical and load the folds.
# `folds` names a file whose first line is the path of the RDS file that
# holds the folds. readLines() on a path opens and closes the connection
# itself, so nothing is left open if reading fails.
if (as.integer(evaluation) == 1) {
  evaluation <- TRUE
  folds <- readRDS(readLines(folds, n = 1, ok = TRUE))
} else {
  evaluation <- FALSE
}

# Load genotype and phenotype.
# `genotype` names a file whose first line is the path of the tab-separated
# table; `phenotype` is read directly and only its first column is kept.
genotype <- read.table(readLines(genotype, n = 1, ok = TRUE),
                       sep = "\t", header = TRUE)
phenotype <- read.table(phenotype, sep = "\t", header = TRUE)[, 1]

# run !
rrBLUP(genotype = genotype, phenotype = phenotype, outFile = out,
       evaluation = evaluation, folds = folds)

# return path of the result to galaxy
cat(paste0(out, ".rds", "\n"))