Mercurial > repos > davidvanzessen > shm_csr
comparison merge_and_filter.r @ 13:933fb21568ce draft
Uploaded
author | davidvanzessen |
---|---|
date | Fri, 11 Nov 2016 03:49:30 -0500 |
parents | 6b66c1c57f22 |
children | 59765d2c8890 |
comparison
equal
deleted
inserted
replaced
12:6b66c1c57f22 | 13:933fb21568ce |
---|---|
185 | 185 |
186 if(nrow(summ) == 0){ | 186 if(nrow(summ) == 0){ |
187 stop("No data remaining after filter") | 187 stop("No data remaining after filter") |
188 } | 188 } |
189 | 189 |
| | 190 result$best_match_class = gsub(",.*", "", result$best_match) #gsub so the unmatched don't have a class after it |
| | 191 |
190 result$past = do.call(paste, c(result[unlist(strsplit(unique.type, ","))], sep = ":")) | 192 result$past = do.call(paste, c(result[unlist(strsplit(unique.type, ","))], sep = ":")) |
191 | 193 |
192 result = result[!(duplicated(result$past)), ] | 194 result = result[!(duplicated(result$past)), ] |
193 | 195 |
194 result = result[,!(names(result) %in% c("past"))] | 196 result = result[,!(names(result) %in% c("past", "best_match_class"))] |
195 | 197 |
196 print(paste("Number of sequences in result after", unique.type, "filtering:", nrow(result))) | 198 print(paste("Number of sequences in result after", unique.type, "filtering:", nrow(result))) |
197 | 199 |
198 filtering.steps = rbind(filtering.steps, c("After remove duplicates based on filter", nrow(result))) | 200 filtering.steps = rbind(filtering.steps, c("After remove duplicates based on filter", nrow(result))) |
199 | 201 |