changeset 13:933fb21568ce draft

Uploaded
author davidvanzessen
date Fri, 11 Nov 2016 03:49:30 -0500
parents 6b66c1c57f22
children 59765d2c8890
files merge_and_filter.r shm_csr.xml
diffstat 2 files changed, 7 insertions(+), 5 deletions(-) [+]
line wrap: on
line diff
--- a/merge_and_filter.r	Thu Nov 10 08:36:18 2016 -0500
+++ b/merge_and_filter.r	Fri Nov 11 03:49:30 2016 -0500
@@ -187,11 +187,13 @@
 	stop("No data remaining after filter")
 }
 
+result$best_match_class = gsub(",.*", "", result$best_match) # drop the first comma and everything after it, so unmatched entries don't carry a class after the comma
+
 result$past = do.call(paste, c(result[unlist(strsplit(unique.type, ","))], sep = ":"))
 
 result = result[!(duplicated(result$past)), ]
 
-result = result[,!(names(result) %in% c("past"))]
+result = result[,!(names(result) %in% c("past", "best_match_class"))]
 
 print(paste("Number of sequences in result after", unique.type, "filtering:", nrow(result)))
 
--- a/shm_csr.xml	Thu Nov 10 08:36:18 2016 -0500
+++ b/shm_csr.xml	Fri Nov 11 03:49:30 2016 -0500
@@ -22,14 +22,14 @@
 			<option value="no">No</option>
 		</param>
 		<param name="unique" type="select" label="Remove duplicates based on" help="" >
-			<option value="VGene,AA.JUNCTION,best_match">Top.V.Gene, CDR3 (AA), C region</option>
+			<option value="VGene,AA.JUNCTION,best_match_class">Top.V.Gene, CDR3 (AA), C region</option>
 			<option value="VGene,AA.JUNCTION">Top.V.Gene, CDR3 (AA)</option>
-			<option value="AA.JUNCTION,best_match">CDR3 (AA), C region</option>
+			<option value="AA.JUNCTION,best_match_class">CDR3 (AA), C region</option>
 			<option value="AA.JUNCTION">CDR3 (AA)</option>
 			
-			<option value="VGene,CDR3.IMGT.seq,best_match">Top.V.Gene, CDR3.nt.Seq, C region</option>
+			<option value="VGene,CDR3.IMGT.seq,best_match_class">Top.V.Gene, CDR3.nt.Seq, C region</option>
 			<option value="VGene,CDR3.IMGT.seq">Top.V.Gene, CDR3 (nt)</option>
-			<option value="CDR3.IMGT.seq,best_match">CDR3 (nt), C region</option>
+			<option value="CDR3.IMGT.seq,best_match_class">CDR3 (nt), C region</option>
 			<option value="CDR3.IMGT.seq">CDR3 (nt)</option>
 			<option value="Sequence.ID" selected="true">Don't remove duplicates</option>
 		</param>