clonal_sequences_in_paired_samples: RScript.r comparison

comparison RScript.r @ 50:7dd7cefcf72d draft

Uploaded

author	davidvanzessen
date	Thu, 08 Oct 2015 10:07:28 -0400
parents	7658e9f3d416
children	17e677c72e49

comparison

equal deleted inserted replaced

-:7658e9f3d416
+:7dd7cefcf72d
 second.match.filter = merge.filter & sequence.filter & second.sample.filter
 first.rows = patient.fuzzy[first.match.filter,]
 second.rows = patient.fuzzy[second.match.filter,]
+first.rows.v = table(first.rows$V_Segment_Major_Gene)
+first.rows.v = names(first.rows.v[which.max(first.rows.v)])
+first.rows.j = table(first.rows$J_Segment_Major_Gene)
+first.rows.j = names(first.rows.j[which.max(first.rows.j)])
 first.sum = data.frame(merge = first.clone.sequence,
 Patient = patient,
 Receptor = first.rows[1,"Receptor"],
 Sample = first.rows[1,"Sample"],
 Cell_Count = first.rows[1,"Cell_Count"],
 Clone_Molecule_Count_From_Spikes = sum(first.rows$Clone_Molecule_Count_From_Spikes),
 Log10_Frequency = log10(sum(first.rows$Frequency)),
 Total_Read_Count = sum(first.rows$Total_Read_Count),
 dsPerM = sum(first.rows$dsPerM),
-J_Segment_Major_Gene = sort(table(first.rows$J_Segment_Major_Gene),decreasing=TRUE)[1],
+J_Segment_Major_Gene = first.rows.j,
-V_Segment_Major_Gene = sort(table(first.rows$V_Segment_Major_Gene),decreasing=TRUE)[1],
+V_Segment_Major_Gene = first.rows.v,
 Clone_Sequence = first.clone.sequence,
 CDR3_Sense_Sequence = first.rows[1,"CDR3_Sense_Sequence"],
 Related_to_leukemia_clone = F,
 Frequency = sum(first.rows$Frequency),
 locus_V = first.rows[1,"locus_V"],
 normalized_read_count = sum(first.rows$normalized_read_count),
 paste = first.rows[1,"paste"],
 min_cell_paste = first.rows[1,"min_cell_paste"])
 if(nrow(second.rows) > 0){
+second.rows.v = table(second.rows$V_Segment_Major_Gene)
+second.rows.v = names(second.rows.v[which.max(second.rows.v)])
+second.rows.j = table(second.rows$J_Segment_Major_Gene)
+second.rows.j = names(second.rows.j[which.max(second.rows.j)])
 second.sum = data.frame(merge = first.clone.sequence,
 Patient = patient,
 Receptor = second.rows[1,"Receptor"],
 Sample = second.rows[1,"Sample"],
 Cell_Count = second.rows[1,"Cell_Count"],
 Clone_Molecule_Count_From_Spikes = sum(second.rows$Clone_Molecule_Count_From_Spikes),
 Log10_Frequency = log10(sum(second.rows$Frequency)),
 Total_Read_Count = sum(second.rows$Total_Read_Count),
 dsPerM = sum(second.rows$dsPerM),
-J_Segment_Major_Gene = sort(table(second.rows$J_Segment_Major_Gene),decreasing=TRUE)[1],
+J_Segment_Major_Gene = second.rows.j,
-V_Segment_Major_Gene = sort(table(second.rows$V_Segment_Major_Gene),decreasing=TRUE)[1],
+V_Segment_Major_Gene = second.rows.v,
 Clone_Sequence = first.clone.sequence,
 CDR3_Sense_Sequence = second.rows[1,"CDR3_Sense_Sequence"],
 Related_to_leukemia_clone = F,
 Frequency = sum(second.rows$Frequency),
 locus_V = second.rows[1,"locus_V"],
 min_cell_paste = second.rows[1,"min_cell_paste"])
 patientMerge = rbind(patientMerge, merge(first.sum, second.sum, by="merge"))
 patient.fuzzy = patient.fuzzy[!(first.match.filter | second.match.filter),]
+hidden.clone.sequences = c(first.rows[-1,"Clone_Sequence"], second.rows[second.rows$Clone_Sequence != first.clone.sequence,"Clone_Sequence"])
+merge.list[["second"]] = append(merge.list[["second"]], hidden.clone.sequences)
 if(sum(first.match.filter) == 1 & sum(second.match.filter) == 1){
 second.clone.sequence = patient.fuzzy[second.match.filter, "Clone_Sequence"]
-if(nchar(first.clone.sequence) == nchar(second.clone.sequence)){
+if(first.clone.sequence != second.clone.sequence){
-merge.list[["second"]] = append(merge.list[["second"]], second.clone.sequence)
+#merge.list[["second"]] = append(merge.list[["second"]], second.clone.sequence)
 }
 }
 if(nrow(first.rows) > 1 | nrow(second.rows) > 1){

Mercurial > repos > davidvanzessen > clonal_sequences_in_paired_samples

comparison RScript.r @ 50:7dd7cefcf72d draft