Mercurial > repos > davidvanzessen > mutation_analysis
comparison mutation_analysis.r @ 3:a0b27058dcac draft
Uploaded
author | davidvanzessen |
---|---|
date | Wed, 17 Sep 2014 07:25:17 -0400 |
parents | 2f4298673519 |
children | 069419cccba4 |
comparison
equal
deleted
inserted
replaced
2:2f4298673519 | 3:a0b27058dcac |
---|---|
7 | 7 |
8 #dat = read.table("NWK276_MID6_25NT/8_V-REGION-nt-mutation-statistics_NWK276_MID6_25NT_051113.txt", header=T, sep="\t", fill=T, stringsAsFactors=F) | 8 #dat = read.table("NWK276_MID6_25NT/8_V-REGION-nt-mutation-statistics_NWK276_MID6_25NT_051113.txt", header=T, sep="\t", fill=T, stringsAsFactors=F) |
9 dat = read.table(input, header=T, sep="\t", fill=T, stringsAsFactors=F) | 9 dat = read.table(input, header=T, sep="\t", fill=T, stringsAsFactors=F) |
10 | 10 |
11 datSum = read.table(summaryinput, header=T, sep="\t", fill=T, stringsAsFactors=F) | 11 datSum = read.table(summaryinput, header=T, sep="\t", fill=T, stringsAsFactors=F) |
12 datSum = datSum[,c("Sequence.ID", "AA.JUNCTION")] | 12 datSum = datSum[,c("Sequence.ID","J.GENE.and.allele", "AA.JUNCTION")] |
13 | 13 |
14 dat = merge(dat, datSum, by="Sequence.ID", all.x=T) | 14 dat = merge(dat, datSum, by="Sequence.ID", all.x=T) |
15 | |
16 #dat = dat[dat$Functionality == "productive",] | |
17 | |
18 dat$VGene = gsub("^Homsap ", "", dat$V.GENE.and.allele) | |
19 dat$VGene = gsub("[*].*", "", dat$VGene) | |
20 | |
21 dat$past = paste(dat$AA.JUNCTION, dat$VGene) | |
22 | |
23 #dat = dat[!duplicated(dat$past), ] | |
24 | 15 |
25 if(length(dat$Sequence.ID) == 0){ | 16 if(length(dat$Sequence.ID) == 0){ |
26 setwd(outputdir) | 17 setwd(outputdir) |
27 result = data.frame(x = rep(0, 5), y = rep(0, 5), z = rep(NA, 5)) | 18 result = data.frame(x = rep(0, 5), y = rep(0, 5), z = rep(NA, 5)) |
28 row.names(result) = c("Number of Mutations (%)", "Transition (%)", "Transversions (%)", "Transitions at G C (%)", "Targeting of C G (%)") | 19 row.names(result) = c("Number of Mutations (%)", "Transition (%)", "Transversions (%)", "Transitions at G C (%)", "Targeting of C G (%)") |
118 #dat[dat[,col] == "",] = "0" | 109 #dat[dat[,col] == "",] = "0" |
119 dat[,col] = as.numeric(dat[,col]) | 110 dat[,col] = as.numeric(dat[,col]) |
120 dat[is.na(dat[,col]),] = 0 | 111 dat[is.na(dat[,col]),] = 0 |
121 } | 112 } |
122 | 113 |
114 dat$VGene = gsub("^Homsap ", "", dat$V.GENE.and.allele) | |
115 dat$VGene = gsub("[*].*", "", dat$VGene) | |
116 dat$JGene = gsub("^Homsap ", "", dat$J.GENE.and.allele) | |
117 dat$JGene = gsub("[*].*", "", dat$JGene) | |
118 | |
119 dat$past = paste(dat$AA.JUNCTION, dat$VGene, dat$JGene, (dat$FR1.IMGT.Nb.of.mutations + dat$CDR1.IMGT.Nb.of.mutations + dat$FR2.IMGT.Nb.of.mutations + dat$CDR2.IMGT.Nb.of.mutations + dat$FR3.IMGT.Nb.of.mutations)) | |
120 | |
121 dat = dat[!duplicated(dat$past), ] | |
122 | |
123 VRegionMutations = sum(dat$FR1.IMGT.Nb.of.mutations + | 123 VRegionMutations = sum(dat$FR1.IMGT.Nb.of.mutations + |
124 dat$CDR1.IMGT.Nb.of.mutations + | 124 dat$CDR1.IMGT.Nb.of.mutations + |
125 dat$FR2.IMGT.Nb.of.mutations + | 125 dat$FR2.IMGT.Nb.of.mutations + |
126 dat$CDR2.IMGT.Nb.of.mutations + | 126 dat$CDR2.IMGT.Nb.of.mutations + |
127 dat$FR3.IMGT.Nb.of.mutations) | 127 dat$FR3.IMGT.Nb.of.mutations) |