Mercurial > repos > davidvanzessen > mutation_analysis
comparison mutation_analysis.r @ 3:a0b27058dcac draft
Uploaded
| author | davidvanzessen |
|---|---|
| date | Wed, 17 Sep 2014 07:25:17 -0400 |
| parents | 2f4298673519 |
| children | 069419cccba4 |
comparison
Legend: equal, deleted, inserted, replaced
| 2:2f4298673519 | 3:a0b27058dcac |
|---|---|
| 7 | 7 |
| 8 #dat = read.table("NWK276_MID6_25NT/8_V-REGION-nt-mutation-statistics_NWK276_MID6_25NT_051113.txt", header=T, sep="\t", fill=T, stringsAsFactors=F) | 8 #dat = read.table("NWK276_MID6_25NT/8_V-REGION-nt-mutation-statistics_NWK276_MID6_25NT_051113.txt", header=T, sep="\t", fill=T, stringsAsFactors=F) |
| 9 dat = read.table(input, header=T, sep="\t", fill=T, stringsAsFactors=F) | 9 dat = read.table(input, header=T, sep="\t", fill=T, stringsAsFactors=F) |
| 10 | 10 |
| 11 datSum = read.table(summaryinput, header=T, sep="\t", fill=T, stringsAsFactors=F) | 11 datSum = read.table(summaryinput, header=T, sep="\t", fill=T, stringsAsFactors=F) |
| 12 datSum = datSum[,c("Sequence.ID", "AA.JUNCTION")] | 12 datSum = datSum[,c("Sequence.ID","J.GENE.and.allele", "AA.JUNCTION")] |
| 13 | 13 |
| 14 dat = merge(dat, datSum, by="Sequence.ID", all.x=T) | 14 dat = merge(dat, datSum, by="Sequence.ID", all.x=T) |
| 15 | |
| 16 #dat = dat[dat$Functionality == "productive",] | |
| 17 | |
| 18 dat$VGene = gsub("^Homsap ", "", dat$V.GENE.and.allele) | |
| 19 dat$VGene = gsub("[*].*", "", dat$VGene) | |
| 20 | |
| 21 dat$past = paste(dat$AA.JUNCTION, dat$VGene) | |
| 22 | |
| 23 #dat = dat[!duplicated(dat$past), ] | |
| 24 | 15 |
| 25 if(length(dat$Sequence.ID) == 0){ | 16 if(length(dat$Sequence.ID) == 0){ |
| 26 setwd(outputdir) | 17 setwd(outputdir) |
| 27 result = data.frame(x = rep(0, 5), y = rep(0, 5), z = rep(NA, 5)) | 18 result = data.frame(x = rep(0, 5), y = rep(0, 5), z = rep(NA, 5)) |
| 28 row.names(result) = c("Number of Mutations (%)", "Transition (%)", "Transversions (%)", "Transitions at G C (%)", "Targeting of C G (%)") | 19 row.names(result) = c("Number of Mutations (%)", "Transition (%)", "Transversions (%)", "Transitions at G C (%)", "Targeting of C G (%)") |
| 118 #dat[dat[,col] == "",] = "0" | 109 #dat[dat[,col] == "",] = "0" |
| 119 dat[,col] = as.numeric(dat[,col]) | 110 dat[,col] = as.numeric(dat[,col]) |
| 120 dat[is.na(dat[,col]),] = 0 | 111 dat[is.na(dat[,col]),] = 0 |
| 121 } | 112 } |
| 122 | 113 |
| 114 dat$VGene = gsub("^Homsap ", "", dat$V.GENE.and.allele) | |
| 115 dat$VGene = gsub("[*].*", "", dat$VGene) | |
| 116 dat$JGene = gsub("^Homsap ", "", dat$J.GENE.and.allele) | |
| 117 dat$JGene = gsub("[*].*", "", dat$JGene) | |
| 118 | |
| 119 dat$past = paste(dat$AA.JUNCTION, dat$VGene, dat$JGene, (dat$FR1.IMGT.Nb.of.mutations + dat$CDR1.IMGT.Nb.of.mutations + dat$FR2.IMGT.Nb.of.mutations + dat$CDR2.IMGT.Nb.of.mutations + dat$FR3.IMGT.Nb.of.mutations)) | |
| 120 | |
| 121 dat = dat[!duplicated(dat$past), ] | |
| 122 | |
| 123 VRegionMutations = sum(dat$FR1.IMGT.Nb.of.mutations + | 123 VRegionMutations = sum(dat$FR1.IMGT.Nb.of.mutations + |
| 124 dat$CDR1.IMGT.Nb.of.mutations + | 124 dat$CDR1.IMGT.Nb.of.mutations + |
| 125 dat$FR2.IMGT.Nb.of.mutations + | 125 dat$FR2.IMGT.Nb.of.mutations + |
| 126 dat$CDR2.IMGT.Nb.of.mutations + | 126 dat$CDR2.IMGT.Nb.of.mutations + |
| 127 dat$FR3.IMGT.Nb.of.mutations) | 127 dat$FR3.IMGT.Nb.of.mutations) |
