annotate mutation_analysis.r @ 0:74d2bc479bee draft

Uploaded
author davidvanzessen
date Mon, 18 Aug 2014 04:04:37 -0400
parents
children 2f4298673519
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
# Command-line interface (positional arguments):
#   1. input        - tab-separated table of per-sequence mutation statistics
#   2. summaryinput - tab-separated summary table (Sequence.ID, AA.JUNCTION, ...)
#   3. outputdir    - directory that receives the generated output files
args <- commandArgs(trailingOnly = TRUE)

# Fail early with a readable message; otherwise a missing argument only shows
# up later as an obscure error from setwd() or read.table().
if (length(args) < 3) {
  stop("Usage: Rscript mutation_analysis.r <input> <summaryinput> <outputdir>",
       call. = FALSE)
}

input <- args[1]
summaryinput <- args[2]
outputdir <- args[3]

# NOTE(review): the working directory changes before the input files are read,
# so relative input paths are resolved against outputdir - confirm that callers
# always pass absolute paths.
setwd(outputdir)
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
7
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
#dat = read.table("NWK276_MID6_25NT/8_V-REGION-nt-mutation-statistics_NWK276_MID6_25NT_051113.txt", header=T, sep="\t", fill=T, stringsAsFactors=F)
# Per-sequence mutation statistics, one row per Sequence.ID.
dat <- read.table(
  input,
  header = TRUE,
  sep = "\t",
  fill = TRUE,
  stringsAsFactors = FALSE
)

# Only the junction column of the summary table is needed, keyed by sequence.
datSum <- read.table(
  summaryinput,
  header = TRUE,
  sep = "\t",
  fill = TRUE,
  stringsAsFactors = FALSE
)[, c("Sequence.ID", "AA.JUNCTION")]

# Left join: every statistics row is kept, with AA.JUNCTION attached where the
# summary table has a matching Sequence.ID.
dat <- merge(x = dat, y = datSum, by = "Sequence.ID", all.x = TRUE)

#dat = dat[dat$Functionality == "productive",]

# Gene name without the leading "Homsap " and without the "*allele" suffix.
dat$VGene <- gsub("[*].*", "", gsub("^Homsap ", "", dat$V.GENE.and.allele))

# Combined junction + V gene label (used by the disabled de-duplication below).
dat$past <- paste(dat$AA.JUNCTION, dat$VGene)
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
22
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
23 #dat = dat[!duplicated(dat$past), ]
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
24
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
# No sequences to analyse: write placeholder versions of the three output
# files (mutations.txt, transitions.txt, n.txt) and abort with an error.
if (length(dat$Sequence.ID) == 0) {
  # The working directory was already set to outputdir at the start of the
  # script. Calling setwd(outputdir) again here would fail for a relative
  # outputdir, because the path would then be looked up inside itself.
  result <- data.frame(x = rep(0, 5), y = rep(0, 5), z = rep(NA, 5))
  row.names(result) <- c("Number of Mutations (%)", "Transition (%)", "Transversions (%)", "Transitions at G C (%)", "Targeting of C G (%)")
  write.table(x = result, file = "mutations.txt", sep = ",", quote = FALSE, row.names = TRUE, col.names = FALSE)

  # 4x4 substitution table filled with zeros; the diagonal (a base "mutating"
  # into itself) is not applicable and therefore NA.
  transitionTable <- data.frame(A = rep(0, 4), C = rep(0, 4), G = rep(0, 4), T = rep(0, 4))
  row.names(transitionTable) <- c("A", "C", "G", "T")
  for (base in c("A", "C", "G", "T")) {
    transitionTable[base, base] <- NA
  }
  write.table(x = transitionTable, file = "transitions.txt", sep = ",", quote = FALSE, row.names = TRUE, col.names = NA)

  cat("0", file = "n.txt")
  stop("No data")
}
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
40
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
41 #print(paste("After filtering on 'productive' and deduplicating based on V and AA JUNCTION there are", length(dat$Sequence.ID), "sequences left"))
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
42
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
# Skeleton of the summary table: one row per statistic, with columns
# x (numerator), y (denominator) and z (percentage). The 1:5 values are
# placeholders that are overwritten further down.
result <- data.frame(
  x = 1:5,
  y = 1:5,
  z = 1:5,
  row.names = c(
    "Number of Mutations (%)",
    "Transition (%)",
    "Transversions (%)",
    "Transitions at G C (%)",
    "Targeting of C G (%)"
  )
)
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
45
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
# Names of the count columns that must be numeric before they can be summed:
# for each V-region segment the number of mutations, the number of
# nucleotides, and one column per nucleotide substitution (e.g. "FR1.IMGT.a.c").
# The names are generated rather than listed by hand so that no column can be
# forgotten; the earlier hand-written list lacked "FR1.IMGT.a.c", which is
# summed further down in this script.
imgt_regions <- c("FR1", "CDR1", "FR2", "CDR2", "FR3")
imgt_bases <- c("a", "c", "g", "t")
base_pairs <- expand.grid(from = imgt_bases, to = imgt_bases, stringsAsFactors = FALSE)
base_pairs <- base_pairs[base_pairs$from != base_pairs$to, ]
count_suffixes <- c(
  "Nb.of.mutations",
  "Nb.of.nucleotides",
  paste(base_pairs$from, base_pairs$to, sep = ".")
)
cleanup_columns <- as.vector(outer(paste0(imgt_regions, ".IMGT."), count_suffixes, paste0))

for (col in cleanup_columns) {
  # Strip any parenthesised part of the value, keeping what precedes it.
  dat[, col] <- gsub("\\(.*\\)", "", dat[, col])
  #dat[dat[,col] == "",] = "0"
  # Anything that is not a number (for example an empty string) becomes NA.
  dat[, col] <- as.numeric(dat[, col])
  # Treat a missing count as zero - in this column only. Indexing with an
  # empty column position would overwrite the whole row, wiping Sequence.ID
  # and the valid counts of every other column for that sequence.
  dat[is.na(dat[, col]), col] <- 0
}
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
122
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
# Segments of the V region for which per-segment count columns are summed.
v_regions <- c("FR1", "CDR1", "FR2", "CDR2", "FR3")

# Grand total, over all sequences and all V-region segments, of the columns
# named "<segment>.IMGT.<suffix>" for every suffix given. The columns are added
# element-wise first and then summed, so a single NA makes the total NA.
sum_region_counts <- function(suffixes) {
  cols <- as.vector(outer(paste0(v_regions, ".IMGT."), suffixes, paste0))
  sum(Reduce(`+`, dat[cols]))
}

# Stores numerator (x), denominator (y) and the percentage x / y rounded to
# one decimal (z) in the given row of the summary table.
fill_result_row <- function(tbl, row, numerator, denominator) {
  tbl[row, "x"] <- numerator
  tbl[row, "y"] <- denominator
  tbl[row, "z"] <- round(tbl[row, "x"] / tbl[row, "y"] * 100, digits = 1)
  tbl
}

# Row 1: mutations per nucleotide over the whole V region.
VRegionMutations <- sum_region_counts("Nb.of.mutations")
VRegionNucleotides <- sum_region_counts("Nb.of.nucleotides")
result <- fill_result_row(result, 1, VRegionMutations, VRegionNucleotides)

# Row 2: transitions (a<->g, c<->t) as a share of all mutations.
transitionMutations <- sum_region_counts(c("a.g", "g.a", "c.t", "t.c"))
result <- fill_result_row(result, 2, transitionMutations, VRegionMutations)

# Row 3: transversions (every other substitution) as a share of all mutations.
transversionMutations <- sum_region_counts(
  c("a.c", "c.a", "a.t", "t.a", "g.c", "c.g", "g.t", "t.g")
)
result <- fill_result_row(result, 3, transversionMutations, VRegionMutations)

# Row 4: transitions starting from g or c, as a share of all substitutions
# starting from g or c.
transitionMutationsAtGC <- sum_region_counts(c("g.a", "c.t"))
totalMutationsAtGC <- sum_region_counts(
  c("g.a", "c.t", "c.a", "g.c", "c.g", "g.t")
)
result <- fill_result_row(result, 4, transitionMutationsAtGC, totalMutationsAtGC)

# Row 5: substitutions starting from g or c, as a share of all mutations.
result <- fill_result_row(result, 5, totalMutationsAtGC, VRegionMutations)
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
258
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
259
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
260 #transitiontable
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
261
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
# Substitution matrix: rows are the original base, columns the base it was
# replaced by. Each cell is the total count over all sequences and all
# V-region segments; the diagonal stays NA because a base cannot mutate into
# itself.
nts <- c("a", "c", "g", "t")
segment_names <- c("FR1", "CDR1", "FR2", "CDR2", "FR3")
substitution_counts <- matrix(
  NA_real_,
  nrow = length(nts),
  ncol = length(nts),
  dimnames = list(toupper(nts), toupper(nts))
)

for (from_nt in nts) {
  for (to_nt in setdiff(nts, from_nt)) {
    # One column per segment, e.g. "FR1.IMGT.a.c", "CDR1.IMGT.a.c", ...
    cols <- paste0(segment_names, ".IMGT.", from_nt, ".", to_nt)
    substitution_counts[toupper(from_nt), toupper(to_nt)] <- sum(Reduce(`+`, dat[cols]))
  }
}

transitionTable <- as.data.frame(substitution_counts)
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
290
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
# Write the three result files into the output directory. The working
# directory was already set to outputdir at the start of the script; calling
# setwd(outputdir) a second time would fail for a relative outputdir, because
# the path would then be looked up inside itself.

# Summary statistics: row label, numerator, denominator, percentage (no header).
write.table(x = result, file = "mutations.txt", sep = ",", quote = FALSE, row.names = TRUE, col.names = FALSE)

# Substitution matrix with a header row (blank corner cell) and row labels.
write.table(x = transitionTable, file = "transitions.txt", sep = ",", quote = FALSE, row.names = TRUE, col.names = NA)

# Number of sequences that went into the analysis.
cat(length(dat$Sequence.ID), file = "n.txt")
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
295
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
296
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
297
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
298
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
299
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
300
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
301
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
302
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
303
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
304
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
305
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
306
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
307
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
308
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
309
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
310
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
311
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
312
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
313
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
314
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
315
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
316
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
317
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
318
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
319
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
320
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
321
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
322
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
323
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
324
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
325
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
326
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
327
74d2bc479bee Uploaded
davidvanzessen
parents:
diff changeset
328