# Restrict every tab-separated .txt table in a directory to the sequences
# listed in a merged results file, rewriting each table in place.
#
# Positional command-line arguments:
#   1. imgt.dir    - directory holding the .txt tables to filter
#   2. merged.file - tab-separated file with `Sequence.ID` and `best_match`
#                    columns
#   3. gene        - regular expression matched against `best_match`;
#                    pass "-" to skip the gene filter
args <- commandArgs(trailingOnly = TRUE)

# Fail early with a readable message instead of an obscure error further down.
if (length(args) < 3) {
  stop("expected 3 arguments: <imgt.dir> <merged.file> <gene>", call. = FALSE)
}

imgt.dir <- args[1]
merged.file <- args[2]
gene <- args[3]

merged <- read.table(merged.file, header = TRUE, sep = "\t", fill = TRUE,
                     stringsAsFactors = FALSE)

# Progress/debug output: the first few best-match values that were read.
print(head(merged$best_match))

# "-" is the sentinel for "no gene filter"; any other value is used as a
# regular expression against best_match.
if (gene != "-") {
  merged <- merged[grepl(gene, merged$best_match), ]
}

# Drop rows whose best match contains "unmatched".
merged <- merged[!grepl("unmatched", merged$best_match), ]

# list.files() takes a regular expression, not a glob, so the dot is escaped
# to match a literal ".txt" extension.
for (f in list.files(imgt.dir, pattern = "\\.txt$")) {
  print(paste("filtering", f))

  # file.path() inserts the separator, so imgt.dir does not need a trailing
  # slash.
  path <- file.path(imgt.dir, f)
  dat <- read.table(path, header = TRUE, sep = "\t", fill = TRUE, quote = "",
                    stringsAsFactors = FALSE)

  # Keep only the sequences that survived the filtering of the merged table;
  # drop = FALSE keeps a data frame even when the table has a single column.
  dat <- dat[dat$Sequence.ID %in% merged$Sequence.ID, , drop = FALSE]

  # Blank the FR1.IMGT column when present. Skipped for empty tables, where
  # assigning a scalar to a zero-row data frame column would raise an error.
  if (nrow(dat) > 0 && "FR1.IMGT" %in% colnames(dat)) {
    dat$FR1.IMGT <- ""
  }

  # Overwrite the input file with the filtered table.
  write.table(dat, path, quote = FALSE, sep = "\t", row.names = FALSE,
              col.names = TRUE)
}