comparison extract_duplicates.r @ 1:a3c4e3e62e10 draft

Uploaded
author davidvanzessen
date Tue, 01 Sep 2015 07:49:47 -0400
parents 02cf2dd19564
children 1f1640608245
comparison
Legend: equal | deleted | inserted | replaced
Left column: revision 0:02cf2dd19564 | Right column: revision 1:a3c4e3e62e10
3 input=args[1] 3 input=args[1]
4 column=as.numeric(args[2]) 4 column=as.numeric(args[2])
5 header=(args[3] == "yes") 5 header=(args[3] == "yes")
6 out_file=args[4] 6 out_file=args[4]
7 7
8 dat = read.table(input, header=header, sep="\t", fill=T, stringsAsFactors=F) 8 dat = read.table(input, header=header, sep="\t", fill=T, stringsAsFactors=F, quote="")
9 9
10 duplicates = dat[duplicated(dat[,column]),column] 10 duplicates = dat[duplicated(dat[,column]),column]
11 11
12 dat = dat[dat[,column] %in% duplicates,] 12 dat = dat[dat[,column] %in% duplicates,]
13 13