blob: d1f9738ae6ee7a51d71eb928267b9f95f64383eb [file] [log] [blame]
filename = "imaginary.data"
data = read.table(file = filename, header = T, sep = ",")
length(data[is.na(data$seq), ])
pairs = data.frame(unique(data[c("ta", "ra")]))
pairs$num = c(1:length(pairs))
data$pair_num = NA
# I hate this workaround but the proper way doesn't work: should be
# data[data$ta == as.character(pairs$ta) & data$ra == as.character(pairs$ra),"pair_num"] = pairs$num
# but complains about the length. I don't know how to make R happy here.
ordinal = 1;
for (pair in pairs) {
data[ data$ta == as.character(pair[1])
& data$ra == as.character(pair[2])
,"pair_num"] = ordinal;
ordinal = ordinal + 1;
}
write.table(
data,
file=paste(filename, ".prepared", sep=""),
sep=",",
quote=F,
na="",
row.names=F);