Basic script for assessing simulation sensitivity and specificity

git-svn-id: file:///humgen/gsa-scr1/gsa-engineering/svn_contents/trunk@4638 348d0f76-0448-11de-a6fe-93d51630548a
This commit is contained in:
depristo 2010-11-08 21:02:10 +00:00
parent 4759fdd2ac
commit 3c08a1c061
1 changed files with 41 additions and 0 deletions

View File

@ -0,0 +1,41 @@
#d <- read.table("sim_calls.table", header=T)
d$sim.VAR <- d$sim.AC > 0
d$called.VAR <- d$called.AC > 0
QS = unique(d$sim.Q)
MODES = unique(d$sim.MODE)
NS = unique(d$called.AN / 2)
DEPTHS = unique(d$sim.DP)
results <- expand.grid(Q = QS, mode = MODES, nSamples = NS, depth = DEPTHS)
results$sensitivity = 0
results$specificity = 0
determineRates <- function(raw, Q, mode, depth) {
sub <- subset(raw, sim.Q == Q & sim.MODE == mode & sim.DP == depth)
ct <- table(sub$called.VAR, sub$sim.VAR, dnn = c("called.VAR", "sim.VAR"))
sensitivity = ct[2,2] / sum(ct[,2])
specificity = ct[1,1] / sum(ct[,1])
list(sensitivity = sensitivity, specificity = specificity, ct = ct)
}
for ( i in 1:(dim(results)[1]) ) {
r <- results[i,]
x <- determineRates(d, r$Q, r$mode, r$depth)
results[i,]$sensitivity = x$sensitivity
results[i,]$specificity = x$specificity
}
for ( depth in DEPTHS )
boxplot(called.AC ~ sim.AC, data = subset(d, called.DP == depth * NS), main = paste("Depth of coverage ", depth), xlab = "Simulation AC", ylab = "Called AC")
print(results)
par(mfcol=c(2,1))
for ( Qt in QS ) {
x <- subset(results, Q == Qt)
print(x)
plot(x$depth, x$sensitivity, type="b")
plot(x$depth, x$specificity, type="b")
}